diff --git "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" --- "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" +++ "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 6.1467, "train/learning_rate": 2.9295774647887323e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 8792, "_timestamp": 1648150136, "_step": 1500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 12.0, 5.0, 14.0, 11.0, 15.0, 19.0, 21.0, 35.0, 31.0, 30.0, 31.0, 34.0, 44.0, 50.0, 46.0, 50.0, 59.0, 52.0, 44.0, 49.0, 53.0, 34.0, 43.0, 26.0, 34.0, 30.0, 22.0, 28.0, 12.0, 11.0, 18.0, 10.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-76.76399993896484, -74.40105438232422, -72.0381088256836, -69.6751708984375, -67.31222534179688, -64.94927978515625, -62.586334228515625, -60.223392486572266, -57.860450744628906, -55.49750518798828, -53.13456344604492, -50.7716178894043, -48.40867614746094, -46.04573059082031, -43.68278503417969, -41.31984329223633, -38.9568977355957, -36.59395217895508, -34.23101043701172, -31.868064880371094, -29.505123138427734, -27.14217758178711, -24.779233932495117, -22.416290283203125, -20.053346633911133, -17.69040298461914, -15.327459335327148, -12.96451473236084, -10.601571083068848, -8.238627433776855, -5.875682830810547, -3.5127391815185547, -1.1497955322265625, 1.2131483554840088, 3.57609224319458, 5.9390363693237305, 8.301980018615723, 10.664923667907715, 13.027868270874023, 15.390811920166016, 17.753755569458008, 20.11669921875, 22.479642868041992, 24.842586517333984, 27.20553207397461, 29.56847381591797, 31.931419372558594, 34.29436492919922, 36.65730667114258, 39.0202522277832, 41.38319396972656, 43.74613952636719, 46.10908126831055, 48.47202682495117, 50.83496856689453, 53.197914123535156, 55.56085968017578, 57.923805236816406, 60.286746978759766, 62.64969253540039, 65.01263427734375, 67.37557983398438, 69.738525390625, 72.10147094726562, 74.46440887451172]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 10.0, 7.0, 11.0, 15.0, 12.0, 12.0, 13.0, 21.0, 23.0, 43.0, 36.0, 23.0, 29.0, 41.0, 44.0, 32.0, 35.0, 35.0, 43.0, 44.0, 40.0, 45.0, 33.0, 41.0, 45.0, 39.0, 39.0, 37.0, 32.0, 16.0, 20.0, 18.0, 11.0, 10.0, 11.0, 7.0, 4.0, 6.0, 5.0, 7.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.36962890625, -73.99669647216797, -71.62376403808594, -69.25082397460938, -66.87789154052734, -64.50495910644531, -62.132022857666016, -59.75908660888672, -57.38615417480469, -55.013221740722656, -52.64028549194336, -50.26734924316406, -47.89441680908203, -45.521484375, -43.1485481262207, -40.775611877441406, -38.402679443359375, -36.029747009277344, -33.65681076049805, -31.283876419067383, -28.91094207763672, -26.538007736206055, -24.16507339477539, -21.792139053344727, -19.419204711914062, -17.0462703704834, -14.673336029052734, -12.30040168762207, -9.927467346191406, -7.554533004760742, -5.181598663330078, -2.808664321899414, -0.43572235107421875, 1.9372119903564453, 4.310146331787109, 6.683080673217773, 9.056015014648438, 11.428949356079102, 13.801883697509766, 16.17481803894043, 18.547752380371094, 20.920686721801758, 23.293621063232422, 25.666555404663086, 28.03948974609375, 30.412424087524414, 32.78535842895508, 35.158294677734375, 37.531227111816406, 39.90415954589844, 42.277095794677734, 44.65003204345703, 47.02296447753906, 49.395896911621094, 51.76883316040039, 54.14176940917969, 56.51470184326172, 58.88763427734375, 61.26057052612305, 63.633506774902344, 66.00643920898438, 68.3793716430664, 70.75230407714844, 73.125244140625, 75.49817657470703]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 6.0, 9.0, 14.0, 27.0, 35.0, 46.0, 82.0, 127.0, 171.0, 257.0, 425.0, 728.0, 1040.0, 1733.0, 2959.0, 5107.0, 8602.0, 15147.0, 26827.0, 49759.0, 98897.0, 213474.0, 466717.0, 845852.0, 1003888.0, 738701.0, 371978.0, 166536.0, 80016.0, 41160.0, 22709.0, 12576.0, 7309.0, 4294.0, 2614.0, 1636.0, 994.0, 615.0, 448.0, 262.0, 190.0, 104.0, 79.0, 51.0, 33.0, 20.0, 10.0, 6.0, 2.0, 9.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-58.78125, -56.96435546875, -55.1474609375, -53.33056640625, -51.513671875, -49.69677734375, -47.8798828125, -46.06298828125, -44.24609375, -42.42919921875, -40.6123046875, -38.79541015625, -36.978515625, -35.16162109375, -33.3447265625, -31.52783203125, -29.7109375, -27.89404296875, -26.0771484375, -24.26025390625, -22.443359375, -20.62646484375, -18.8095703125, -16.99267578125, -15.17578125, -13.35888671875, -11.5419921875, -9.72509765625, -7.908203125, -6.09130859375, -4.2744140625, -2.45751953125, -0.640625, 1.17626953125, 2.9931640625, 4.81005859375, 6.626953125, 8.44384765625, 10.2607421875, 12.07763671875, 13.89453125, 15.71142578125, 17.5283203125, 19.34521484375, 21.162109375, 22.97900390625, 24.7958984375, 26.61279296875, 28.4296875, 30.24658203125, 32.0634765625, 33.88037109375, 35.697265625, 37.51416015625, 39.3310546875, 41.14794921875, 42.96484375, 44.78173828125, 46.5986328125, 48.41552734375, 50.232421875, 52.04931640625, 53.8662109375, 55.68310546875, 57.5]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 4.0, 8.0, 9.0, 11.0, 21.0, 15.0, 16.0, 30.0, 26.0, 27.0, 40.0, 31.0, 36.0, 34.0, 25.0, 45.0, 38.0, 34.0, 47.0, 34.0, 34.0, 38.0, 36.0, 41.0, 42.0, 44.0, 29.0, 30.0, 21.0, 30.0, 13.0, 20.0, 17.0, 12.0, 12.0, 9.0, 8.0, 3.0, 6.0, 3.0, 1.0, 6.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-51.1875, -49.6796875, -48.171875, -46.6640625, -45.15625, -43.6484375, -42.140625, -40.6328125, -39.125, -37.6171875, -36.109375, -34.6015625, -33.09375, -31.5859375, -30.078125, -28.5703125, -27.0625, -25.5546875, -24.046875, -22.5390625, -21.03125, -19.5234375, -18.015625, -16.5078125, -15.0, -13.4921875, -11.984375, -10.4765625, -8.96875, -7.4609375, -5.953125, -4.4453125, -2.9375, -1.4296875, 0.078125, 1.5859375, 3.09375, 4.6015625, 6.109375, 7.6171875, 9.125, 10.6328125, 12.140625, 13.6484375, 15.15625, 16.6640625, 18.171875, 19.6796875, 21.1875, 22.6953125, 24.203125, 25.7109375, 27.21875, 28.7265625, 30.234375, 31.7421875, 33.25, 34.7578125, 36.265625, 37.7734375, 39.28125, 40.7890625, 42.296875, 43.8046875, 45.3125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 5.0, 2.0, 18.0, 19.0, 28.0, 39.0, 76.0, 126.0, 218.0, 302.0, 441.0, 721.0, 1171.0, 1840.0, 2899.0, 4451.0, 6985.0, 10857.0, 16873.0, 25684.0, 40440.0, 62593.0, 96444.0, 149259.0, 230161.0, 350462.0, 523388.0, 694209.0, 648769.0, 458932.0, 303585.0, 198958.0, 129110.0, 84110.0, 53490.0, 35039.0, 22238.0, 14390.0, 9427.0, 5936.0, 3773.0, 2490.0, 1639.0, 998.0, 636.0, 375.0, 253.0, 169.0, 112.0, 58.0, 34.0, 26.0, 14.0, 9.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.0654296875, -37.755859375, -36.4462890625, -35.13671875, -33.8271484375, -32.517578125, -31.2080078125, -29.8984375, -28.5888671875, -27.279296875, -25.9697265625, -24.66015625, -23.3505859375, -22.041015625, -20.7314453125, -19.421875, -18.1123046875, -16.802734375, -15.4931640625, -14.18359375, -12.8740234375, -11.564453125, -10.2548828125, -8.9453125, -7.6357421875, -6.326171875, -5.0166015625, -3.70703125, -2.3974609375, -1.087890625, 0.2216796875, 1.53125, 2.8408203125, 4.150390625, 5.4599609375, 6.76953125, 8.0791015625, 9.388671875, 10.6982421875, 12.0078125, 13.3173828125, 14.626953125, 15.9365234375, 17.24609375, 18.5556640625, 19.865234375, 21.1748046875, 22.484375, 23.7939453125, 25.103515625, 26.4130859375, 27.72265625, 29.0322265625, 30.341796875, 31.6513671875, 32.9609375, 34.2705078125, 35.580078125, 36.8896484375, 38.19921875, 39.5087890625, 40.818359375, 42.1279296875, 43.4375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 6.0, 7.0, 11.0, 16.0, 11.0, 13.0, 20.0, 32.0, 32.0, 45.0, 49.0, 64.0, 79.0, 108.0, 105.0, 135.0, 154.0, 189.0, 252.0, 291.0, 334.0, 311.0, 337.0, 302.0, 217.0, 181.0, 171.0, 129.0, 111.0, 81.0, 49.0, 60.0, 43.0, 33.0, 25.0, 18.0, 19.0, 4.0, 8.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -20.9765625, -20.265625, -19.5546875, -18.84375, -18.1328125, -17.421875, -16.7109375, -16.0, -15.2890625, -14.578125, -13.8671875, -13.15625, -12.4453125, -11.734375, -11.0234375, -10.3125, -9.6015625, -8.890625, -8.1796875, -7.46875, -6.7578125, -6.046875, -5.3359375, -4.625, -3.9140625, -3.203125, -2.4921875, -1.78125, -1.0703125, -0.359375, 0.3515625, 1.0625, 1.7734375, 2.484375, 3.1953125, 3.90625, 4.6171875, 5.328125, 6.0390625, 6.75, 7.4609375, 8.171875, 8.8828125, 9.59375, 10.3046875, 11.015625, 11.7265625, 12.4375, 13.1484375, 13.859375, 14.5703125, 15.28125, 15.9921875, 16.703125, 17.4140625, 18.125, 18.8359375, 19.546875, 20.2578125, 20.96875, 21.6796875, 22.390625, 23.1015625, 23.8125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [6.0, 2.0, 1.0, 3.0, 8.0, 1.0, 2.0, 8.0, 9.0, 6.0, 12.0, 5.0, 11.0, 14.0, 15.0, 23.0, 27.0, 19.0, 33.0, 32.0, 38.0, 28.0, 48.0, 34.0, 50.0, 42.0, 41.0, 45.0, 23.0, 44.0, 47.0, 34.0, 37.0, 41.0, 35.0, 31.0, 22.0, 26.0, 17.0, 16.0, 9.0, 16.0, 8.0, 7.0, 12.0, 5.0, 4.0, 4.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.57273864746094, -36.1736946105957, -34.77465057373047, -33.37560272216797, -31.976558685302734, -30.5775146484375, -29.178468704223633, -27.779422760009766, -26.38037872314453, -24.981334686279297, -23.58228874206543, -22.183242797851562, -20.784198760986328, -19.385154724121094, -17.986108779907227, -16.58706283569336, -15.188018798828125, -13.788973808288574, -12.389928817749023, -10.990883827209473, -9.591838836669922, -8.192793846130371, -6.79374885559082, -5.3947038650512695, -3.9956588745117188, -2.596613883972168, -1.1975688934326172, 0.2014760971069336, 1.6005210876464844, 2.999566078186035, 4.398611068725586, 5.797656059265137, 7.1967010498046875, 8.595746040344238, 9.994791030883789, 11.39383602142334, 12.79288101196289, 14.191926002502441, 15.590970993041992, 16.99001693725586, 18.389060974121094, 19.788105010986328, 21.187150955200195, 22.586196899414062, 23.985240936279297, 25.38428497314453, 26.7833309173584, 28.182376861572266, 29.5814208984375, 30.980464935302734, 32.37950897216797, 33.77855682373047, 35.1776008605957, 36.57664489746094, 37.97569274902344, 39.37473678588867, 40.773780822753906, 42.17282485961914, 43.571868896484375, 44.970916748046875, 46.36996078491211, 47.769004821777344, 49.168052673339844, 50.56709671020508, 51.96614074707031]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 14.0, 12.0, 22.0, 15.0, 13.0, 22.0, 25.0, 25.0, 36.0, 39.0, 31.0, 43.0, 30.0, 44.0, 36.0, 48.0, 45.0, 41.0, 40.0, 46.0, 45.0, 34.0, 36.0, 27.0, 34.0, 21.0, 38.0, 31.0, 18.0, 15.0, 12.0, 15.0, 13.0, 5.0, 10.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.23810958862305, -50.60106658935547, -48.964027404785156, -47.326988220214844, -45.689945220947266, -44.05290222167969, -42.415863037109375, -40.77882385253906, -39.141780853271484, -37.504737854003906, -35.867698669433594, -34.23065948486328, -32.5936164855957, -30.956575393676758, -29.319534301757812, -27.682493209838867, -26.045452117919922, -24.408411026000977, -22.77136993408203, -21.134328842163086, -19.49728775024414, -17.860246658325195, -16.22320556640625, -14.586164474487305, -12.94912338256836, -11.312082290649414, -9.675041198730469, -8.038000106811523, -6.400959014892578, -4.763917922973633, -3.1268768310546875, -1.4898357391357422, 0.14720916748046875, 1.784250259399414, 3.4212913513183594, 5.058332443237305, 6.69537353515625, 8.332414627075195, 9.96945571899414, 11.606496810913086, 13.243537902832031, 14.880578994750977, 16.517620086669922, 18.154661178588867, 19.791702270507812, 21.428743362426758, 23.065784454345703, 24.70282554626465, 26.339866638183594, 27.97690773010254, 29.613948822021484, 31.25098991394043, 32.888031005859375, 34.52507019042969, 36.162113189697266, 37.799156188964844, 39.436195373535156, 41.07323455810547, 42.71027755737305, 44.347320556640625, 45.98435974121094, 47.62139892578125, 49.25844192504883, 50.895484924316406, 52.53252410888672]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 8.0, 10.0, 14.0, 24.0, 22.0, 52.0, 61.0, 72.0, 134.0, 163.0, 217.0, 310.0, 465.0, 673.0, 921.0, 1326.0, 1938.0, 2735.0, 4152.0, 6321.0, 9412.0, 14956.0, 23222.0, 37404.0, 61517.0, 104184.0, 171522.0, 217572.0, 151798.0, 90522.0, 54027.0, 32978.0, 20683.0, 13218.0, 8351.0, 5557.0, 3764.0, 2514.0, 1701.0, 1203.0, 829.0, 591.0, 420.0, 284.0, 205.0, 152.0, 107.0, 62.0, 57.0, 52.0, 22.0, 20.0, 16.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.2421875, -13.773193359375, -13.30419921875, -12.835205078125, -12.3662109375, -11.897216796875, -11.42822265625, -10.959228515625, -10.490234375, -10.021240234375, -9.55224609375, -9.083251953125, -8.6142578125, -8.145263671875, -7.67626953125, -7.207275390625, -6.73828125, -6.269287109375, -5.80029296875, -5.331298828125, -4.8623046875, -4.393310546875, -3.92431640625, -3.455322265625, -2.986328125, -2.517333984375, -2.04833984375, -1.579345703125, -1.1103515625, -0.641357421875, -0.17236328125, 0.296630859375, 0.765625, 1.234619140625, 1.70361328125, 2.172607421875, 2.6416015625, 3.110595703125, 3.57958984375, 4.048583984375, 4.517578125, 4.986572265625, 5.45556640625, 5.924560546875, 6.3935546875, 6.862548828125, 7.33154296875, 7.800537109375, 8.26953125, 8.738525390625, 9.20751953125, 9.676513671875, 10.1455078125, 10.614501953125, 11.08349609375, 11.552490234375, 12.021484375, 12.490478515625, 12.95947265625, 13.428466796875, 13.8974609375, 14.366455078125, 14.83544921875, 15.304443359375, 15.7734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 4.0, 10.0, 11.0, 15.0, 10.0, 17.0, 20.0, 18.0, 31.0, 34.0, 29.0, 32.0, 46.0, 33.0, 39.0, 31.0, 53.0, 36.0, 38.0, 42.0, 52.0, 53.0, 38.0, 38.0, 35.0, 37.0, 24.0, 34.0, 22.0, 27.0, 23.0, 15.0, 12.0, 18.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.75, -49.13232421875, -47.5146484375, -45.89697265625, -44.279296875, -42.66162109375, -41.0439453125, -39.42626953125, -37.80859375, -36.19091796875, -34.5732421875, -32.95556640625, -31.337890625, -29.72021484375, -28.1025390625, -26.48486328125, -24.8671875, -23.24951171875, -21.6318359375, -20.01416015625, -18.396484375, -16.77880859375, -15.1611328125, -13.54345703125, -11.92578125, -10.30810546875, -8.6904296875, -7.07275390625, -5.455078125, -3.83740234375, -2.2197265625, -0.60205078125, 1.015625, 2.63330078125, 4.2509765625, 5.86865234375, 7.486328125, 9.10400390625, 10.7216796875, 12.33935546875, 13.95703125, 15.57470703125, 17.1923828125, 18.81005859375, 20.427734375, 22.04541015625, 23.6630859375, 25.28076171875, 26.8984375, 28.51611328125, 30.1337890625, 31.75146484375, 33.369140625, 34.98681640625, 36.6044921875, 38.22216796875, 39.83984375, 41.45751953125, 43.0751953125, 44.69287109375, 46.310546875, 47.92822265625, 49.5458984375, 51.16357421875, 52.78125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 7.0, 11.0, 20.0, 17.0, 30.0, 33.0, 50.0, 61.0, 90.0, 131.0, 154.0, 228.0, 305.0, 413.0, 561.0, 712.0, 1045.0, 1466.0, 2129.0, 3173.0, 4653.0, 7034.0, 10973.0, 17562.0, 29559.0, 51494.0, 95468.0, 174625.0, 249152.0, 173201.0, 93555.0, 51044.0, 29480.0, 17488.0, 10599.0, 6943.0, 4602.0, 3084.0, 2083.0, 1518.0, 1029.0, 726.0, 533.0, 397.0, 290.0, 226.0, 168.0, 110.0, 110.0, 74.0, 46.0, 26.0, 28.0, 24.0, 12.0, 5.0, 6.0, 1.0, 4.0, 1.0], "bins": [-9.34375, -9.05615234375, -8.7685546875, -8.48095703125, -8.193359375, -7.90576171875, -7.6181640625, -7.33056640625, -7.04296875, -6.75537109375, -6.4677734375, -6.18017578125, -5.892578125, -5.60498046875, -5.3173828125, -5.02978515625, -4.7421875, -4.45458984375, -4.1669921875, -3.87939453125, -3.591796875, -3.30419921875, -3.0166015625, -2.72900390625, -2.44140625, -2.15380859375, -1.8662109375, -1.57861328125, -1.291015625, -1.00341796875, -0.7158203125, -0.42822265625, -0.140625, 0.14697265625, 0.4345703125, 0.72216796875, 1.009765625, 1.29736328125, 1.5849609375, 1.87255859375, 2.16015625, 2.44775390625, 2.7353515625, 3.02294921875, 3.310546875, 3.59814453125, 3.8857421875, 4.17333984375, 4.4609375, 4.74853515625, 5.0361328125, 5.32373046875, 5.611328125, 5.89892578125, 6.1865234375, 6.47412109375, 6.76171875, 7.04931640625, 7.3369140625, 7.62451171875, 7.912109375, 8.19970703125, 8.4873046875, 8.77490234375, 9.0625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 2.0, 7.0, 10.0, 12.0, 14.0, 13.0, 28.0, 28.0, 23.0, 24.0, 31.0, 30.0, 29.0, 31.0, 37.0, 33.0, 29.0, 39.0, 30.0, 44.0, 50.0, 39.0, 52.0, 38.0, 32.0, 26.0, 34.0, 35.0, 28.0, 24.0, 28.0, 22.0, 11.0, 13.0, 12.0, 12.0, 5.0, 10.0, 3.0, 0.0, 7.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-32.78125, -31.740234375, -30.69921875, -29.658203125, -28.6171875, -27.576171875, -26.53515625, -25.494140625, -24.453125, -23.412109375, -22.37109375, -21.330078125, -20.2890625, -19.248046875, -18.20703125, -17.166015625, -16.125, -15.083984375, -14.04296875, -13.001953125, -11.9609375, -10.919921875, -9.87890625, -8.837890625, -7.796875, -6.755859375, -5.71484375, -4.673828125, -3.6328125, -2.591796875, -1.55078125, -0.509765625, 0.53125, 1.572265625, 2.61328125, 3.654296875, 4.6953125, 5.736328125, 6.77734375, 7.818359375, 8.859375, 9.900390625, 10.94140625, 11.982421875, 13.0234375, 14.064453125, 15.10546875, 16.146484375, 17.1875, 18.228515625, 19.26953125, 20.310546875, 21.3515625, 22.392578125, 23.43359375, 24.474609375, 25.515625, 26.556640625, 27.59765625, 28.638671875, 29.6796875, 30.720703125, 31.76171875, 32.802734375, 33.84375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 16.0, 14.0, 12.0, 26.0, 43.0, 59.0, 70.0, 91.0, 125.0, 163.0, 239.0, 291.0, 388.0, 474.0, 609.0, 735.0, 1003.0, 1468.0, 2039.0, 3189.0, 5626.0, 12499.0, 34069.0, 119452.0, 485091.0, 270299.0, 67033.0, 21133.0, 8524.0, 4172.0, 2546.0, 1763.0, 1282.0, 962.0, 740.0, 561.0, 418.0, 296.0, 243.0, 162.0, 150.0, 122.0, 91.0, 86.0, 56.0, 46.0, 24.0, 13.0, 16.0, 9.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.314453125, -2.2392578125, -2.1640625, -2.0888671875, -2.013671875, -1.9384765625, -1.86328125, -1.7880859375, -1.712890625, -1.6376953125, -1.5625, -1.4873046875, -1.412109375, -1.3369140625, -1.26171875, -1.1865234375, -1.111328125, -1.0361328125, -0.9609375, -0.8857421875, -0.810546875, -0.7353515625, -0.66015625, -0.5849609375, -0.509765625, -0.4345703125, -0.359375, -0.2841796875, -0.208984375, -0.1337890625, -0.05859375, 0.0166015625, 0.091796875, 0.1669921875, 0.2421875, 0.3173828125, 0.392578125, 0.4677734375, 0.54296875, 0.6181640625, 0.693359375, 0.7685546875, 0.84375, 0.9189453125, 0.994140625, 1.0693359375, 1.14453125, 1.2197265625, 1.294921875, 1.3701171875, 1.4453125, 1.5205078125, 1.595703125, 1.6708984375, 1.74609375, 1.8212890625, 1.896484375, 1.9716796875, 2.046875, 2.1220703125, 2.197265625, 2.2724609375, 2.34765625, 2.4228515625, 2.498046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 7.0, 12.0, 14.0, 7.0, 25.0, 18.0, 39.0, 52.0, 72.0, 91.0, 109.0, 98.0, 91.0, 66.0, 67.0, 45.0, 31.0, 20.0, 21.0, 7.0, 13.0, 10.0, 13.0, 7.0, 4.0, 9.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003771781921386719, -0.0003664456307888031, -0.0003557130694389343, -0.00034498050808906555, -0.0003342479467391968, -0.000323515385389328, -0.00031278282403945923, -0.00030205026268959045, -0.0002913177013397217, -0.0002805851399898529, -0.00026985257863998413, -0.00025912001729011536, -0.0002483874559402466, -0.0002376548945903778, -0.00022692233324050903, -0.00021618977189064026, -0.00020545721054077148, -0.0001947246491909027, -0.00018399208784103394, -0.00017325952649116516, -0.0001625269651412964, -0.0001517944037914276, -0.00014106184244155884, -0.00013032928109169006, -0.00011959671974182129, -0.00010886415839195251, -9.813159704208374e-05, -8.739903569221497e-05, -7.666647434234619e-05, -6.593391299247742e-05, -5.520135164260864e-05, -4.446879029273987e-05, -3.3736228942871094e-05, -2.300366759300232e-05, -1.2271106243133545e-05, -1.5385448932647705e-06, 9.194016456604004e-06, 1.992657780647278e-05, 3.065913915634155e-05, 4.139170050621033e-05, 5.21242618560791e-05, 6.285682320594788e-05, 7.358938455581665e-05, 8.432194590568542e-05, 9.50545072555542e-05, 0.00010578706860542297, 0.00011651962995529175, 0.00012725219130516052, 0.0001379847526550293, 0.00014871731400489807, 0.00015944987535476685, 0.00017018243670463562, 0.0001809149980545044, 0.00019164755940437317, 0.00020238012075424194, 0.00021311268210411072, 0.0002238452434539795, 0.00023457780480384827, 0.00024531036615371704, 0.0002560429275035858, 0.0002667754888534546, 0.00027750805020332336, 0.00028824061155319214, 0.0002989731729030609, 0.0003097057342529297]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 4.0, 7.0, 18.0, 11.0, 21.0, 34.0, 49.0, 71.0, 73.0, 114.0, 155.0, 210.0, 312.0, 391.0, 613.0, 892.0, 1284.0, 1834.0, 2899.0, 4784.0, 7962.0, 14832.0, 27926.0, 52817.0, 101789.0, 205569.0, 302036.0, 152431.0, 77731.0, 40768.0, 21520.0, 11644.0, 6433.0, 3860.0, 2346.0, 1511.0, 986.0, 764.0, 497.0, 344.0, 283.0, 204.0, 144.0, 87.0, 99.0, 52.0, 44.0, 25.0, 26.0, 18.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8330078125, -1.7779541015625, -1.722900390625, -1.6678466796875, -1.61279296875, -1.5577392578125, -1.502685546875, -1.4476318359375, -1.392578125, -1.3375244140625, -1.282470703125, -1.2274169921875, -1.17236328125, -1.1173095703125, -1.062255859375, -1.0072021484375, -0.9521484375, -0.8970947265625, -0.842041015625, -0.7869873046875, -0.73193359375, -0.6768798828125, -0.621826171875, -0.5667724609375, -0.51171875, -0.4566650390625, -0.401611328125, -0.3465576171875, -0.29150390625, -0.2364501953125, -0.181396484375, -0.1263427734375, -0.0712890625, -0.0162353515625, 0.038818359375, 0.0938720703125, 0.14892578125, 0.2039794921875, 0.259033203125, 0.3140869140625, 0.369140625, 0.4241943359375, 0.479248046875, 0.5343017578125, 0.58935546875, 0.6444091796875, 0.699462890625, 0.7545166015625, 0.8095703125, 0.8646240234375, 0.919677734375, 0.9747314453125, 1.02978515625, 1.0848388671875, 1.139892578125, 1.1949462890625, 1.25, 1.3050537109375, 1.360107421875, 1.4151611328125, 1.47021484375, 1.5252685546875, 1.580322265625, 1.6353759765625, 1.6904296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 5.0, 17.0, 12.0, 25.0, 40.0, 39.0, 64.0, 84.0, 105.0, 127.0, 125.0, 100.0, 68.0, 50.0, 31.0, 23.0, 22.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7948226928710938, -0.7698211669921875, -0.7448196411132812, -0.719818115234375, -0.6948165893554688, -0.6698150634765625, -0.6448135375976562, -0.61981201171875, -0.5948104858398438, -0.5698089599609375, -0.5448074340820312, -0.519805908203125, -0.49480438232421875, -0.4698028564453125, -0.44480133056640625, -0.4197998046875, -0.39479827880859375, -0.3697967529296875, -0.34479522705078125, -0.319793701171875, -0.29479217529296875, -0.2697906494140625, -0.24478912353515625, -0.21978759765625, -0.19478607177734375, -0.1697845458984375, -0.14478302001953125, -0.119781494140625, -0.09477996826171875, -0.0697784423828125, -0.04477691650390625, -0.019775390625, 0.00522613525390625, 0.0302276611328125, 0.05522918701171875, 0.080230712890625, 0.10523223876953125, 0.1302337646484375, 0.15523529052734375, 0.18023681640625, 0.20523834228515625, 0.2302398681640625, 0.25524139404296875, 0.280242919921875, 0.30524444580078125, 0.3302459716796875, 0.35524749755859375, 0.3802490234375, 0.40525054931640625, 0.4302520751953125, 0.45525360107421875, 0.480255126953125, 0.5052566528320312, 0.5302581787109375, 0.5552597045898438, 0.58026123046875, 0.6052627563476562, 0.6302642822265625, 0.6552658081054688, 0.680267333984375, 0.7052688598632812, 0.7302703857421875, 0.7552719116210938, 0.7802734375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 4.0, 8.0, 3.0, 5.0, 8.0, 6.0, 10.0, 9.0, 11.0, 19.0, 18.0, 17.0, 21.0, 22.0, 28.0, 37.0, 40.0, 42.0, 37.0, 43.0, 43.0, 39.0, 40.0, 41.0, 32.0, 38.0, 58.0, 33.0, 32.0, 34.0, 37.0, 34.0, 22.0, 26.0, 18.0, 9.0, 17.0, 10.0, 9.0, 8.0, 8.0, 7.0, 3.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75106430053711, -34.4222297668457, -33.0933952331543, -31.76456069946289, -30.435726165771484, -29.106891632080078, -27.77805519104004, -26.449220657348633, -25.120386123657227, -23.79155158996582, -22.462717056274414, -21.133882522583008, -19.80504608154297, -18.476211547851562, -17.147377014160156, -15.81854248046875, -14.489707946777344, -13.160873413085938, -11.832038879394531, -10.503203392028809, -9.174368858337402, -7.845534324645996, -6.516699314117432, -5.187864303588867, -3.859029769897461, -2.5301949977874756, -1.2013602256774902, 0.12747454643249512, 1.4563093185424805, 2.7851438522338867, 4.113978862762451, 5.442813873291016, 6.771648406982422, 8.100482940673828, 9.429317474365234, 10.758152961730957, 12.086987495422363, 13.41582202911377, 14.744657516479492, 16.0734920501709, 17.402326583862305, 18.73116111755371, 20.059995651245117, 21.388830184936523, 22.717666625976562, 24.04650115966797, 25.375335693359375, 26.70417022705078, 28.033004760742188, 29.361839294433594, 30.690673828125, 32.019508361816406, 33.34834289550781, 34.67717742919922, 36.006011962890625, 37.33484649658203, 38.66368103027344, 39.992515563964844, 41.32135009765625, 42.650184631347656, 43.97901916503906, 45.30785369873047, 46.636688232421875, 47.96552276611328, 49.29436111450195]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 13.0, 18.0, 17.0, 13.0, 22.0, 18.0, 24.0, 34.0, 38.0, 34.0, 33.0, 41.0, 34.0, 42.0, 38.0, 43.0, 47.0, 42.0, 50.0, 40.0, 36.0, 41.0, 26.0, 31.0, 30.0, 29.0, 40.0, 21.0, 14.0, 19.0, 13.0, 9.0, 15.0, 6.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.53192901611328, -46.9837646484375, -45.435604095458984, -43.8874397277832, -42.33927917480469, -40.791114807128906, -39.242950439453125, -37.69478988647461, -36.14662551879883, -34.59846115112305, -33.05030059814453, -31.50213623046875, -29.9539737701416, -28.405811309814453, -26.857648849487305, -25.309486389160156, -23.761323928833008, -22.21316146850586, -20.66499900817871, -19.116836547851562, -17.56867218017578, -16.020509719848633, -14.472347259521484, -12.92418384552002, -11.376021385192871, -9.827858924865723, -8.279695510864258, -6.731533050537109, -5.183370113372803, -3.635207176208496, -2.0870447158813477, -0.5388813018798828, 1.0092811584472656, 2.5574440956115723, 4.105607032775879, 5.653769493103027, 7.201932430267334, 8.75009536743164, 10.298257827758789, 11.846421241760254, 13.394583702087402, 14.94274616241455, 16.490909576416016, 18.039072036743164, 19.587234497070312, 21.135398864746094, 22.68355941772461, 24.23172378540039, 25.77988624572754, 27.328048706054688, 28.876211166381836, 30.424373626708984, 31.972537994384766, 33.52069854736328, 35.06886291503906, 36.617027282714844, 38.16518783569336, 39.71335220336914, 41.261512756347656, 42.80967712402344, 44.35783767700195, 45.906002044677734, 47.45416259765625, 49.00232696533203, 50.55049133300781]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 14.0, 19.0, 34.0, 34.0, 65.0, 88.0, 156.0, 237.0, 367.0, 694.0, 1083.0, 1770.0, 3008.0, 5093.0, 9000.0, 15690.0, 27925.0, 48449.0, 80961.0, 124227.0, 163614.0, 173269.0, 144431.0, 100625.0, 62438.0, 36619.0, 20665.0, 11604.0, 6768.0, 3864.0, 2235.0, 1359.0, 802.0, 489.0, 313.0, 203.0, 98.0, 77.0, 56.0, 34.0, 30.0, 11.0, 8.0, 6.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0], "bins": [-56.46875, -54.8662109375, -53.263671875, -51.6611328125, -50.05859375, -48.4560546875, -46.853515625, -45.2509765625, -43.6484375, -42.0458984375, -40.443359375, -38.8408203125, -37.23828125, -35.6357421875, -34.033203125, -32.4306640625, -30.828125, -29.2255859375, -27.623046875, -26.0205078125, -24.41796875, -22.8154296875, -21.212890625, -19.6103515625, -18.0078125, -16.4052734375, -14.802734375, -13.2001953125, -11.59765625, -9.9951171875, -8.392578125, -6.7900390625, -5.1875, -3.5849609375, -1.982421875, -0.3798828125, 1.22265625, 2.8251953125, 4.427734375, 6.0302734375, 7.6328125, 9.2353515625, 10.837890625, 12.4404296875, 14.04296875, 15.6455078125, 17.248046875, 18.8505859375, 20.453125, 22.0556640625, 23.658203125, 25.2607421875, 26.86328125, 28.4658203125, 30.068359375, 31.6708984375, 33.2734375, 34.8759765625, 36.478515625, 38.0810546875, 39.68359375, 41.2861328125, 42.888671875, 44.4912109375, 46.09375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 3.0, 13.0, 9.0, 15.0, 14.0, 23.0, 16.0, 26.0, 30.0, 32.0, 29.0, 40.0, 43.0, 34.0, 44.0, 32.0, 35.0, 32.0, 57.0, 31.0, 47.0, 39.0, 28.0, 44.0, 28.0, 42.0, 24.0, 25.0, 27.0, 15.0, 25.0, 19.0, 14.0, 15.0, 8.0, 6.0, 2.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-41.6875, -40.388671875, -39.08984375, -37.791015625, -36.4921875, -35.193359375, -33.89453125, -32.595703125, -31.296875, -29.998046875, -28.69921875, -27.400390625, -26.1015625, -24.802734375, -23.50390625, -22.205078125, -20.90625, -19.607421875, -18.30859375, -17.009765625, -15.7109375, -14.412109375, -13.11328125, -11.814453125, -10.515625, -9.216796875, -7.91796875, -6.619140625, -5.3203125, -4.021484375, -2.72265625, -1.423828125, -0.125, 1.173828125, 2.47265625, 3.771484375, 5.0703125, 6.369140625, 7.66796875, 8.966796875, 10.265625, 11.564453125, 12.86328125, 14.162109375, 15.4609375, 16.759765625, 18.05859375, 19.357421875, 20.65625, 21.955078125, 23.25390625, 24.552734375, 25.8515625, 27.150390625, 28.44921875, 29.748046875, 31.046875, 32.345703125, 33.64453125, 34.943359375, 36.2421875, 37.541015625, 38.83984375, 40.138671875, 41.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 12.0, 15.0, 29.0, 52.0, 61.0, 107.0, 155.0, 266.0, 324.0, 531.0, 844.0, 1243.0, 1771.0, 2653.0, 3804.0, 5529.0, 8156.0, 11468.0, 16253.0, 22623.0, 31352.0, 42234.0, 55734.0, 70818.0, 85547.0, 97684.0, 103224.0, 100233.0, 89133.0, 74539.0, 59448.0, 45309.0, 33851.0, 24842.0, 17851.0, 12555.0, 8914.0, 6168.0, 4297.0, 3019.0, 1938.0, 1332.0, 893.0, 581.0, 412.0, 267.0, 165.0, 105.0, 82.0, 40.0, 40.0, 24.0, 16.0, 8.0, 4.0, 4.0, 0.0, 1.0], "bins": [-33.96875, -32.927734375, -31.88671875, -30.845703125, -29.8046875, -28.763671875, -27.72265625, -26.681640625, -25.640625, -24.599609375, -23.55859375, -22.517578125, -21.4765625, -20.435546875, -19.39453125, -18.353515625, -17.3125, -16.271484375, -15.23046875, -14.189453125, -13.1484375, -12.107421875, -11.06640625, -10.025390625, -8.984375, -7.943359375, -6.90234375, -5.861328125, -4.8203125, -3.779296875, -2.73828125, -1.697265625, -0.65625, 0.384765625, 1.42578125, 2.466796875, 3.5078125, 4.548828125, 5.58984375, 6.630859375, 7.671875, 8.712890625, 9.75390625, 10.794921875, 11.8359375, 12.876953125, 13.91796875, 14.958984375, 16.0, 17.041015625, 18.08203125, 19.123046875, 20.1640625, 21.205078125, 22.24609375, 23.287109375, 24.328125, 25.369140625, 26.41015625, 27.451171875, 28.4921875, 29.533203125, 30.57421875, 31.615234375, 32.65625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 14.0, 14.0, 23.0, 14.0, 16.0, 16.0, 22.0, 23.0, 33.0, 27.0, 36.0, 36.0, 36.0, 33.0, 35.0, 30.0, 40.0, 50.0, 38.0, 38.0, 35.0, 31.0, 48.0, 36.0, 32.0, 24.0, 30.0, 22.0, 19.0, 30.0, 16.0, 15.0, 16.0, 9.0, 10.0, 7.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.578125, -28.71826171875, -27.8583984375, -26.99853515625, -26.138671875, -25.27880859375, -24.4189453125, -23.55908203125, -22.69921875, -21.83935546875, -20.9794921875, -20.11962890625, -19.259765625, -18.39990234375, -17.5400390625, -16.68017578125, -15.8203125, -14.96044921875, -14.1005859375, -13.24072265625, -12.380859375, -11.52099609375, -10.6611328125, -9.80126953125, -8.94140625, -8.08154296875, -7.2216796875, -6.36181640625, -5.501953125, -4.64208984375, -3.7822265625, -2.92236328125, -2.0625, -1.20263671875, -0.3427734375, 0.51708984375, 1.376953125, 2.23681640625, 3.0966796875, 3.95654296875, 4.81640625, 5.67626953125, 6.5361328125, 7.39599609375, 8.255859375, 9.11572265625, 9.9755859375, 10.83544921875, 11.6953125, 12.55517578125, 13.4150390625, 14.27490234375, 15.134765625, 15.99462890625, 16.8544921875, 17.71435546875, 18.57421875, 19.43408203125, 20.2939453125, 21.15380859375, 22.013671875, 22.87353515625, 23.7333984375, 24.59326171875, 25.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 10.0, 13.0, 17.0, 32.0, 47.0, 76.0, 82.0, 156.0, 250.0, 408.0, 610.0, 1019.0, 1644.0, 2726.0, 4698.0, 8139.0, 13733.0, 23702.0, 39669.0, 65343.0, 101249.0, 139405.0, 161635.0, 154019.0, 120027.0, 82849.0, 51580.0, 30871.0, 18477.0, 10728.0, 6053.0, 3626.0, 2219.0, 1247.0, 800.0, 474.0, 342.0, 207.0, 149.0, 83.0, 48.0, 40.0, 20.0, 11.0, 12.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.84521484375, -8.5576171875, -8.27001953125, -7.982421875, -7.69482421875, -7.4072265625, -7.11962890625, -6.83203125, -6.54443359375, -6.2568359375, -5.96923828125, -5.681640625, -5.39404296875, -5.1064453125, -4.81884765625, -4.53125, -4.24365234375, -3.9560546875, -3.66845703125, -3.380859375, -3.09326171875, -2.8056640625, -2.51806640625, -2.23046875, -1.94287109375, -1.6552734375, -1.36767578125, -1.080078125, -0.79248046875, -0.5048828125, -0.21728515625, 0.0703125, 0.35791015625, 0.6455078125, 0.93310546875, 1.220703125, 1.50830078125, 1.7958984375, 2.08349609375, 2.37109375, 2.65869140625, 2.9462890625, 3.23388671875, 3.521484375, 3.80908203125, 4.0966796875, 4.38427734375, 4.671875, 4.95947265625, 5.2470703125, 5.53466796875, 5.822265625, 6.10986328125, 6.3974609375, 6.68505859375, 6.97265625, 7.26025390625, 7.5478515625, 7.83544921875, 8.123046875, 8.41064453125, 8.6982421875, 8.98583984375, 9.2734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 5.0, 12.0, 6.0, 10.0, 22.0, 24.0, 20.0, 40.0, 29.0, 43.0, 31.0, 54.0, 63.0, 50.0, 50.0, 64.0, 69.0, 61.0, 57.0, 55.0, 36.0, 25.0, 36.0, 30.0, 19.0, 16.0, 13.0, 19.0, 12.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0010442733764648438, -0.0010155066847801208, -0.000986739993095398, -0.000957973301410675, -0.0009292066097259521, -0.0009004399180412292, -0.0008716732263565063, -0.0008429065346717834, -0.0008141398429870605, -0.0007853731513023376, -0.0007566064596176147, -0.0007278397679328918, -0.0006990730762481689, -0.000670306384563446, -0.0006415396928787231, -0.0006127730011940002, -0.0005840063095092773, -0.0005552396178245544, -0.0005264729261398315, -0.0004977062344551086, -0.00046893954277038574, -0.00044017285108566284, -0.00041140615940093994, -0.00038263946771621704, -0.00035387277603149414, -0.00032510608434677124, -0.00029633939266204834, -0.00026757270097732544, -0.00023880600929260254, -0.00021003931760787964, -0.00018127262592315674, -0.00015250593423843384, -0.00012373924255371094, -9.497255086898804e-05, -6.620585918426514e-05, -3.7439167499542236e-05, -8.672475814819336e-06, 2.0094215869903564e-05, 4.8860907554626465e-05, 7.762759923934937e-05, 0.00010639429092407227, 0.00013516098260879517, 0.00016392767429351807, 0.00019269436597824097, 0.00022146105766296387, 0.00025022774934768677, 0.00027899444103240967, 0.00030776113271713257, 0.00033652782440185547, 0.00036529451608657837, 0.00039406120777130127, 0.00042282789945602417, 0.00045159459114074707, 0.00048036128282546997, 0.0005091279745101929, 0.0005378946661949158, 0.0005666613578796387, 0.0005954280495643616, 0.0006241947412490845, 0.0006529614329338074, 0.0006817281246185303, 0.0007104948163032532, 0.0007392615079879761, 0.000768028199672699, 0.0007967948913574219]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 10.0, 5.0, 11.0, 18.0, 31.0, 44.0, 66.0, 84.0, 160.0, 230.0, 366.0, 534.0, 838.0, 1271.0, 1955.0, 2828.0, 4604.0, 6809.0, 10267.0, 15653.0, 23464.0, 35101.0, 49693.0, 69651.0, 90727.0, 111006.0, 122430.0, 119602.0, 103771.0, 83126.0, 61383.0, 43579.0, 29917.0, 20103.0, 13434.0, 8836.0, 5822.0, 3754.0, 2566.0, 1582.0, 1109.0, 721.0, 480.0, 304.0, 202.0, 147.0, 90.0, 57.0, 44.0, 24.0, 22.0, 9.0, 10.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.455322265625, -6.23876953125, -6.022216796875, -5.8056640625, -5.589111328125, -5.37255859375, -5.156005859375, -4.939453125, -4.722900390625, -4.50634765625, -4.289794921875, -4.0732421875, -3.856689453125, -3.64013671875, -3.423583984375, -3.20703125, -2.990478515625, -2.77392578125, -2.557373046875, -2.3408203125, -2.124267578125, -1.90771484375, -1.691162109375, -1.474609375, -1.258056640625, -1.04150390625, -0.824951171875, -0.6083984375, -0.391845703125, -0.17529296875, 0.041259765625, 0.2578125, 0.474365234375, 0.69091796875, 0.907470703125, 1.1240234375, 1.340576171875, 1.55712890625, 1.773681640625, 1.990234375, 2.206787109375, 2.42333984375, 2.639892578125, 2.8564453125, 3.072998046875, 3.28955078125, 3.506103515625, 3.72265625, 3.939208984375, 4.15576171875, 4.372314453125, 4.5888671875, 4.805419921875, 5.02197265625, 5.238525390625, 5.455078125, 5.671630859375, 5.88818359375, 6.104736328125, 6.3212890625, 6.537841796875, 6.75439453125, 6.970947265625, 7.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 10.0, 5.0, 6.0, 12.0, 10.0, 16.0, 16.0, 25.0, 21.0, 25.0, 26.0, 28.0, 41.0, 29.0, 56.0, 54.0, 53.0, 37.0, 33.0, 39.0, 34.0, 54.0, 44.0, 43.0, 30.0, 33.0, 31.0, 27.0, 20.0, 24.0, 16.0, 18.0, 12.0, 15.0, 9.0, 9.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.478515625, -3.377655029296875, -3.27679443359375, -3.175933837890625, -3.0750732421875, -2.974212646484375, -2.87335205078125, -2.772491455078125, -2.671630859375, -2.570770263671875, -2.46990966796875, -2.369049072265625, -2.2681884765625, -2.167327880859375, -2.06646728515625, -1.965606689453125, -1.86474609375, -1.763885498046875, -1.66302490234375, -1.562164306640625, -1.4613037109375, -1.360443115234375, -1.25958251953125, -1.158721923828125, -1.057861328125, -0.957000732421875, -0.85614013671875, -0.755279541015625, -0.6544189453125, -0.553558349609375, -0.45269775390625, -0.351837158203125, -0.2509765625, -0.150115966796875, -0.04925537109375, 0.051605224609375, 0.1524658203125, 0.253326416015625, 0.35418701171875, 0.455047607421875, 0.555908203125, 0.656768798828125, 0.75762939453125, 0.858489990234375, 0.9593505859375, 1.060211181640625, 1.16107177734375, 1.261932373046875, 1.36279296875, 1.463653564453125, 1.56451416015625, 1.665374755859375, 1.7662353515625, 1.867095947265625, 1.96795654296875, 2.068817138671875, 2.169677734375, 2.270538330078125, 2.37139892578125, 2.472259521484375, 2.5731201171875, 2.673980712890625, 2.77484130859375, 2.875701904296875, 2.9765625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 10.0, 7.0, 7.0, 10.0, 10.0, 14.0, 18.0, 18.0, 20.0, 38.0, 33.0, 43.0, 40.0, 43.0, 42.0, 44.0, 51.0, 45.0, 42.0, 38.0, 46.0, 47.0, 51.0, 38.0, 52.0, 21.0, 28.0, 17.0, 25.0, 17.0, 17.0, 11.0, 8.0, 12.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.775482177734375, -34.43992233276367, -33.10436248779297, -31.7688045501709, -30.433244705200195, -29.097684860229492, -27.762126922607422, -26.42656707763672, -25.091007232666016, -23.755447387695312, -22.41988754272461, -21.08432960510254, -19.748769760131836, -18.413209915161133, -17.077651977539062, -15.74209213256836, -14.406532287597656, -13.070972442626953, -11.735413551330566, -10.39985466003418, -9.064294815063477, -7.728735446929932, -6.393176078796387, -5.0576171875, -3.722057342529297, -2.386497974395752, -1.050938606262207, 0.2846207618713379, 1.6201801300048828, 2.9557394981384277, 4.291298866271973, 5.626857757568359, 6.962421417236328, 8.297981262207031, 9.633540153503418, 10.969099044799805, 12.304658889770508, 13.640218734741211, 14.975777626037598, 16.311336517333984, 17.646896362304688, 18.98245620727539, 20.318016052246094, 21.653573989868164, 22.989133834838867, 24.32469367980957, 25.66025161743164, 26.995811462402344, 28.331371307373047, 29.66693115234375, 31.002490997314453, 32.338050842285156, 33.673606872558594, 35.0091667175293, 36.3447265625, 37.6802864074707, 39.015846252441406, 40.35140609741211, 41.68696594238281, 43.022525787353516, 44.35808563232422, 45.693641662597656, 47.02920150756836, 48.36476135253906, 49.700321197509766]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 9.0, 12.0, 8.0, 10.0, 6.0, 13.0, 17.0, 13.0, 19.0, 23.0, 25.0, 24.0, 28.0, 30.0, 28.0, 38.0, 38.0, 26.0, 35.0, 36.0, 35.0, 42.0, 36.0, 42.0, 40.0, 36.0, 35.0, 25.0, 42.0, 24.0, 27.0, 24.0, 24.0, 20.0, 14.0, 18.0, 10.0, 12.0, 5.0, 8.0, 8.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-42.815799713134766, -41.51879119873047, -40.22178268432617, -38.924774169921875, -37.627769470214844, -36.33076095581055, -35.03375244140625, -33.73674392700195, -32.439735412597656, -31.14272689819336, -29.845718383789062, -28.5487117767334, -27.2517032623291, -25.954694747924805, -24.65768814086914, -23.360679626464844, -22.063671112060547, -20.76666259765625, -19.469654083251953, -18.17264747619629, -16.875638961791992, -15.578630447387695, -14.281622886657715, -12.984615325927734, -11.687606811523438, -10.39059829711914, -9.09359073638916, -7.7965826988220215, -6.499574661254883, -5.202566623687744, -3.9055585861206055, -2.608551025390625, -1.3115386962890625, -0.014530658721923828, 1.2824773788452148, 2.5794854164123535, 3.876493453979492, 5.173501491546631, 6.4705095291137695, 7.76751708984375, 9.064525604248047, 10.361534118652344, 11.658541679382324, 12.955549240112305, 14.252557754516602, 15.549566268920898, 16.846572875976562, 18.14358139038086, 19.440589904785156, 20.737598419189453, 22.03460693359375, 23.331613540649414, 24.62862205505371, 25.925630569458008, 27.222637176513672, 28.51964569091797, 29.816654205322266, 31.113662719726562, 32.41067123413086, 33.707679748535156, 35.00468444824219, 36.301692962646484, 37.59870147705078, 38.89570999145508, 40.192718505859375]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 8.0, 1.0, 9.0, 13.0, 16.0, 28.0, 51.0, 80.0, 126.0, 210.0, 350.0, 537.0, 963.0, 1618.0, 2866.0, 4832.0, 8682.0, 15577.0, 27837.0, 51138.0, 93677.0, 172073.0, 312669.0, 530886.0, 749148.0, 785362.0, 604804.0, 374983.0, 209391.0, 113314.0, 60885.0, 32608.0, 17926.0, 9750.0, 5282.0, 2959.0, 1606.0, 899.0, 478.0, 261.0, 153.0, 104.0, 55.0, 33.0, 25.0, 10.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.875, -35.65185546875, -34.4287109375, -33.20556640625, -31.982421875, -30.75927734375, -29.5361328125, -28.31298828125, -27.08984375, -25.86669921875, -24.6435546875, -23.42041015625, -22.197265625, -20.97412109375, -19.7509765625, -18.52783203125, -17.3046875, -16.08154296875, -14.8583984375, -13.63525390625, -12.412109375, -11.18896484375, -9.9658203125, -8.74267578125, -7.51953125, -6.29638671875, -5.0732421875, -3.85009765625, -2.626953125, -1.40380859375, -0.1806640625, 1.04248046875, 2.265625, 3.48876953125, 4.7119140625, 5.93505859375, 7.158203125, 8.38134765625, 9.6044921875, 10.82763671875, 12.05078125, 13.27392578125, 14.4970703125, 15.72021484375, 16.943359375, 18.16650390625, 19.3896484375, 20.61279296875, 21.8359375, 23.05908203125, 24.2822265625, 25.50537109375, 26.728515625, 27.95166015625, 29.1748046875, 30.39794921875, 31.62109375, 32.84423828125, 34.0673828125, 35.29052734375, 36.513671875, 37.73681640625, 38.9599609375, 40.18310546875, 41.40625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 6.0, 4.0, 14.0, 15.0, 11.0, 13.0, 15.0, 22.0, 20.0, 23.0, 28.0, 32.0, 39.0, 22.0, 29.0, 38.0, 34.0, 29.0, 31.0, 50.0, 34.0, 37.0, 38.0, 41.0, 45.0, 38.0, 20.0, 41.0, 30.0, 26.0, 23.0, 23.0, 19.0, 10.0, 22.0, 12.0, 7.0, 7.0, 7.0, 10.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-29.65625, -28.754150390625, -27.85205078125, -26.949951171875, -26.0478515625, -25.145751953125, -24.24365234375, -23.341552734375, -22.439453125, -21.537353515625, -20.63525390625, -19.733154296875, -18.8310546875, -17.928955078125, -17.02685546875, -16.124755859375, -15.22265625, -14.320556640625, -13.41845703125, -12.516357421875, -11.6142578125, -10.712158203125, -9.81005859375, -8.907958984375, -8.005859375, -7.103759765625, -6.20166015625, -5.299560546875, -4.3974609375, -3.495361328125, -2.59326171875, -1.691162109375, -0.7890625, 0.113037109375, 1.01513671875, 1.917236328125, 2.8193359375, 3.721435546875, 4.62353515625, 5.525634765625, 6.427734375, 7.329833984375, 8.23193359375, 9.134033203125, 10.0361328125, 10.938232421875, 11.84033203125, 12.742431640625, 13.64453125, 14.546630859375, 15.44873046875, 16.350830078125, 17.2529296875, 18.155029296875, 19.05712890625, 19.959228515625, 20.861328125, 21.763427734375, 22.66552734375, 23.567626953125, 24.4697265625, 25.371826171875, 26.27392578125, 27.176025390625, 28.078125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 18.0, 22.0, 45.0, 80.0, 104.0, 173.0, 323.0, 566.0, 904.0, 1587.0, 2745.0, 4749.0, 8539.0, 15419.0, 26822.0, 47246.0, 81289.0, 136823.0, 223031.0, 341555.0, 479969.0, 594881.0, 618156.0, 533476.0, 399456.0, 267673.0, 169155.0, 101378.0, 59523.0, 33956.0, 19152.0, 10982.0, 6254.0, 3540.0, 1959.0, 1146.0, 605.0, 384.0, 223.0, 138.0, 88.0, 45.0, 30.0, 27.0, 9.0, 14.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-34.25, -33.248779296875, -32.24755859375, -31.246337890625, -30.2451171875, -29.243896484375, -28.24267578125, -27.241455078125, -26.240234375, -25.239013671875, -24.23779296875, -23.236572265625, -22.2353515625, -21.234130859375, -20.23291015625, -19.231689453125, -18.23046875, -17.229248046875, -16.22802734375, -15.226806640625, -14.2255859375, -13.224365234375, -12.22314453125, -11.221923828125, -10.220703125, -9.219482421875, -8.21826171875, -7.217041015625, -6.2158203125, -5.214599609375, -4.21337890625, -3.212158203125, -2.2109375, -1.209716796875, -0.20849609375, 0.792724609375, 1.7939453125, 2.795166015625, 3.79638671875, 4.797607421875, 5.798828125, 6.800048828125, 7.80126953125, 8.802490234375, 9.8037109375, 10.804931640625, 11.80615234375, 12.807373046875, 13.80859375, 14.809814453125, 15.81103515625, 16.812255859375, 17.8134765625, 18.814697265625, 19.81591796875, 20.817138671875, 21.818359375, 22.819580078125, 23.82080078125, 24.822021484375, 25.8232421875, 26.824462890625, 27.82568359375, 28.826904296875, 29.828125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 6.0, 5.0, 6.0, 1.0, 9.0, 9.0, 14.0, 15.0, 14.0, 22.0, 42.0, 48.0, 43.0, 66.0, 72.0, 91.0, 116.0, 134.0, 156.0, 179.0, 190.0, 223.0, 235.0, 258.0, 266.0, 244.0, 239.0, 210.0, 188.0, 204.0, 146.0, 142.0, 88.0, 98.0, 73.0, 56.0, 37.0, 43.0, 36.0, 12.0, 18.0, 14.0, 6.0, 6.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5390625, -14.0382080078125, -13.537353515625, -13.0364990234375, -12.53564453125, -12.0347900390625, -11.533935546875, -11.0330810546875, -10.5322265625, -10.0313720703125, -9.530517578125, -9.0296630859375, -8.52880859375, -8.0279541015625, -7.527099609375, -7.0262451171875, -6.525390625, -6.0245361328125, -5.523681640625, -5.0228271484375, -4.52197265625, -4.0211181640625, -3.520263671875, -3.0194091796875, -2.5185546875, -2.0177001953125, -1.516845703125, -1.0159912109375, -0.51513671875, -0.0142822265625, 0.486572265625, 0.9874267578125, 1.48828125, 1.9891357421875, 2.489990234375, 2.9908447265625, 3.49169921875, 3.9925537109375, 4.493408203125, 4.9942626953125, 5.4951171875, 5.9959716796875, 6.496826171875, 6.9976806640625, 7.49853515625, 7.9993896484375, 8.500244140625, 9.0010986328125, 9.501953125, 10.0028076171875, 10.503662109375, 11.0045166015625, 11.50537109375, 12.0062255859375, 12.507080078125, 13.0079345703125, 13.5087890625, 14.0096435546875, 14.510498046875, 15.0113525390625, 15.51220703125, 16.0130615234375, 16.513916015625, 17.0147705078125, 17.515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 6.0, 8.0, 4.0, 5.0, 5.0, 12.0, 13.0, 5.0, 16.0, 24.0, 30.0, 32.0, 28.0, 33.0, 34.0, 33.0, 32.0, 31.0, 27.0, 46.0, 50.0, 42.0, 42.0, 39.0, 42.0, 26.0, 32.0, 31.0, 30.0, 26.0, 36.0, 22.0, 23.0, 10.0, 19.0, 20.0, 12.0, 9.0, 11.0, 10.0, 13.0, 2.0, 6.0, 3.0, 2.0, 4.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-26.792695999145508, -25.934385299682617, -25.07607650756836, -24.21776580810547, -23.359455108642578, -22.50114631652832, -21.64283561706543, -20.784526824951172, -19.92621612548828, -19.06790542602539, -18.209596633911133, -17.351285934448242, -16.492977142333984, -15.634666442871094, -14.776355743408203, -13.918045997619629, -13.059736251831055, -12.20142650604248, -11.343116760253906, -10.484806060791016, -9.626496315002441, -8.768186569213867, -7.909876346588135, -7.051566123962402, -6.193256378173828, -5.334946632385254, -4.4766364097595215, -3.618326425552368, -2.760016441345215, -1.9017066955566406, -1.0433964729309082, -0.18508625030517578, 0.6732215881347656, 1.531531572341919, 2.3898415565490723, 3.2481515407562256, 4.106461524963379, 4.964771270751953, 5.8230814933776855, 6.681391716003418, 7.539701461791992, 8.398011207580566, 9.25632095336914, 10.114631652832031, 10.972941398620605, 11.83125114440918, 12.68956184387207, 13.547871589660645, 14.406181335449219, 15.264491081237793, 16.122800827026367, 16.981111526489258, 17.839420318603516, 18.697731018066406, 19.556041717529297, 20.414352416992188, 21.272661209106445, 22.130971908569336, 22.989280700683594, 23.847591400146484, 24.705902099609375, 25.564210891723633, 26.422521591186523, 27.28083038330078, 28.139141082763672]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 9.0, 10.0, 7.0, 16.0, 15.0, 17.0, 18.0, 17.0, 21.0, 21.0, 19.0, 32.0, 33.0, 32.0, 36.0, 34.0, 27.0, 33.0, 43.0, 41.0, 27.0, 36.0, 41.0, 36.0, 40.0, 47.0, 32.0, 34.0, 31.0, 34.0, 22.0, 21.0, 17.0, 14.0, 16.0, 11.0, 11.0, 14.0, 3.0, 6.0, 7.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-37.08106231689453, -36.048091888427734, -35.01512145996094, -33.98215103149414, -32.949180603027344, -31.91621208190918, -30.883241653442383, -29.850271224975586, -28.817302703857422, -27.784332275390625, -26.751361846923828, -25.71839141845703, -24.685422897338867, -23.65245246887207, -22.619482040405273, -21.586511611938477, -20.55354118347168, -19.520570755004883, -18.487600326538086, -17.454631805419922, -16.421661376953125, -15.388690948486328, -14.355720520019531, -13.322750091552734, -12.289780616760254, -11.256810188293457, -10.223840713500977, -9.19087028503418, -8.157899856567383, -7.124930381774902, -6.0919599533081055, -5.058990001678467, -4.026020050048828, -2.9930500984191895, -1.9600799083709717, -0.9271097183227539, 0.10586023330688477, 1.1388301849365234, 2.1718006134033203, 3.204770565032959, 4.237740516662598, 5.270710468292236, 6.303680419921875, 7.336650848388672, 8.369621276855469, 9.40259075164795, 10.435561180114746, 11.468530654907227, 12.501501083374023, 13.53447151184082, 14.5674409866333, 15.600411415100098, 16.633380889892578, 17.666351318359375, 18.699321746826172, 19.73229217529297, 20.765262603759766, 21.798233032226562, 22.83120346069336, 23.864173889160156, 24.89714241027832, 25.930112838745117, 26.963083267211914, 27.99605369567871, 29.029022216796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 9.0, 17.0, 20.0, 25.0, 46.0, 68.0, 82.0, 166.0, 231.0, 390.0, 643.0, 1234.0, 2080.0, 3606.0, 6607.0, 12110.0, 22856.0, 45175.0, 94152.0, 196177.0, 291995.0, 188593.0, 90129.0, 43534.0, 22096.0, 11901.0, 6363.0, 3476.0, 1930.0, 1154.0, 626.0, 413.0, 213.0, 146.0, 89.0, 68.0, 35.0, 34.0, 17.0, 10.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.8798828125, -8.556640625, -8.2333984375, -7.91015625, -7.5869140625, -7.263671875, -6.9404296875, -6.6171875, -6.2939453125, -5.970703125, -5.6474609375, -5.32421875, -5.0009765625, -4.677734375, -4.3544921875, -4.03125, -3.7080078125, -3.384765625, -3.0615234375, -2.73828125, -2.4150390625, -2.091796875, -1.7685546875, -1.4453125, -1.1220703125, -0.798828125, -0.4755859375, -0.15234375, 0.1708984375, 0.494140625, 0.8173828125, 1.140625, 1.4638671875, 1.787109375, 2.1103515625, 2.43359375, 2.7568359375, 3.080078125, 3.4033203125, 3.7265625, 4.0498046875, 4.373046875, 4.6962890625, 5.01953125, 5.3427734375, 5.666015625, 5.9892578125, 6.3125, 6.6357421875, 6.958984375, 7.2822265625, 7.60546875, 7.9287109375, 8.251953125, 8.5751953125, 8.8984375, 9.2216796875, 9.544921875, 9.8681640625, 10.19140625, 10.5146484375, 10.837890625, 11.1611328125, 11.484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 7.0, 6.0, 5.0, 9.0, 14.0, 18.0, 19.0, 21.0, 21.0, 24.0, 29.0, 31.0, 27.0, 39.0, 30.0, 21.0, 37.0, 36.0, 38.0, 41.0, 29.0, 46.0, 41.0, 34.0, 37.0, 46.0, 35.0, 35.0, 35.0, 22.0, 24.0, 28.0, 20.0, 14.0, 11.0, 8.0, 11.0, 8.0, 5.0, 11.0, 0.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.25, -33.20751953125, -32.1650390625, -31.12255859375, -30.080078125, -29.03759765625, -27.9951171875, -26.95263671875, -25.91015625, -24.86767578125, -23.8251953125, -22.78271484375, -21.740234375, -20.69775390625, -19.6552734375, -18.61279296875, -17.5703125, -16.52783203125, -15.4853515625, -14.44287109375, -13.400390625, -12.35791015625, -11.3154296875, -10.27294921875, -9.23046875, -8.18798828125, -7.1455078125, -6.10302734375, -5.060546875, -4.01806640625, -2.9755859375, -1.93310546875, -0.890625, 0.15185546875, 1.1943359375, 2.23681640625, 3.279296875, 4.32177734375, 5.3642578125, 6.40673828125, 7.44921875, 8.49169921875, 9.5341796875, 10.57666015625, 11.619140625, 12.66162109375, 13.7041015625, 14.74658203125, 15.7890625, 16.83154296875, 17.8740234375, 18.91650390625, 19.958984375, 21.00146484375, 22.0439453125, 23.08642578125, 24.12890625, 25.17138671875, 26.2138671875, 27.25634765625, 28.298828125, 29.34130859375, 30.3837890625, 31.42626953125, 32.46875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 11.0, 13.0, 26.0, 21.0, 35.0, 33.0, 53.0, 71.0, 105.0, 133.0, 211.0, 289.0, 467.0, 701.0, 1070.0, 1614.0, 2515.0, 4100.0, 6781.0, 11509.0, 19923.0, 35324.0, 63773.0, 114875.0, 191636.0, 231154.0, 156184.0, 89662.0, 49101.0, 27335.0, 15497.0, 9265.0, 5627.0, 3369.0, 2053.0, 1296.0, 825.0, 603.0, 381.0, 255.0, 205.0, 122.0, 89.0, 72.0, 48.0, 28.0, 22.0, 22.0, 20.0, 6.0, 3.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-5.9765625, -5.79144287109375, -5.6063232421875, -5.42120361328125, -5.236083984375, -5.05096435546875, -4.8658447265625, -4.68072509765625, -4.49560546875, -4.31048583984375, -4.1253662109375, -3.94024658203125, -3.755126953125, -3.57000732421875, -3.3848876953125, -3.19976806640625, -3.0146484375, -2.82952880859375, -2.6444091796875, -2.45928955078125, -2.274169921875, -2.08905029296875, -1.9039306640625, -1.71881103515625, -1.53369140625, -1.34857177734375, -1.1634521484375, -0.97833251953125, -0.793212890625, -0.60809326171875, -0.4229736328125, -0.23785400390625, -0.052734375, 0.13238525390625, 0.3175048828125, 0.50262451171875, 0.687744140625, 0.87286376953125, 1.0579833984375, 1.24310302734375, 1.42822265625, 1.61334228515625, 1.7984619140625, 1.98358154296875, 2.168701171875, 2.35382080078125, 2.5389404296875, 2.72406005859375, 2.9091796875, 3.09429931640625, 3.2794189453125, 3.46453857421875, 3.649658203125, 3.83477783203125, 4.0198974609375, 4.20501708984375, 4.39013671875, 4.57525634765625, 4.7603759765625, 4.94549560546875, 5.130615234375, 5.31573486328125, 5.5008544921875, 5.68597412109375, 5.87109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 10.0, 5.0, 9.0, 15.0, 24.0, 14.0, 14.0, 18.0, 21.0, 29.0, 27.0, 31.0, 26.0, 26.0, 26.0, 46.0, 38.0, 43.0, 31.0, 29.0, 33.0, 41.0, 46.0, 34.0, 36.0, 33.0, 28.0, 30.0, 26.0, 20.0, 26.0, 26.0, 22.0, 10.0, 19.0, 14.0, 11.0, 16.0, 5.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.890625, -24.128662109375, -23.36669921875, -22.604736328125, -21.8427734375, -21.080810546875, -20.31884765625, -19.556884765625, -18.794921875, -18.032958984375, -17.27099609375, -16.509033203125, -15.7470703125, -14.985107421875, -14.22314453125, -13.461181640625, -12.69921875, -11.937255859375, -11.17529296875, -10.413330078125, -9.6513671875, -8.889404296875, -8.12744140625, -7.365478515625, -6.603515625, -5.841552734375, -5.07958984375, -4.317626953125, -3.5556640625, -2.793701171875, -2.03173828125, -1.269775390625, -0.5078125, 0.254150390625, 1.01611328125, 1.778076171875, 2.5400390625, 3.302001953125, 4.06396484375, 4.825927734375, 5.587890625, 6.349853515625, 7.11181640625, 7.873779296875, 8.6357421875, 9.397705078125, 10.15966796875, 10.921630859375, 11.68359375, 12.445556640625, 13.20751953125, 13.969482421875, 14.7314453125, 15.493408203125, 16.25537109375, 17.017333984375, 17.779296875, 18.541259765625, 19.30322265625, 20.065185546875, 20.8271484375, 21.589111328125, 22.35107421875, 23.113037109375, 23.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 2.0, 5.0, 5.0, 12.0, 17.0, 23.0, 41.0, 65.0, 90.0, 147.0, 215.0, 321.0, 464.0, 712.0, 1049.0, 1636.0, 2597.0, 4381.0, 7449.0, 13190.0, 25049.0, 51079.0, 112902.0, 292708.0, 305728.0, 117507.0, 52355.0, 25641.0, 13472.0, 7696.0, 4474.0, 2675.0, 1678.0, 1043.0, 681.0, 471.0, 326.0, 210.0, 156.0, 93.0, 67.0, 43.0, 36.0, 18.0, 7.0, 4.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.642578125, -0.6218643188476562, -0.6011505126953125, -0.5804367065429688, -0.559722900390625, -0.5390090942382812, -0.5182952880859375, -0.49758148193359375, -0.47686767578125, -0.45615386962890625, -0.4354400634765625, -0.41472625732421875, -0.394012451171875, -0.37329864501953125, -0.3525848388671875, -0.33187103271484375, -0.3111572265625, -0.29044342041015625, -0.2697296142578125, -0.24901580810546875, -0.228302001953125, -0.20758819580078125, -0.1868743896484375, -0.16616058349609375, -0.14544677734375, -0.12473297119140625, -0.1040191650390625, -0.08330535888671875, -0.062591552734375, -0.04187774658203125, -0.0211639404296875, -0.00045013427734375, 0.020263671875, 0.04097747802734375, 0.0616912841796875, 0.08240509033203125, 0.103118896484375, 0.12383270263671875, 0.1445465087890625, 0.16526031494140625, 0.18597412109375, 0.20668792724609375, 0.2274017333984375, 0.24811553955078125, 0.268829345703125, 0.28954315185546875, 0.3102569580078125, 0.33097076416015625, 0.3516845703125, 0.37239837646484375, 0.3931121826171875, 0.41382598876953125, 0.434539794921875, 0.45525360107421875, 0.4759674072265625, 0.49668121337890625, 0.51739501953125, 0.5381088256835938, 0.5588226318359375, 0.5795364379882812, 0.600250244140625, 0.6209640502929688, 0.6416778564453125, 0.6623916625976562, 0.68310546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 5.0, 4.0, 9.0, 9.0, 11.0, 9.0, 26.0, 31.0, 41.0, 47.0, 78.0, 67.0, 85.0, 98.0, 83.0, 93.0, 75.0, 68.0, 44.0, 25.0, 25.0, 17.0, 17.0, 11.0, 4.0, 2.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013875961303710938, -0.00013453513383865356, -0.00013031065464019775, -0.00012608617544174194, -0.00012186169624328613, -0.00011763721704483032, -0.00011341273784637451, -0.0001091882586479187, -0.00010496377944946289, -0.00010073930025100708, -9.651482105255127e-05, -9.229034185409546e-05, -8.806586265563965e-05, -8.384138345718384e-05, -7.961690425872803e-05, -7.539242506027222e-05, -7.11679458618164e-05, -6.69434666633606e-05, -6.271898746490479e-05, -5.8494508266448975e-05, -5.4270029067993164e-05, -5.0045549869537354e-05, -4.582107067108154e-05, -4.159659147262573e-05, -3.737211227416992e-05, -3.314763307571411e-05, -2.89231538772583e-05, -2.469867467880249e-05, -2.047419548034668e-05, -1.624971628189087e-05, -1.2025237083435059e-05, -7.800757884979248e-06, -3.5762786865234375e-06, 6.48200511932373e-07, 4.872679710388184e-06, 9.097158908843994e-06, 1.3321638107299805e-05, 1.7546117305755615e-05, 2.1770596504211426e-05, 2.5995075702667236e-05, 3.0219554901123047e-05, 3.444403409957886e-05, 3.866851329803467e-05, 4.289299249649048e-05, 4.711747169494629e-05, 5.13419508934021e-05, 5.556643009185791e-05, 5.979090929031372e-05, 6.401538848876953e-05, 6.823986768722534e-05, 7.246434688568115e-05, 7.668882608413696e-05, 8.091330528259277e-05, 8.513778448104858e-05, 8.93622636795044e-05, 9.35867428779602e-05, 9.781122207641602e-05, 0.00010203570127487183, 0.00010626018047332764, 0.00011048465967178345, 0.00011470913887023926, 0.00011893361806869507, 0.00012315809726715088, 0.0001273825764656067, 0.0001316070556640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 14.0, 13.0, 26.0, 37.0, 64.0, 75.0, 148.0, 229.0, 309.0, 460.0, 720.0, 1164.0, 1596.0, 2425.0, 3783.0, 5639.0, 8214.0, 12556.0, 18439.0, 27743.0, 43322.0, 67580.0, 113405.0, 225121.0, 215368.0, 110426.0, 65864.0, 41577.0, 27561.0, 18191.0, 12057.0, 8014.0, 5526.0, 3687.0, 2398.0, 1587.0, 1186.0, 725.0, 453.0, 300.0, 194.0, 120.0, 76.0, 60.0, 31.0, 26.0, 9.0, 13.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.1015625, -1.067108154296875, -1.03265380859375, -0.998199462890625, -0.9637451171875, -0.929290771484375, -0.89483642578125, -0.860382080078125, -0.825927734375, -0.791473388671875, -0.75701904296875, -0.722564697265625, -0.6881103515625, -0.653656005859375, -0.61920166015625, -0.584747314453125, -0.55029296875, -0.515838623046875, -0.48138427734375, -0.446929931640625, -0.4124755859375, -0.378021240234375, -0.34356689453125, -0.309112548828125, -0.274658203125, -0.240203857421875, -0.20574951171875, -0.171295166015625, -0.1368408203125, -0.102386474609375, -0.06793212890625, -0.033477783203125, 0.0009765625, 0.035430908203125, 0.06988525390625, 0.104339599609375, 0.1387939453125, 0.173248291015625, 0.20770263671875, 0.242156982421875, 0.276611328125, 0.311065673828125, 0.34552001953125, 0.379974365234375, 0.4144287109375, 0.448883056640625, 0.48333740234375, 0.517791748046875, 0.55224609375, 0.586700439453125, 0.62115478515625, 0.655609130859375, 0.6900634765625, 0.724517822265625, 0.75897216796875, 0.793426513671875, 0.827880859375, 0.862335205078125, 0.89678955078125, 0.931243896484375, 0.9656982421875, 1.000152587890625, 1.03460693359375, 1.069061279296875, 1.103515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 2.0, 9.0, 7.0, 5.0, 6.0, 15.0, 13.0, 9.0, 16.0, 17.0, 15.0, 20.0, 40.0, 23.0, 22.0, 41.0, 40.0, 39.0, 41.0, 39.0, 53.0, 37.0, 44.0, 49.0, 33.0, 45.0, 47.0, 29.0, 30.0, 22.0, 26.0, 17.0, 21.0, 16.0, 18.0, 16.0, 11.0, 12.0, 6.0, 12.0, 9.0, 5.0, 7.0, 5.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51513671875, -0.49884033203125, -0.4825439453125, -0.46624755859375, -0.449951171875, -0.43365478515625, -0.4173583984375, -0.40106201171875, -0.384765625, -0.36846923828125, -0.3521728515625, -0.33587646484375, -0.319580078125, -0.30328369140625, -0.2869873046875, -0.27069091796875, -0.25439453125, -0.23809814453125, -0.2218017578125, -0.20550537109375, -0.189208984375, -0.17291259765625, -0.1566162109375, -0.14031982421875, -0.1240234375, -0.10772705078125, -0.0914306640625, -0.07513427734375, -0.058837890625, -0.04254150390625, -0.0262451171875, -0.00994873046875, 0.00634765625, 0.02264404296875, 0.0389404296875, 0.05523681640625, 0.071533203125, 0.08782958984375, 0.1041259765625, 0.12042236328125, 0.13671875, 0.15301513671875, 0.1693115234375, 0.18560791015625, 0.201904296875, 0.21820068359375, 0.2344970703125, 0.25079345703125, 0.26708984375, 0.28338623046875, 0.2996826171875, 0.31597900390625, 0.332275390625, 0.34857177734375, 0.3648681640625, 0.38116455078125, 0.3974609375, 0.41375732421875, 0.4300537109375, 0.44635009765625, 0.462646484375, 0.47894287109375, 0.4952392578125, 0.51153564453125, 0.52783203125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 5.0, 8.0, 5.0, 5.0, 4.0, 5.0, 13.0, 12.0, 7.0, 19.0, 21.0, 32.0, 37.0, 24.0, 32.0, 28.0, 34.0, 30.0, 33.0, 32.0, 41.0, 46.0, 43.0, 49.0, 39.0, 35.0, 34.0, 33.0, 30.0, 30.0, 29.0, 20.0, 26.0, 24.0, 19.0, 13.0, 18.0, 11.0, 10.0, 15.0, 9.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.985017776489258, -24.15036964416504, -23.315719604492188, -22.48107147216797, -21.64642333984375, -20.81177520751953, -19.977127075195312, -19.14247703552246, -18.307828903198242, -17.473180770874023, -16.638530731201172, -15.803882598876953, -14.969234466552734, -14.134586334228516, -13.29993724822998, -12.465288162231445, -11.630640029907227, -10.795991897583008, -9.961342811584473, -9.126693725585938, -8.292045593261719, -7.457396984100342, -6.622748374938965, -5.788099765777588, -4.953451156616211, -4.118802547454834, -3.284153938293457, -2.44950532913208, -1.6148567199707031, -0.7802081108093262, 0.05444049835205078, 0.8890891075134277, 1.7237358093261719, 2.558384418487549, 3.393033027648926, 4.227681636810303, 5.06233024597168, 5.896978855133057, 6.731627464294434, 7.5662760734558105, 8.400924682617188, 9.235572814941406, 10.070221900939941, 10.904870986938477, 11.739519119262695, 12.574167251586914, 13.40881633758545, 14.243465423583984, 15.078113555908203, 15.912761688232422, 16.74740982055664, 17.582059860229492, 18.41670799255371, 19.25135612487793, 20.08600616455078, 20.920654296875, 21.75530242919922, 22.589950561523438, 23.424598693847656, 24.259248733520508, 25.093896865844727, 25.928544998168945, 26.763195037841797, 27.597843170166016, 28.432491302490234]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 8.0, 6.0, 11.0, 8.0, 20.0, 13.0, 16.0, 18.0, 23.0, 19.0, 20.0, 21.0, 30.0, 36.0, 31.0, 36.0, 32.0, 25.0, 38.0, 44.0, 38.0, 28.0, 36.0, 43.0, 36.0, 44.0, 39.0, 39.0, 33.0, 31.0, 29.0, 20.0, 20.0, 16.0, 16.0, 13.0, 15.0, 12.0, 10.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-36.0355110168457, -35.02525329589844, -34.01499938964844, -33.00474166870117, -31.99448585510254, -30.984230041503906, -29.97397232055664, -28.963716506958008, -27.953460693359375, -26.943204879760742, -25.93294906616211, -24.922691345214844, -23.91243553161621, -22.902179718017578, -21.891921997070312, -20.88166618347168, -19.871410369873047, -18.861154556274414, -17.85089874267578, -16.840641021728516, -15.830385208129883, -14.82012939453125, -13.8098726272583, -12.799615859985352, -11.789360046386719, -10.779104232788086, -9.768847465515137, -8.758590698242188, -7.748334884643555, -6.738078594207764, -5.727822303771973, -4.717566013336182, -3.7073116302490234, -2.6970553398132324, -1.6867990493774414, -0.6765427589416504, 0.3337135314941406, 1.3439698219299316, 2.3542261123657227, 3.3644824028015137, 4.374738693237305, 5.384994983673096, 6.395251274108887, 7.405507564544678, 8.415763854980469, 9.426019668579102, 10.43627643585205, 11.446533203125, 12.456789016723633, 13.467044830322266, 14.477301597595215, 15.487558364868164, 16.497814178466797, 17.50806999206543, 18.518325805664062, 19.528583526611328, 20.53883934020996, 21.549095153808594, 22.55935287475586, 23.569608688354492, 24.579864501953125, 25.590120315551758, 26.60037612915039, 27.610633850097656, 28.62088966369629]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 18.0, 25.0, 33.0, 59.0, 75.0, 135.0, 216.0, 336.0, 499.0, 806.0, 1220.0, 1895.0, 3004.0, 4638.0, 7107.0, 11272.0, 16655.0, 26070.0, 37936.0, 54132.0, 73634.0, 93420.0, 110857.0, 119017.0, 115028.0, 100234.0, 80725.0, 60672.0, 43070.0, 29446.0, 19709.0, 12975.0, 8470.0, 5513.0, 3430.0, 2231.0, 1457.0, 902.0, 562.0, 356.0, 253.0, 152.0, 102.0, 77.0, 44.0, 38.0, 20.0, 8.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.3125, -24.560791015625, -23.80908203125, -23.057373046875, -22.3056640625, -21.553955078125, -20.80224609375, -20.050537109375, -19.298828125, -18.547119140625, -17.79541015625, -17.043701171875, -16.2919921875, -15.540283203125, -14.78857421875, -14.036865234375, -13.28515625, -12.533447265625, -11.78173828125, -11.030029296875, -10.2783203125, -9.526611328125, -8.77490234375, -8.023193359375, -7.271484375, -6.519775390625, -5.76806640625, -5.016357421875, -4.2646484375, -3.512939453125, -2.76123046875, -2.009521484375, -1.2578125, -0.506103515625, 0.24560546875, 0.997314453125, 1.7490234375, 2.500732421875, 3.25244140625, 4.004150390625, 4.755859375, 5.507568359375, 6.25927734375, 7.010986328125, 7.7626953125, 8.514404296875, 9.26611328125, 10.017822265625, 10.76953125, 11.521240234375, 12.27294921875, 13.024658203125, 13.7763671875, 14.528076171875, 15.27978515625, 16.031494140625, 16.783203125, 17.534912109375, 18.28662109375, 19.038330078125, 19.7900390625, 20.541748046875, 21.29345703125, 22.045166015625, 22.796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 9.0, 8.0, 12.0, 7.0, 8.0, 10.0, 19.0, 27.0, 13.0, 19.0, 34.0, 23.0, 26.0, 36.0, 31.0, 28.0, 45.0, 43.0, 31.0, 24.0, 32.0, 44.0, 31.0, 39.0, 45.0, 37.0, 38.0, 44.0, 23.0, 27.0, 26.0, 18.0, 20.0, 19.0, 14.0, 11.0, 12.0, 9.0, 13.0, 7.0, 10.0, 6.0, 8.0, 1.0, 3.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.953125, -31.007080078125, -30.06103515625, -29.114990234375, -28.1689453125, -27.222900390625, -26.27685546875, -25.330810546875, -24.384765625, -23.438720703125, -22.49267578125, -21.546630859375, -20.6005859375, -19.654541015625, -18.70849609375, -17.762451171875, -16.81640625, -15.870361328125, -14.92431640625, -13.978271484375, -13.0322265625, -12.086181640625, -11.14013671875, -10.194091796875, -9.248046875, -8.302001953125, -7.35595703125, -6.409912109375, -5.4638671875, -4.517822265625, -3.57177734375, -2.625732421875, -1.6796875, -0.733642578125, 0.21240234375, 1.158447265625, 2.1044921875, 3.050537109375, 3.99658203125, 4.942626953125, 5.888671875, 6.834716796875, 7.78076171875, 8.726806640625, 9.6728515625, 10.618896484375, 11.56494140625, 12.510986328125, 13.45703125, 14.403076171875, 15.34912109375, 16.295166015625, 17.2412109375, 18.187255859375, 19.13330078125, 20.079345703125, 21.025390625, 21.971435546875, 22.91748046875, 23.863525390625, 24.8095703125, 25.755615234375, 26.70166015625, 27.647705078125, 28.59375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 11.0, 10.0, 14.0, 38.0, 52.0, 86.0, 117.0, 199.0, 301.0, 471.0, 758.0, 1179.0, 1893.0, 2936.0, 4710.0, 7352.0, 11558.0, 17986.0, 27315.0, 41302.0, 59787.0, 83020.0, 105926.0, 123196.0, 126494.0, 116638.0, 95008.0, 72064.0, 50858.0, 34281.0, 22643.0, 14670.0, 9339.0, 6009.0, 3716.0, 2471.0, 1499.0, 955.0, 603.0, 405.0, 254.0, 162.0, 97.0, 54.0, 39.0, 28.0, 20.0, 16.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.40625, -25.561767578125, -24.71728515625, -23.872802734375, -23.0283203125, -22.183837890625, -21.33935546875, -20.494873046875, -19.650390625, -18.805908203125, -17.96142578125, -17.116943359375, -16.2724609375, -15.427978515625, -14.58349609375, -13.739013671875, -12.89453125, -12.050048828125, -11.20556640625, -10.361083984375, -9.5166015625, -8.672119140625, -7.82763671875, -6.983154296875, -6.138671875, -5.294189453125, -4.44970703125, -3.605224609375, -2.7607421875, -1.916259765625, -1.07177734375, -0.227294921875, 0.6171875, 1.461669921875, 2.30615234375, 3.150634765625, 3.9951171875, 4.839599609375, 5.68408203125, 6.528564453125, 7.373046875, 8.217529296875, 9.06201171875, 9.906494140625, 10.7509765625, 11.595458984375, 12.43994140625, 13.284423828125, 14.12890625, 14.973388671875, 15.81787109375, 16.662353515625, 17.5068359375, 18.351318359375, 19.19580078125, 20.040283203125, 20.884765625, 21.729248046875, 22.57373046875, 23.418212890625, 24.2626953125, 25.107177734375, 25.95166015625, 26.796142578125, 27.640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 5.0, 6.0, 10.0, 14.0, 9.0, 19.0, 14.0, 19.0, 16.0, 24.0, 26.0, 23.0, 35.0, 38.0, 46.0, 34.0, 47.0, 39.0, 39.0, 45.0, 34.0, 47.0, 44.0, 35.0, 38.0, 35.0, 29.0, 38.0, 26.0, 27.0, 22.0, 13.0, 20.0, 12.0, 5.0, 11.0, 11.0, 8.0, 6.0, 6.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.66552734375, -18.0029296875, -17.34033203125, -16.677734375, -16.01513671875, -15.3525390625, -14.68994140625, -14.02734375, -13.36474609375, -12.7021484375, -12.03955078125, -11.376953125, -10.71435546875, -10.0517578125, -9.38916015625, -8.7265625, -8.06396484375, -7.4013671875, -6.73876953125, -6.076171875, -5.41357421875, -4.7509765625, -4.08837890625, -3.42578125, -2.76318359375, -2.1005859375, -1.43798828125, -0.775390625, -0.11279296875, 0.5498046875, 1.21240234375, 1.875, 2.53759765625, 3.2001953125, 3.86279296875, 4.525390625, 5.18798828125, 5.8505859375, 6.51318359375, 7.17578125, 7.83837890625, 8.5009765625, 9.16357421875, 9.826171875, 10.48876953125, 11.1513671875, 11.81396484375, 12.4765625, 13.13916015625, 13.8017578125, 14.46435546875, 15.126953125, 15.78955078125, 16.4521484375, 17.11474609375, 17.77734375, 18.43994140625, 19.1025390625, 19.76513671875, 20.427734375, 21.09033203125, 21.7529296875, 22.41552734375, 23.078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 10.0, 12.0, 10.0, 21.0, 36.0, 61.0, 104.0, 162.0, 287.0, 461.0, 723.0, 1212.0, 2166.0, 3869.0, 6845.0, 12007.0, 21242.0, 36080.0, 61034.0, 94711.0, 131739.0, 158696.0, 157202.0, 129108.0, 91212.0, 58018.0, 34815.0, 20048.0, 11341.0, 6521.0, 3607.0, 2146.0, 1238.0, 710.0, 394.0, 253.0, 162.0, 88.0, 53.0, 42.0, 24.0, 29.0, 7.0, 7.0, 7.0, 9.0, 6.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.5546875, -7.302490234375, -7.05029296875, -6.798095703125, -6.5458984375, -6.293701171875, -6.04150390625, -5.789306640625, -5.537109375, -5.284912109375, -5.03271484375, -4.780517578125, -4.5283203125, -4.276123046875, -4.02392578125, -3.771728515625, -3.51953125, -3.267333984375, -3.01513671875, -2.762939453125, -2.5107421875, -2.258544921875, -2.00634765625, -1.754150390625, -1.501953125, -1.249755859375, -0.99755859375, -0.745361328125, -0.4931640625, -0.240966796875, 0.01123046875, 0.263427734375, 0.515625, 0.767822265625, 1.02001953125, 1.272216796875, 1.5244140625, 1.776611328125, 2.02880859375, 2.281005859375, 2.533203125, 2.785400390625, 3.03759765625, 3.289794921875, 3.5419921875, 3.794189453125, 4.04638671875, 4.298583984375, 4.55078125, 4.802978515625, 5.05517578125, 5.307373046875, 5.5595703125, 5.811767578125, 6.06396484375, 6.316162109375, 6.568359375, 6.820556640625, 7.07275390625, 7.324951171875, 7.5771484375, 7.829345703125, 8.08154296875, 8.333740234375, 8.5859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 8.0, 5.0, 14.0, 4.0, 19.0, 15.0, 15.0, 22.0, 24.0, 27.0, 35.0, 29.0, 37.0, 39.0, 43.0, 41.0, 48.0, 43.0, 52.0, 45.0, 44.0, 53.0, 39.0, 38.0, 33.0, 31.0, 30.0, 34.0, 22.0, 19.0, 18.0, 16.0, 9.0, 3.0, 4.0, 4.0, 11.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006666183471679688, -0.000645853579044342, -0.0006250888109207153, -0.0006043240427970886, -0.0005835592746734619, -0.0005627945065498352, -0.0005420297384262085, -0.0005212649703025818, -0.0005005002021789551, -0.00047973543405532837, -0.00045897066593170166, -0.00043820589780807495, -0.00041744112968444824, -0.00039667636156082153, -0.0003759115934371948, -0.0003551468253135681, -0.0003343820571899414, -0.0003136172890663147, -0.000292852520942688, -0.0002720877528190613, -0.00025132298469543457, -0.00023055821657180786, -0.00020979344844818115, -0.00018902868032455444, -0.00016826391220092773, -0.00014749914407730103, -0.00012673437595367432, -0.00010596960783004761, -8.52048397064209e-05, -6.444007158279419e-05, -4.367530345916748e-05, -2.291053533554077e-05, -2.1457672119140625e-06, 1.8619000911712646e-05, 3.9383769035339355e-05, 6.0148537158966064e-05, 8.091330528259277e-05, 0.00010167807340621948, 0.0001224428415298462, 0.0001432076096534729, 0.0001639723777770996, 0.00018473714590072632, 0.00020550191402435303, 0.00022626668214797974, 0.00024703145027160645, 0.00026779621839523315, 0.00028856098651885986, 0.00030932575464248657, 0.0003300905227661133, 0.00035085529088974, 0.0003716200590133667, 0.0003923848271369934, 0.0004131495952606201, 0.0004339143633842468, 0.00045467913150787354, 0.00047544389963150024, 0.000496208667755127, 0.0005169734358787537, 0.0005377382040023804, 0.0005585029721260071, 0.0005792677402496338, 0.0006000325083732605, 0.0006207972764968872, 0.0006415620446205139, 0.0006623268127441406]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 6.0, 5.0, 7.0, 11.0, 11.0, 17.0, 35.0, 70.0, 86.0, 122.0, 194.0, 296.0, 442.0, 639.0, 1054.0, 1599.0, 2462.0, 3604.0, 5780.0, 8853.0, 13682.0, 20424.0, 30360.0, 44378.0, 62751.0, 83193.0, 103048.0, 117263.0, 119380.0, 110422.0, 91763.0, 70352.0, 51416.0, 35401.0, 24139.0, 15735.0, 10151.0, 6721.0, 4436.0, 2902.0, 1764.0, 1244.0, 783.0, 517.0, 374.0, 214.0, 158.0, 119.0, 75.0, 45.0, 20.0, 13.0, 12.0, 9.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-5.9453125, -5.7484130859375, -5.551513671875, -5.3546142578125, -5.15771484375, -4.9608154296875, -4.763916015625, -4.5670166015625, -4.3701171875, -4.1732177734375, -3.976318359375, -3.7794189453125, -3.58251953125, -3.3856201171875, -3.188720703125, -2.9918212890625, -2.794921875, -2.5980224609375, -2.401123046875, -2.2042236328125, -2.00732421875, -1.8104248046875, -1.613525390625, -1.4166259765625, -1.2197265625, -1.0228271484375, -0.825927734375, -0.6290283203125, -0.43212890625, -0.2352294921875, -0.038330078125, 0.1585693359375, 0.35546875, 0.5523681640625, 0.749267578125, 0.9461669921875, 1.14306640625, 1.3399658203125, 1.536865234375, 1.7337646484375, 1.9306640625, 2.1275634765625, 2.324462890625, 2.5213623046875, 2.71826171875, 2.9151611328125, 3.112060546875, 3.3089599609375, 3.505859375, 3.7027587890625, 3.899658203125, 4.0965576171875, 4.29345703125, 4.4903564453125, 4.687255859375, 4.8841552734375, 5.0810546875, 5.2779541015625, 5.474853515625, 5.6717529296875, 5.86865234375, 6.0655517578125, 6.262451171875, 6.4593505859375, 6.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 12.0, 6.0, 10.0, 7.0, 15.0, 21.0, 19.0, 22.0, 23.0, 21.0, 25.0, 42.0, 37.0, 37.0, 40.0, 51.0, 40.0, 46.0, 48.0, 46.0, 40.0, 35.0, 41.0, 45.0, 31.0, 39.0, 29.0, 29.0, 27.0, 19.0, 16.0, 18.0, 14.0, 16.0, 9.0, 9.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12109375, -2.04443359375, -1.9677734375, -1.89111328125, -1.814453125, -1.73779296875, -1.6611328125, -1.58447265625, -1.5078125, -1.43115234375, -1.3544921875, -1.27783203125, -1.201171875, -1.12451171875, -1.0478515625, -0.97119140625, -0.89453125, -0.81787109375, -0.7412109375, -0.66455078125, -0.587890625, -0.51123046875, -0.4345703125, -0.35791015625, -0.28125, -0.20458984375, -0.1279296875, -0.05126953125, 0.025390625, 0.10205078125, 0.1787109375, 0.25537109375, 0.33203125, 0.40869140625, 0.4853515625, 0.56201171875, 0.638671875, 0.71533203125, 0.7919921875, 0.86865234375, 0.9453125, 1.02197265625, 1.0986328125, 1.17529296875, 1.251953125, 1.32861328125, 1.4052734375, 1.48193359375, 1.55859375, 1.63525390625, 1.7119140625, 1.78857421875, 1.865234375, 1.94189453125, 2.0185546875, 2.09521484375, 2.171875, 2.24853515625, 2.3251953125, 2.40185546875, 2.478515625, 2.55517578125, 2.6318359375, 2.70849609375, 2.78515625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 3.0, 6.0, 10.0, 10.0, 10.0, 14.0, 17.0, 18.0, 24.0, 25.0, 29.0, 25.0, 30.0, 36.0, 38.0, 29.0, 33.0, 40.0, 32.0, 58.0, 43.0, 36.0, 35.0, 32.0, 38.0, 31.0, 38.0, 28.0, 24.0, 32.0, 23.0, 22.0, 15.0, 14.0, 15.0, 17.0, 12.0, 12.0, 7.0, 7.0, 8.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-26.03148078918457, -25.20361328125, -24.37574577331543, -23.54787826538086, -22.720012664794922, -21.89214324951172, -21.06427764892578, -20.23641014099121, -19.40854263305664, -18.58067512512207, -17.7528076171875, -16.92494010925293, -16.09707260131836, -15.269206047058105, -14.441339492797852, -13.613471984863281, -12.785604476928711, -11.95773696899414, -11.12986946105957, -10.302002906799316, -9.474135398864746, -8.646267890930176, -7.818400859832764, -6.990533828735352, -6.162666320800781, -5.334798812866211, -4.506931781768799, -3.6790645122528076, -2.8511972427368164, -2.023329734802246, -1.195462703704834, -0.3675956726074219, 0.46027374267578125, 1.2881410121917725, 2.1160082817077637, 2.943875551223755, 3.771742820739746, 4.599610328674316, 5.4274773597717285, 6.255344390869141, 7.083211898803711, 7.911079406738281, 8.738946914672852, 9.566813468933105, 10.394680976867676, 11.222548484802246, 12.0504150390625, 12.87828254699707, 13.70615005493164, 14.534017562866211, 15.361885070800781, 16.18975257873535, 17.017620086669922, 17.84548568725586, 18.67335319519043, 19.501220703125, 20.32908821105957, 21.15695571899414, 21.98482322692871, 22.81269073486328, 23.64055633544922, 24.468425750732422, 25.29629135131836, 26.12415885925293, 26.9520263671875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 2.0, 9.0, 11.0, 11.0, 12.0, 20.0, 7.0, 23.0, 26.0, 19.0, 26.0, 32.0, 34.0, 35.0, 31.0, 29.0, 40.0, 45.0, 46.0, 46.0, 50.0, 41.0, 45.0, 37.0, 38.0, 41.0, 35.0, 29.0, 25.0, 15.0, 24.0, 14.0, 17.0, 15.0, 16.0, 10.0, 4.0, 7.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.694969177246094, -37.5576286315918, -36.4202880859375, -35.2829475402832, -34.145606994628906, -33.00826644897461, -31.870925903320312, -30.733585357666016, -29.59624481201172, -28.458904266357422, -27.321563720703125, -26.184223175048828, -25.04688262939453, -23.909542083740234, -22.772201538085938, -21.63486099243164, -20.497520446777344, -19.360179901123047, -18.22283935546875, -17.085498809814453, -15.948158264160156, -14.81081771850586, -13.673477172851562, -12.536136627197266, -11.398796081542969, -10.261455535888672, -9.124114990234375, -7.986774444580078, -6.849433898925781, -5.712093353271484, -4.5747528076171875, -3.4374122619628906, -2.300067901611328, -1.1627273559570312, -0.025386810302734375, 1.1119537353515625, 2.2492942810058594, 3.3866348266601562, 4.523975372314453, 5.66131591796875, 6.798656463623047, 7.935997009277344, 9.07333755493164, 10.210678100585938, 11.348018646240234, 12.485359191894531, 13.622699737548828, 14.760040283203125, 15.897380828857422, 17.03472137451172, 18.172061920166016, 19.309402465820312, 20.44674301147461, 21.584083557128906, 22.721424102783203, 23.8587646484375, 24.996105194091797, 26.133445739746094, 27.27078628540039, 28.408126831054688, 29.545467376708984, 30.68280792236328, 31.820148468017578, 32.957489013671875, 34.09482955932617]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 8.0, 11.0, 20.0, 38.0, 52.0, 76.0, 119.0, 190.0, 292.0, 539.0, 793.0, 1246.0, 2062.0, 3357.0, 5557.0, 9295.0, 15438.0, 25912.0, 42749.0, 72071.0, 118019.0, 192117.0, 298676.0, 434699.0, 561954.0, 617314.0, 564054.0, 438563.0, 301935.0, 194043.0, 118567.0, 71150.0, 42292.0, 25314.0, 14523.0, 8700.0, 5033.0, 2947.0, 1788.0, 1027.0, 678.0, 418.0, 236.0, 145.0, 83.0, 78.0, 31.0, 23.0, 19.0, 17.0, 3.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.6875, -24.89697265625, -24.1064453125, -23.31591796875, -22.525390625, -21.73486328125, -20.9443359375, -20.15380859375, -19.36328125, -18.57275390625, -17.7822265625, -16.99169921875, -16.201171875, -15.41064453125, -14.6201171875, -13.82958984375, -13.0390625, -12.24853515625, -11.4580078125, -10.66748046875, -9.876953125, -9.08642578125, -8.2958984375, -7.50537109375, -6.71484375, -5.92431640625, -5.1337890625, -4.34326171875, -3.552734375, -2.76220703125, -1.9716796875, -1.18115234375, -0.390625, 0.39990234375, 1.1904296875, 1.98095703125, 2.771484375, 3.56201171875, 4.3525390625, 5.14306640625, 5.93359375, 6.72412109375, 7.5146484375, 8.30517578125, 9.095703125, 9.88623046875, 10.6767578125, 11.46728515625, 12.2578125, 13.04833984375, 13.8388671875, 14.62939453125, 15.419921875, 16.21044921875, 17.0009765625, 17.79150390625, 18.58203125, 19.37255859375, 20.1630859375, 20.95361328125, 21.744140625, 22.53466796875, 23.3251953125, 24.11572265625, 24.90625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 4.0, 7.0, 6.0, 9.0, 10.0, 15.0, 17.0, 19.0, 16.0, 21.0, 40.0, 28.0, 27.0, 35.0, 25.0, 32.0, 38.0, 34.0, 47.0, 52.0, 47.0, 42.0, 44.0, 44.0, 45.0, 42.0, 38.0, 32.0, 30.0, 20.0, 18.0, 14.0, 17.0, 12.0, 13.0, 13.0, 6.0, 9.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.625, -24.8134765625, -24.001953125, -23.1904296875, -22.37890625, -21.5673828125, -20.755859375, -19.9443359375, -19.1328125, -18.3212890625, -17.509765625, -16.6982421875, -15.88671875, -15.0751953125, -14.263671875, -13.4521484375, -12.640625, -11.8291015625, -11.017578125, -10.2060546875, -9.39453125, -8.5830078125, -7.771484375, -6.9599609375, -6.1484375, -5.3369140625, -4.525390625, -3.7138671875, -2.90234375, -2.0908203125, -1.279296875, -0.4677734375, 0.34375, 1.1552734375, 1.966796875, 2.7783203125, 3.58984375, 4.4013671875, 5.212890625, 6.0244140625, 6.8359375, 7.6474609375, 8.458984375, 9.2705078125, 10.08203125, 10.8935546875, 11.705078125, 12.5166015625, 13.328125, 14.1396484375, 14.951171875, 15.7626953125, 16.57421875, 17.3857421875, 18.197265625, 19.0087890625, 19.8203125, 20.6318359375, 21.443359375, 22.2548828125, 23.06640625, 23.8779296875, 24.689453125, 25.5009765625, 26.3125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 9.0, 17.0, 17.0, 21.0, 35.0, 56.0, 91.0, 146.0, 236.0, 340.0, 655.0, 950.0, 1692.0, 2852.0, 4745.0, 8020.0, 13380.0, 22244.0, 36098.0, 57711.0, 90912.0, 139418.0, 203197.0, 282004.0, 367576.0, 442338.0, 482714.0, 475844.0, 425993.0, 345635.0, 263620.0, 185393.0, 126242.0, 82282.0, 51021.0, 31837.0, 19567.0, 11857.0, 6911.0, 4241.0, 2466.0, 1529.0, 980.0, 514.0, 308.0, 223.0, 126.0, 88.0, 57.0, 36.0, 17.0, 11.0, 13.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.765625, -19.12548828125, -18.4853515625, -17.84521484375, -17.205078125, -16.56494140625, -15.9248046875, -15.28466796875, -14.64453125, -14.00439453125, -13.3642578125, -12.72412109375, -12.083984375, -11.44384765625, -10.8037109375, -10.16357421875, -9.5234375, -8.88330078125, -8.2431640625, -7.60302734375, -6.962890625, -6.32275390625, -5.6826171875, -5.04248046875, -4.40234375, -3.76220703125, -3.1220703125, -2.48193359375, -1.841796875, -1.20166015625, -0.5615234375, 0.07861328125, 0.71875, 1.35888671875, 1.9990234375, 2.63916015625, 3.279296875, 3.91943359375, 4.5595703125, 5.19970703125, 5.83984375, 6.47998046875, 7.1201171875, 7.76025390625, 8.400390625, 9.04052734375, 9.6806640625, 10.32080078125, 10.9609375, 11.60107421875, 12.2412109375, 12.88134765625, 13.521484375, 14.16162109375, 14.8017578125, 15.44189453125, 16.08203125, 16.72216796875, 17.3623046875, 18.00244140625, 18.642578125, 19.28271484375, 19.9228515625, 20.56298828125, 21.203125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 10.0, 5.0, 5.0, 5.0, 22.0, 21.0, 29.0, 45.0, 47.0, 62.0, 74.0, 104.0, 120.0, 147.0, 185.0, 187.0, 210.0, 213.0, 247.0, 249.0, 268.0, 200.0, 241.0, 234.0, 191.0, 197.0, 172.0, 121.0, 104.0, 96.0, 74.0, 58.0, 34.0, 30.0, 20.0, 19.0, 12.0, 8.0, 4.0, 6.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.5859375, -13.1600341796875, -12.734130859375, -12.3082275390625, -11.88232421875, -11.4564208984375, -11.030517578125, -10.6046142578125, -10.1787109375, -9.7528076171875, -9.326904296875, -8.9010009765625, -8.47509765625, -8.0491943359375, -7.623291015625, -7.1973876953125, -6.771484375, -6.3455810546875, -5.919677734375, -5.4937744140625, -5.06787109375, -4.6419677734375, -4.216064453125, -3.7901611328125, -3.3642578125, -2.9383544921875, -2.512451171875, -2.0865478515625, -1.66064453125, -1.2347412109375, -0.808837890625, -0.3829345703125, 0.04296875, 0.4688720703125, 0.894775390625, 1.3206787109375, 1.74658203125, 2.1724853515625, 2.598388671875, 3.0242919921875, 3.4501953125, 3.8760986328125, 4.302001953125, 4.7279052734375, 5.15380859375, 5.5797119140625, 6.005615234375, 6.4315185546875, 6.857421875, 7.2833251953125, 7.709228515625, 8.1351318359375, 8.56103515625, 8.9869384765625, 9.412841796875, 9.8387451171875, 10.2646484375, 10.6905517578125, 11.116455078125, 11.5423583984375, 11.96826171875, 12.3941650390625, 12.820068359375, 13.2459716796875, 13.671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 4.0, 10.0, 11.0, 19.0, 17.0, 21.0, 27.0, 27.0, 28.0, 32.0, 27.0, 38.0, 48.0, 29.0, 52.0, 44.0, 47.0, 38.0, 41.0, 33.0, 46.0, 35.0, 30.0, 35.0, 37.0, 24.0, 19.0, 12.0, 23.0, 22.0, 21.0, 17.0, 13.0, 7.0, 8.0, 7.0, 3.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-22.566545486450195, -21.856828689575195, -21.147111892700195, -20.437395095825195, -19.727680206298828, -19.017963409423828, -18.308246612548828, -17.598529815673828, -16.888813018798828, -16.179096221923828, -15.469379425048828, -14.759663581848145, -14.049946784973145, -13.340229988098145, -12.630514144897461, -11.920797348022461, -11.211080551147461, -10.501363754272461, -9.791646957397461, -9.081931114196777, -8.372214317321777, -7.662497520446777, -6.9527812004089355, -6.243064880371094, -5.533348083496094, -4.823631286621094, -4.113914966583252, -3.404198408126831, -2.69448184967041, -1.9847652912139893, -1.2750487327575684, -0.5653324127197266, 0.14438438415527344, 0.8541009426116943, 1.5638175010681152, 2.273534059524536, 2.983250617980957, 3.692967176437378, 4.402683734893799, 5.112400054931641, 5.822116851806641, 6.531833648681641, 7.241549968719482, 7.951266288757324, 8.660983085632324, 9.370699882507324, 10.080415725708008, 10.790132522583008, 11.499849319458008, 12.209566116333008, 12.919282913208008, 13.628998756408691, 14.338715553283691, 15.048432350158691, 15.758148193359375, 16.467864990234375, 17.177581787109375, 17.887298583984375, 18.597015380859375, 19.306732177734375, 20.016448974609375, 20.726163864135742, 21.435880661010742, 22.145597457885742, 22.855314254760742]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 10.0, 13.0, 10.0, 17.0, 20.0, 18.0, 17.0, 20.0, 18.0, 34.0, 34.0, 30.0, 40.0, 46.0, 42.0, 36.0, 45.0, 45.0, 40.0, 38.0, 47.0, 48.0, 40.0, 38.0, 23.0, 23.0, 29.0, 23.0, 21.0, 20.0, 13.0, 18.0, 14.0, 15.0, 10.0, 5.0, 2.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-32.794593811035156, -31.882802963256836, -30.971010208129883, -30.059219360351562, -29.14742660522461, -28.23563575744629, -27.32384490966797, -26.412052154541016, -25.500259399414062, -24.588468551635742, -23.67667579650879, -22.76488494873047, -21.853092193603516, -20.941301345825195, -20.029510498046875, -19.117717742919922, -18.2059268951416, -17.29413604736328, -16.382343292236328, -15.470552444458008, -14.558759689331055, -13.646968841552734, -12.735177040100098, -11.823385238647461, -10.911593437194824, -9.999801635742188, -9.08800983428955, -8.176218032836914, -7.2644267082214355, -6.352634906768799, -5.44084358215332, -4.529051780700684, -3.6172618865966797, -2.705470085144043, -1.7936785221099854, -0.8818869590759277, 0.029904842376708984, 0.9416966438293457, 1.8534879684448242, 2.765279769897461, 3.6770715713500977, 4.588863372802734, 5.500655174255371, 6.41244649887085, 7.324238300323486, 8.236030578613281, 9.147821426391602, 10.059613227844238, 10.971405029296875, 11.883196830749512, 12.794988632202148, 13.706779479980469, 14.618572235107422, 15.530363082885742, 16.442153930664062, 17.353946685791016, 18.26573944091797, 19.17753028869629, 20.089323043823242, 21.001113891601562, 21.912906646728516, 22.824697494506836, 23.736488342285156, 24.64828109741211, 25.56007194519043]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 16.0, 9.0, 18.0, 38.0, 48.0, 54.0, 83.0, 127.0, 187.0, 330.0, 521.0, 713.0, 1065.0, 1596.0, 2533.0, 3816.0, 5994.0, 9422.0, 14990.0, 23529.0, 38773.0, 62718.0, 103772.0, 164799.0, 206324.0, 154762.0, 96360.0, 58914.0, 36072.0, 22293.0, 13835.0, 8706.0, 5641.0, 3640.0, 2349.0, 1483.0, 1012.0, 683.0, 437.0, 290.0, 197.0, 120.0, 94.0, 65.0, 36.0, 36.0, 14.0, 17.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0], "bins": [-5.3203125, -5.165771484375, -5.01123046875, -4.856689453125, -4.7021484375, -4.547607421875, -4.39306640625, -4.238525390625, -4.083984375, -3.929443359375, -3.77490234375, -3.620361328125, -3.4658203125, -3.311279296875, -3.15673828125, -3.002197265625, -2.84765625, -2.693115234375, -2.53857421875, -2.384033203125, -2.2294921875, -2.074951171875, -1.92041015625, -1.765869140625, -1.611328125, -1.456787109375, -1.30224609375, -1.147705078125, -0.9931640625, -0.838623046875, -0.68408203125, -0.529541015625, -0.375, -0.220458984375, -0.06591796875, 0.088623046875, 0.2431640625, 0.397705078125, 0.55224609375, 0.706787109375, 0.861328125, 1.015869140625, 1.17041015625, 1.324951171875, 1.4794921875, 1.634033203125, 1.78857421875, 1.943115234375, 2.09765625, 2.252197265625, 2.40673828125, 2.561279296875, 2.7158203125, 2.870361328125, 3.02490234375, 3.179443359375, 3.333984375, 3.488525390625, 3.64306640625, 3.797607421875, 3.9521484375, 4.106689453125, 4.26123046875, 4.415771484375, 4.5703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 6.0, 13.0, 15.0, 8.0, 13.0, 22.0, 13.0, 16.0, 21.0, 31.0, 36.0, 27.0, 37.0, 38.0, 36.0, 44.0, 41.0, 45.0, 49.0, 45.0, 47.0, 37.0, 45.0, 38.0, 33.0, 31.0, 21.0, 31.0, 28.0, 19.0, 20.0, 14.0, 7.0, 16.0, 9.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-33.78125, -32.843505859375, -31.90576171875, -30.968017578125, -30.0302734375, -29.092529296875, -28.15478515625, -27.217041015625, -26.279296875, -25.341552734375, -24.40380859375, -23.466064453125, -22.5283203125, -21.590576171875, -20.65283203125, -19.715087890625, -18.77734375, -17.839599609375, -16.90185546875, -15.964111328125, -15.0263671875, -14.088623046875, -13.15087890625, -12.213134765625, -11.275390625, -10.337646484375, -9.39990234375, -8.462158203125, -7.5244140625, -6.586669921875, -5.64892578125, -4.711181640625, -3.7734375, -2.835693359375, -1.89794921875, -0.960205078125, -0.0224609375, 0.915283203125, 1.85302734375, 2.790771484375, 3.728515625, 4.666259765625, 5.60400390625, 6.541748046875, 7.4794921875, 8.417236328125, 9.35498046875, 10.292724609375, 11.23046875, 12.168212890625, 13.10595703125, 14.043701171875, 14.9814453125, 15.919189453125, 16.85693359375, 17.794677734375, 18.732421875, 19.670166015625, 20.60791015625, 21.545654296875, 22.4833984375, 23.421142578125, 24.35888671875, 25.296630859375, 26.234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 20.0, 17.0, 28.0, 43.0, 59.0, 107.0, 144.0, 241.0, 340.0, 467.0, 686.0, 964.0, 1391.0, 2002.0, 2868.0, 4240.0, 6749.0, 10383.0, 15827.0, 25021.0, 40937.0, 66970.0, 110326.0, 169883.0, 199114.0, 146750.0, 91705.0, 55668.0, 34347.0, 21162.0, 13514.0, 8652.0, 5821.0, 3854.0, 2519.0, 1795.0, 1172.0, 875.0, 575.0, 396.0, 277.0, 217.0, 126.0, 93.0, 70.0, 47.0, 28.0, 18.0, 14.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.779296875, -3.662353515625, -3.54541015625, -3.428466796875, -3.3115234375, -3.194580078125, -3.07763671875, -2.960693359375, -2.84375, -2.726806640625, -2.60986328125, -2.492919921875, -2.3759765625, -2.259033203125, -2.14208984375, -2.025146484375, -1.908203125, -1.791259765625, -1.67431640625, -1.557373046875, -1.4404296875, -1.323486328125, -1.20654296875, -1.089599609375, -0.97265625, -0.855712890625, -0.73876953125, -0.621826171875, -0.5048828125, -0.387939453125, -0.27099609375, -0.154052734375, -0.037109375, 0.079833984375, 0.19677734375, 0.313720703125, 0.4306640625, 0.547607421875, 0.66455078125, 0.781494140625, 0.8984375, 1.015380859375, 1.13232421875, 1.249267578125, 1.3662109375, 1.483154296875, 1.60009765625, 1.717041015625, 1.833984375, 1.950927734375, 2.06787109375, 2.184814453125, 2.3017578125, 2.418701171875, 2.53564453125, 2.652587890625, 2.76953125, 2.886474609375, 3.00341796875, 3.120361328125, 3.2373046875, 3.354248046875, 3.47119140625, 3.588134765625, 3.705078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 5.0, 2.0, 8.0, 6.0, 10.0, 7.0, 11.0, 17.0, 12.0, 16.0, 17.0, 35.0, 20.0, 25.0, 29.0, 33.0, 36.0, 44.0, 35.0, 39.0, 37.0, 46.0, 42.0, 32.0, 45.0, 38.0, 33.0, 39.0, 32.0, 28.0, 39.0, 25.0, 19.0, 25.0, 25.0, 15.0, 12.0, 12.0, 14.0, 10.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.84375, -21.210693359375, -20.57763671875, -19.944580078125, -19.3115234375, -18.678466796875, -18.04541015625, -17.412353515625, -16.779296875, -16.146240234375, -15.51318359375, -14.880126953125, -14.2470703125, -13.614013671875, -12.98095703125, -12.347900390625, -11.71484375, -11.081787109375, -10.44873046875, -9.815673828125, -9.1826171875, -8.549560546875, -7.91650390625, -7.283447265625, -6.650390625, -6.017333984375, -5.38427734375, -4.751220703125, -4.1181640625, -3.485107421875, -2.85205078125, -2.218994140625, -1.5859375, -0.952880859375, -0.31982421875, 0.313232421875, 0.9462890625, 1.579345703125, 2.21240234375, 2.845458984375, 3.478515625, 4.111572265625, 4.74462890625, 5.377685546875, 6.0107421875, 6.643798828125, 7.27685546875, 7.909912109375, 8.54296875, 9.176025390625, 9.80908203125, 10.442138671875, 11.0751953125, 11.708251953125, 12.34130859375, 12.974365234375, 13.607421875, 14.240478515625, 14.87353515625, 15.506591796875, 16.1396484375, 16.772705078125, 17.40576171875, 18.038818359375, 18.671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 8.0, 15.0, 8.0, 24.0, 35.0, 44.0, 86.0, 104.0, 153.0, 246.0, 333.0, 509.0, 813.0, 1322.0, 1939.0, 3269.0, 5407.0, 9133.0, 15977.0, 30446.0, 60145.0, 128299.0, 291730.0, 264157.0, 114241.0, 54634.0, 28158.0, 15300.0, 8607.0, 4956.0, 3070.0, 1858.0, 1208.0, 801.0, 529.0, 351.0, 212.0, 154.0, 104.0, 46.0, 44.0, 16.0, 26.0, 6.0, 15.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.4072265625, -0.3940620422363281, -0.38089752197265625, -0.3677330017089844, -0.3545684814453125, -0.3414039611816406, -0.32823944091796875, -0.3150749206542969, -0.301910400390625, -0.2887458801269531, -0.27558135986328125, -0.2624168395996094, -0.2492523193359375, -0.23608779907226562, -0.22292327880859375, -0.20975875854492188, -0.19659423828125, -0.18342971801757812, -0.17026519775390625, -0.15710067749023438, -0.1439361572265625, -0.13077163696289062, -0.11760711669921875, -0.10444259643554688, -0.091278076171875, -0.07811355590820312, -0.06494903564453125, -0.051784515380859375, -0.0386199951171875, -0.025455474853515625, -0.01229095458984375, 0.000873565673828125, 0.0140380859375, 0.027202606201171875, 0.04036712646484375, 0.053531646728515625, 0.0666961669921875, 0.07986068725585938, 0.09302520751953125, 0.10618972778320312, 0.119354248046875, 0.13251876831054688, 0.14568328857421875, 0.15884780883789062, 0.1720123291015625, 0.18517684936523438, 0.19834136962890625, 0.21150588989257812, 0.22467041015625, 0.23783493041992188, 0.25099945068359375, 0.2641639709472656, 0.2773284912109375, 0.2904930114746094, 0.30365753173828125, 0.3168220520019531, 0.329986572265625, 0.3431510925292969, 0.35631561279296875, 0.3694801330566406, 0.3826446533203125, 0.3958091735839844, 0.40897369384765625, 0.4221382141113281, 0.435302734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 13.0, 12.0, 25.0, 20.0, 45.0, 40.0, 47.0, 59.0, 58.0, 76.0, 83.0, 62.0, 76.0, 75.0, 56.0, 42.0, 31.0, 25.0, 37.0, 20.0, 19.0, 17.0, 9.0, 4.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.638071060180664e-05, -9.363610297441483e-05, -9.089149534702301e-05, -8.81468877196312e-05, -8.540228009223938e-05, -8.265767246484756e-05, -7.991306483745575e-05, -7.716845721006393e-05, -7.442384958267212e-05, -7.16792419552803e-05, -6.893463432788849e-05, -6.619002670049667e-05, -6.344541907310486e-05, -6.070081144571304e-05, -5.795620381832123e-05, -5.521159619092941e-05, -5.24669885635376e-05, -4.972238093614578e-05, -4.697777330875397e-05, -4.423316568136215e-05, -4.148855805397034e-05, -3.874395042657852e-05, -3.5999342799186707e-05, -3.325473517179489e-05, -3.0510127544403076e-05, -2.776551991701126e-05, -2.5020912289619446e-05, -2.227630466222763e-05, -1.9531697034835815e-05, -1.6787089407444e-05, -1.4042481780052185e-05, -1.129787415266037e-05, -8.553266525268555e-06, -5.8086588978767395e-06, -3.0640512704849243e-06, -3.1944364309310913e-07, 2.425163984298706e-06, 5.169771611690521e-06, 7.914379239082336e-06, 1.0658986866474152e-05, 1.3403594493865967e-05, 1.6148202121257782e-05, 1.8892809748649597e-05, 2.1637417376041412e-05, 2.4382025003433228e-05, 2.7126632630825043e-05, 2.9871240258216858e-05, 3.261584788560867e-05, 3.536045551300049e-05, 3.8105063140392303e-05, 4.084967076778412e-05, 4.3594278395175934e-05, 4.633888602256775e-05, 4.9083493649959564e-05, 5.182810127735138e-05, 5.4572708904743195e-05, 5.731731653213501e-05, 6.0061924159526825e-05, 6.280653178691864e-05, 6.555113941431046e-05, 6.829574704170227e-05, 7.104035466909409e-05, 7.37849622964859e-05, 7.652956992387772e-05, 7.927417755126953e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 10.0, 13.0, 19.0, 29.0, 45.0, 53.0, 84.0, 111.0, 147.0, 188.0, 284.0, 401.0, 565.0, 773.0, 1031.0, 1473.0, 1988.0, 2952.0, 4091.0, 5925.0, 8667.0, 12880.0, 19325.0, 30095.0, 48167.0, 80823.0, 147926.0, 292938.0, 158100.0, 85087.0, 50282.0, 31013.0, 19809.0, 13231.0, 9032.0, 6103.0, 4352.0, 3017.0, 2097.0, 1586.0, 1086.0, 780.0, 574.0, 400.0, 297.0, 202.0, 156.0, 107.0, 74.0, 52.0, 38.0, 24.0, 12.0, 19.0, 15.0, 3.0, 9.0, 3.0, 1.0], "bins": [-1.1396484375, -1.1046295166015625, -1.069610595703125, -1.0345916748046875, -0.99957275390625, -0.9645538330078125, -0.929534912109375, -0.8945159912109375, -0.8594970703125, -0.8244781494140625, -0.789459228515625, -0.7544403076171875, -0.71942138671875, -0.6844024658203125, -0.649383544921875, -0.6143646240234375, -0.579345703125, -0.5443267822265625, -0.509307861328125, -0.4742889404296875, -0.43927001953125, -0.4042510986328125, -0.369232177734375, -0.3342132568359375, -0.2991943359375, -0.2641754150390625, -0.229156494140625, -0.1941375732421875, -0.15911865234375, -0.1240997314453125, -0.089080810546875, -0.0540618896484375, -0.01904296875, 0.0159759521484375, 0.050994873046875, 0.0860137939453125, 0.12103271484375, 0.1560516357421875, 0.191070556640625, 0.2260894775390625, 0.2611083984375, 0.2961273193359375, 0.331146240234375, 0.3661651611328125, 0.40118408203125, 0.4362030029296875, 0.471221923828125, 0.5062408447265625, 0.541259765625, 0.5762786865234375, 0.611297607421875, 0.6463165283203125, 0.68133544921875, 0.7163543701171875, 0.751373291015625, 0.7863922119140625, 0.8214111328125, 0.8564300537109375, 0.891448974609375, 0.9264678955078125, 0.96148681640625, 0.9965057373046875, 1.031524658203125, 1.0665435791015625, 1.1015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 15.0, 9.0, 10.0, 18.0, 15.0, 24.0, 23.0, 33.0, 39.0, 39.0, 36.0, 51.0, 45.0, 47.0, 42.0, 50.0, 52.0, 27.0, 42.0, 56.0, 39.0, 35.0, 33.0, 33.0, 27.0, 14.0, 29.0, 13.0, 20.0, 22.0, 6.0, 7.0, 4.0, 11.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6687393188476562, -0.6470489501953125, -0.6253585815429688, -0.603668212890625, -0.5819778442382812, -0.5602874755859375, -0.5385971069335938, -0.51690673828125, -0.49521636962890625, -0.4735260009765625, -0.45183563232421875, -0.430145263671875, -0.40845489501953125, -0.3867645263671875, -0.36507415771484375, -0.3433837890625, -0.32169342041015625, -0.3000030517578125, -0.27831268310546875, -0.256622314453125, -0.23493194580078125, -0.2132415771484375, -0.19155120849609375, -0.16986083984375, -0.14817047119140625, -0.1264801025390625, -0.10478973388671875, -0.083099365234375, -0.06140899658203125, -0.0397186279296875, -0.01802825927734375, 0.003662109375, 0.02535247802734375, 0.0470428466796875, 0.06873321533203125, 0.090423583984375, 0.11211395263671875, 0.1338043212890625, 0.15549468994140625, 0.17718505859375, 0.19887542724609375, 0.2205657958984375, 0.24225616455078125, 0.263946533203125, 0.28563690185546875, 0.3073272705078125, 0.32901763916015625, 0.3507080078125, 0.37239837646484375, 0.3940887451171875, 0.41577911376953125, 0.437469482421875, 0.45915985107421875, 0.4808502197265625, 0.5025405883789062, 0.52423095703125, 0.5459213256835938, 0.5676116943359375, 0.5893020629882812, 0.610992431640625, 0.6326828002929688, 0.6543731689453125, 0.6760635375976562, 0.69775390625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 1.0, 8.0, 7.0, 9.0, 8.0, 17.0, 16.0, 18.0, 27.0, 21.0, 35.0, 28.0, 24.0, 40.0, 41.0, 43.0, 39.0, 56.0, 40.0, 47.0, 29.0, 47.0, 44.0, 37.0, 28.0, 33.0, 40.0, 24.0, 20.0, 21.0, 22.0, 24.0, 16.0, 19.0, 13.0, 12.0, 10.0, 3.0, 7.0, 2.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-21.998687744140625, -21.287479400634766, -20.57627296447754, -19.86506462097168, -19.15385627746582, -18.442649841308594, -17.731441497802734, -17.020233154296875, -16.309024810791016, -15.597817420959473, -14.886609077453613, -14.17540168762207, -13.464193344116211, -12.752985954284668, -12.041778564453125, -11.330570220947266, -10.619363784790039, -9.908156394958496, -9.196948051452637, -8.485740661621094, -7.774532794952393, -7.063324928283691, -6.352117538452148, -5.640909671783447, -4.929701805114746, -4.218493938446045, -3.507286310195923, -2.796078681945801, -2.0848708152770996, -1.3736629486083984, -0.6624555587768555, 0.0487523078918457, 0.7599620819091797, 1.4711698293685913, 2.182377576828003, 2.893585205078125, 3.604793071746826, 4.316000938415527, 5.02720832824707, 5.7384161949157715, 6.449624061584473, 7.160831928253174, 7.872039794921875, 8.583247184753418, 9.294454574584961, 10.00566291809082, 10.716870307922363, 11.428077697753906, 12.139286041259766, 12.850493431091309, 13.561701774597168, 14.272909164428711, 14.98411750793457, 15.695324897766113, 16.406532287597656, 17.117740631103516, 17.828948974609375, 18.540157318115234, 19.25136375427246, 19.96257209777832, 20.67378044128418, 21.384986877441406, 22.096195220947266, 22.807403564453125, 23.51861000061035]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 8.0, 16.0, 9.0, 16.0, 22.0, 19.0, 14.0, 19.0, 27.0, 21.0, 42.0, 25.0, 37.0, 53.0, 45.0, 35.0, 44.0, 48.0, 38.0, 38.0, 47.0, 49.0, 38.0, 37.0, 28.0, 26.0, 27.0, 17.0, 29.0, 14.0, 20.0, 15.0, 11.0, 20.0, 6.0, 3.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-32.71379089355469, -31.807483673095703, -30.901174545288086, -29.9948673248291, -29.088558197021484, -28.1822509765625, -27.275943756103516, -26.3696346282959, -25.46332550048828, -24.557018280029297, -23.65070915222168, -22.744401931762695, -21.838092803955078, -20.931785583496094, -20.02547836303711, -19.119169235229492, -18.212862014770508, -17.306554794311523, -16.400245666503906, -15.493938446044922, -14.587629318237305, -13.68132209777832, -12.77501392364502, -11.868705749511719, -10.962397575378418, -10.056089401245117, -9.149781227111816, -8.243473052978516, -7.337165355682373, -6.430857181549072, -5.52454948425293, -4.618241310119629, -3.711935043334961, -2.80562686920166, -1.8993189334869385, -0.9930109977722168, -0.08670282363891602, 0.8196053504943848, 1.7259130477905273, 2.632221221923828, 3.538529396057129, 4.44483757019043, 5.3511457443237305, 6.257453441619873, 7.163761615753174, 8.070070266723633, 8.976377487182617, 9.882685661315918, 10.788993835449219, 11.69530200958252, 12.60161018371582, 13.507917404174805, 14.414226531982422, 15.320533752441406, 16.22684097290039, 17.133150100708008, 18.039459228515625, 18.94576644897461, 19.852075576782227, 20.75838279724121, 21.664691925048828, 22.570999145507812, 23.477306365966797, 24.383615493774414, 25.2899227142334]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 15.0, 14.0, 19.0, 52.0, 62.0, 110.0, 194.0, 270.0, 501.0, 839.0, 1361.0, 2290.0, 3860.0, 5927.0, 9516.0, 15094.0, 23730.0, 35654.0, 52885.0, 72420.0, 94124.0, 112422.0, 121855.0, 118929.0, 104563.0, 84320.0, 62879.0, 43681.0, 29623.0, 19234.0, 12253.0, 7738.0, 4669.0, 2833.0, 1824.0, 1078.0, 695.0, 403.0, 256.0, 127.0, 93.0, 60.0, 42.0, 10.0, 11.0, 15.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.576416015625, -16.96533203125, -16.354248046875, -15.7431640625, -15.132080078125, -14.52099609375, -13.909912109375, -13.298828125, -12.687744140625, -12.07666015625, -11.465576171875, -10.8544921875, -10.243408203125, -9.63232421875, -9.021240234375, -8.41015625, -7.799072265625, -7.18798828125, -6.576904296875, -5.9658203125, -5.354736328125, -4.74365234375, -4.132568359375, -3.521484375, -2.910400390625, -2.29931640625, -1.688232421875, -1.0771484375, -0.466064453125, 0.14501953125, 0.756103515625, 1.3671875, 1.978271484375, 2.58935546875, 3.200439453125, 3.8115234375, 4.422607421875, 5.03369140625, 5.644775390625, 6.255859375, 6.866943359375, 7.47802734375, 8.089111328125, 8.7001953125, 9.311279296875, 9.92236328125, 10.533447265625, 11.14453125, 11.755615234375, 12.36669921875, 12.977783203125, 13.5888671875, 14.199951171875, 14.81103515625, 15.422119140625, 16.033203125, 16.644287109375, 17.25537109375, 17.866455078125, 18.4775390625, 19.088623046875, 19.69970703125, 20.310791015625, 20.921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 7.0, 14.0, 14.0, 11.0, 18.0, 16.0, 25.0, 24.0, 24.0, 32.0, 26.0, 33.0, 34.0, 41.0, 41.0, 40.0, 40.0, 42.0, 42.0, 48.0, 36.0, 48.0, 37.0, 37.0, 30.0, 33.0, 24.0, 29.0, 22.0, 20.0, 17.0, 10.0, 19.0, 11.0, 12.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-31.6875, -30.821044921875, -29.95458984375, -29.088134765625, -28.2216796875, -27.355224609375, -26.48876953125, -25.622314453125, -24.755859375, -23.889404296875, -23.02294921875, -22.156494140625, -21.2900390625, -20.423583984375, -19.55712890625, -18.690673828125, -17.82421875, -16.957763671875, -16.09130859375, -15.224853515625, -14.3583984375, -13.491943359375, -12.62548828125, -11.759033203125, -10.892578125, -10.026123046875, -9.15966796875, -8.293212890625, -7.4267578125, -6.560302734375, -5.69384765625, -4.827392578125, -3.9609375, -3.094482421875, -2.22802734375, -1.361572265625, -0.4951171875, 0.371337890625, 1.23779296875, 2.104248046875, 2.970703125, 3.837158203125, 4.70361328125, 5.570068359375, 6.4365234375, 7.302978515625, 8.16943359375, 9.035888671875, 9.90234375, 10.768798828125, 11.63525390625, 12.501708984375, 13.3681640625, 14.234619140625, 15.10107421875, 15.967529296875, 16.833984375, 17.700439453125, 18.56689453125, 19.433349609375, 20.2998046875, 21.166259765625, 22.03271484375, 22.899169921875, 23.765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 7.0, 6.0, 24.0, 29.0, 56.0, 73.0, 140.0, 198.0, 309.0, 505.0, 772.0, 1244.0, 1843.0, 2980.0, 4468.0, 7231.0, 10932.0, 16330.0, 24482.0, 35929.0, 50522.0, 68351.0, 86802.0, 102874.0, 112295.0, 111534.0, 101826.0, 86078.0, 67043.0, 49485.0, 34780.0, 23800.0, 15906.0, 10475.0, 6804.0, 4558.0, 2918.0, 1848.0, 1166.0, 680.0, 460.0, 305.0, 174.0, 135.0, 73.0, 41.0, 23.0, 18.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-20.140625, -19.547607421875, -18.95458984375, -18.361572265625, -17.7685546875, -17.175537109375, -16.58251953125, -15.989501953125, -15.396484375, -14.803466796875, -14.21044921875, -13.617431640625, -13.0244140625, -12.431396484375, -11.83837890625, -11.245361328125, -10.65234375, -10.059326171875, -9.46630859375, -8.873291015625, -8.2802734375, -7.687255859375, -7.09423828125, -6.501220703125, -5.908203125, -5.315185546875, -4.72216796875, -4.129150390625, -3.5361328125, -2.943115234375, -2.35009765625, -1.757080078125, -1.1640625, -0.571044921875, 0.02197265625, 0.614990234375, 1.2080078125, 1.801025390625, 2.39404296875, 2.987060546875, 3.580078125, 4.173095703125, 4.76611328125, 5.359130859375, 5.9521484375, 6.545166015625, 7.13818359375, 7.731201171875, 8.32421875, 8.917236328125, 9.51025390625, 10.103271484375, 10.6962890625, 11.289306640625, 11.88232421875, 12.475341796875, 13.068359375, 13.661376953125, 14.25439453125, 14.847412109375, 15.4404296875, 16.033447265625, 16.62646484375, 17.219482421875, 17.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 10.0, 7.0, 5.0, 12.0, 20.0, 11.0, 23.0, 13.0, 21.0, 15.0, 28.0, 26.0, 34.0, 40.0, 34.0, 29.0, 23.0, 49.0, 36.0, 31.0, 46.0, 44.0, 37.0, 41.0, 27.0, 27.0, 39.0, 32.0, 28.0, 27.0, 29.0, 16.0, 18.0, 20.0, 14.0, 18.0, 8.0, 13.0, 13.0, 8.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.609375, -17.076904296875, -16.54443359375, -16.011962890625, -15.4794921875, -14.947021484375, -14.41455078125, -13.882080078125, -13.349609375, -12.817138671875, -12.28466796875, -11.752197265625, -11.2197265625, -10.687255859375, -10.15478515625, -9.622314453125, -9.08984375, -8.557373046875, -8.02490234375, -7.492431640625, -6.9599609375, -6.427490234375, -5.89501953125, -5.362548828125, -4.830078125, -4.297607421875, -3.76513671875, -3.232666015625, -2.7001953125, -2.167724609375, -1.63525390625, -1.102783203125, -0.5703125, -0.037841796875, 0.49462890625, 1.027099609375, 1.5595703125, 2.092041015625, 2.62451171875, 3.156982421875, 3.689453125, 4.221923828125, 4.75439453125, 5.286865234375, 5.8193359375, 6.351806640625, 6.88427734375, 7.416748046875, 7.94921875, 8.481689453125, 9.01416015625, 9.546630859375, 10.0791015625, 10.611572265625, 11.14404296875, 11.676513671875, 12.208984375, 12.741455078125, 13.27392578125, 13.806396484375, 14.3388671875, 14.871337890625, 15.40380859375, 15.936279296875, 16.46875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 11.0, 5.0, 16.0, 23.0, 24.0, 42.0, 64.0, 121.0, 179.0, 273.0, 456.0, 721.0, 1262.0, 1959.0, 3221.0, 5392.0, 8980.0, 14900.0, 24119.0, 39201.0, 60609.0, 88794.0, 118713.0, 140765.0, 143328.0, 124643.0, 94584.0, 65621.0, 42470.0, 26917.0, 16213.0, 9641.0, 6040.0, 3692.0, 2146.0, 1267.0, 834.0, 491.0, 299.0, 191.0, 121.0, 79.0, 40.0, 20.0, 23.0, 17.0, 12.0, 3.0, 6.0, 4.0, 1.0, 1.0, 3.0], "bins": [-7.01953125, -6.81951904296875, -6.6195068359375, -6.41949462890625, -6.219482421875, -6.01947021484375, -5.8194580078125, -5.61944580078125, -5.41943359375, -5.21942138671875, -5.0194091796875, -4.81939697265625, -4.619384765625, -4.41937255859375, -4.2193603515625, -4.01934814453125, -3.8193359375, -3.61932373046875, -3.4193115234375, -3.21929931640625, -3.019287109375, -2.81927490234375, -2.6192626953125, -2.41925048828125, -2.21923828125, -2.01922607421875, -1.8192138671875, -1.61920166015625, -1.419189453125, -1.21917724609375, -1.0191650390625, -0.81915283203125, -0.619140625, -0.41912841796875, -0.2191162109375, -0.01910400390625, 0.180908203125, 0.38092041015625, 0.5809326171875, 0.78094482421875, 0.98095703125, 1.18096923828125, 1.3809814453125, 1.58099365234375, 1.781005859375, 1.98101806640625, 2.1810302734375, 2.38104248046875, 2.5810546875, 2.78106689453125, 2.9810791015625, 3.18109130859375, 3.381103515625, 3.58111572265625, 3.7811279296875, 3.98114013671875, 4.18115234375, 4.38116455078125, 4.5811767578125, 4.78118896484375, 4.981201171875, 5.18121337890625, 5.3812255859375, 5.58123779296875, 5.78125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 16.0, 12.0, 19.0, 25.0, 29.0, 49.0, 44.0, 57.0, 64.0, 76.0, 65.0, 67.0, 65.0, 52.0, 56.0, 58.0, 43.0, 34.0, 29.0, 32.0, 22.0, 15.0, 10.0, 9.0, 6.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008831024169921875, -0.0008567050099372864, -0.0008303076028823853, -0.0008039101958274841, -0.000777512788772583, -0.0007511153817176819, -0.0007247179746627808, -0.0006983205676078796, -0.0006719231605529785, -0.0006455257534980774, -0.0006191283464431763, -0.0005927309393882751, -0.000566333532333374, -0.0005399361252784729, -0.0005135387182235718, -0.00048714131116867065, -0.00046074390411376953, -0.0004343464970588684, -0.0004079490900039673, -0.00038155168294906616, -0.00035515427589416504, -0.0003287568688392639, -0.0003023594617843628, -0.00027596205472946167, -0.00024956464767456055, -0.00022316724061965942, -0.0001967698335647583, -0.00017037242650985718, -0.00014397501945495605, -0.00011757761240005493, -9.118020534515381e-05, -6.478279829025269e-05, -3.838539123535156e-05, -1.198798418045044e-05, 1.4409422874450684e-05, 4.080682992935181e-05, 6.720423698425293e-05, 9.360164403915405e-05, 0.00011999905109405518, 0.0001463964581489563, 0.00017279386520385742, 0.00019919127225875854, 0.00022558867931365967, 0.0002519860863685608, 0.0002783834934234619, 0.00030478090047836304, 0.00033117830753326416, 0.0003575757145881653, 0.0003839731216430664, 0.00041037052869796753, 0.00043676793575286865, 0.0004631653428077698, 0.0004895627498626709, 0.000515960156917572, 0.0005423575639724731, 0.0005687549710273743, 0.0005951523780822754, 0.0006215497851371765, 0.0006479471921920776, 0.0006743445992469788, 0.0007007420063018799, 0.000727139413356781, 0.0007535368204116821, 0.0007799342274665833, 0.0008063316345214844]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 9.0, 10.0, 6.0, 8.0, 4.0, 16.0, 20.0, 39.0, 61.0, 98.0, 157.0, 219.0, 306.0, 471.0, 790.0, 1219.0, 1855.0, 2919.0, 4602.0, 7197.0, 11344.0, 17842.0, 27339.0, 42078.0, 61484.0, 85479.0, 109435.0, 126277.0, 130193.0, 116621.0, 93706.0, 69282.0, 48193.0, 32146.0, 20457.0, 13275.0, 8359.0, 5509.0, 3352.0, 2130.0, 1442.0, 883.0, 577.0, 436.0, 264.0, 160.0, 101.0, 63.0, 41.0, 33.0, 24.0, 16.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.30078125, -6.11083984375, -5.9208984375, -5.73095703125, -5.541015625, -5.35107421875, -5.1611328125, -4.97119140625, -4.78125, -4.59130859375, -4.4013671875, -4.21142578125, -4.021484375, -3.83154296875, -3.6416015625, -3.45166015625, -3.26171875, -3.07177734375, -2.8818359375, -2.69189453125, -2.501953125, -2.31201171875, -2.1220703125, -1.93212890625, -1.7421875, -1.55224609375, -1.3623046875, -1.17236328125, -0.982421875, -0.79248046875, -0.6025390625, -0.41259765625, -0.22265625, -0.03271484375, 0.1572265625, 0.34716796875, 0.537109375, 0.72705078125, 0.9169921875, 1.10693359375, 1.296875, 1.48681640625, 1.6767578125, 1.86669921875, 2.056640625, 2.24658203125, 2.4365234375, 2.62646484375, 2.81640625, 3.00634765625, 3.1962890625, 3.38623046875, 3.576171875, 3.76611328125, 3.9560546875, 4.14599609375, 4.3359375, 4.52587890625, 4.7158203125, 4.90576171875, 5.095703125, 5.28564453125, 5.4755859375, 5.66552734375, 5.85546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 4.0, 5.0, 4.0, 9.0, 12.0, 5.0, 11.0, 12.0, 14.0, 16.0, 34.0, 34.0, 35.0, 56.0, 42.0, 41.0, 49.0, 48.0, 65.0, 45.0, 65.0, 48.0, 36.0, 44.0, 43.0, 37.0, 34.0, 31.0, 19.0, 14.0, 18.0, 11.0, 16.0, 8.0, 10.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.10546875, -3.01123046875, -2.9169921875, -2.82275390625, -2.728515625, -2.63427734375, -2.5400390625, -2.44580078125, -2.3515625, -2.25732421875, -2.1630859375, -2.06884765625, -1.974609375, -1.88037109375, -1.7861328125, -1.69189453125, -1.59765625, -1.50341796875, -1.4091796875, -1.31494140625, -1.220703125, -1.12646484375, -1.0322265625, -0.93798828125, -0.84375, -0.74951171875, -0.6552734375, -0.56103515625, -0.466796875, -0.37255859375, -0.2783203125, -0.18408203125, -0.08984375, 0.00439453125, 0.0986328125, 0.19287109375, 0.287109375, 0.38134765625, 0.4755859375, 0.56982421875, 0.6640625, 0.75830078125, 0.8525390625, 0.94677734375, 1.041015625, 1.13525390625, 1.2294921875, 1.32373046875, 1.41796875, 1.51220703125, 1.6064453125, 1.70068359375, 1.794921875, 1.88916015625, 1.9833984375, 2.07763671875, 2.171875, 2.26611328125, 2.3603515625, 2.45458984375, 2.548828125, 2.64306640625, 2.7373046875, 2.83154296875, 2.92578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 3.0, 8.0, 9.0, 12.0, 19.0, 21.0, 19.0, 25.0, 38.0, 37.0, 37.0, 49.0, 40.0, 53.0, 54.0, 61.0, 45.0, 45.0, 40.0, 58.0, 35.0, 47.0, 32.0, 28.0, 29.0, 20.0, 18.0, 22.0, 18.0, 22.0, 14.0, 8.0, 8.0, 4.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.414396286010742, -24.58373260498047, -23.753070831298828, -22.922407150268555, -22.09174346923828, -21.26108169555664, -20.430418014526367, -19.599754333496094, -18.769092559814453, -17.93842887878418, -17.10776710510254, -16.277103424072266, -15.446440696716309, -14.615777969360352, -13.785114288330078, -12.954451560974121, -12.123788833618164, -11.293126106262207, -10.46246337890625, -9.631799697875977, -8.80113697052002, -7.9704742431640625, -7.139811038970947, -6.309147834777832, -5.478485107421875, -4.647822380065918, -3.8171591758728027, -2.9864962100982666, -2.1558332443237305, -1.3251705169677734, -0.4945073127746582, 0.33615589141845703, 1.1668205261230469, 1.997483491897583, 2.828146457672119, 3.6588094234466553, 4.489472389221191, 5.320135116577148, 6.150798320770264, 6.981461524963379, 7.812124252319336, 8.642786979675293, 9.47344970703125, 10.304113388061523, 11.13477611541748, 11.965438842773438, 12.796102523803711, 13.626765251159668, 14.457427978515625, 15.288090705871582, 16.11875343322754, 16.949417114257812, 17.780078887939453, 18.610742568969727, 19.44140625, 20.27206802368164, 21.102731704711914, 21.933395385742188, 22.764057159423828, 23.5947208404541, 24.425384521484375, 25.256046295166016, 26.08670997619629, 26.917373657226562, 27.748035430908203]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 9.0, 6.0, 3.0, 5.0, 9.0, 14.0, 7.0, 18.0, 12.0, 16.0, 24.0, 22.0, 19.0, 36.0, 28.0, 31.0, 28.0, 35.0, 32.0, 31.0, 40.0, 30.0, 34.0, 38.0, 45.0, 51.0, 47.0, 34.0, 33.0, 27.0, 18.0, 25.0, 29.0, 20.0, 18.0, 24.0, 22.0, 11.0, 12.0, 6.0, 8.0, 8.0, 6.0, 5.0, 6.0, 9.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-28.657997131347656, -27.8220157623291, -26.986034393310547, -26.150053024291992, -25.314071655273438, -24.478090286254883, -23.642108917236328, -22.806129455566406, -21.97014617919922, -21.134164810180664, -20.29818344116211, -19.462202072143555, -18.626220703125, -17.790239334106445, -16.95425796508789, -16.11827850341797, -15.282297134399414, -14.44631576538086, -13.610334396362305, -12.77435302734375, -11.938371658325195, -11.10239028930664, -10.266409873962402, -9.430428504943848, -8.594447135925293, -7.758465766906738, -6.922484397888184, -6.086503505706787, -5.250522136688232, -4.414540767669678, -3.5785598754882812, -2.7425785064697266, -1.906595230102539, -1.070613980293274, -0.2346327304840088, 0.6013484001159668, 1.4373297691345215, 2.273311138153076, 3.1092920303344727, 3.9452733993530273, 4.781254768371582, 5.617236137390137, 6.453217506408691, 7.289198398590088, 8.125179290771484, 8.961160659790039, 9.797142028808594, 10.633123397827148, 11.469104766845703, 12.305086135864258, 13.141067504882812, 13.977048873901367, 14.813030242919922, 15.649011611938477, 16.48499298095703, 17.320972442626953, 18.15695571899414, 18.992937088012695, 19.82891845703125, 20.664899826049805, 21.50088119506836, 22.336862564086914, 23.17284393310547, 24.00882339477539, 24.844804763793945]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 13.0, 17.0, 16.0, 23.0, 59.0, 71.0, 142.0, 233.0, 355.0, 624.0, 979.0, 1659.0, 2754.0, 4437.0, 7442.0, 12478.0, 20401.0, 33396.0, 54626.0, 87447.0, 139413.0, 213990.0, 317024.0, 432895.0, 532935.0, 567224.0, 520805.0, 415208.0, 298943.0, 199175.0, 128024.0, 80136.0, 48669.0, 29225.0, 17560.0, 10541.0, 6311.0, 3745.0, 2167.0, 1256.0, 769.0, 452.0, 271.0, 142.0, 107.0, 53.0, 24.0, 20.0, 19.0, 12.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.22705078125, -18.5947265625, -17.96240234375, -17.330078125, -16.69775390625, -16.0654296875, -15.43310546875, -14.80078125, -14.16845703125, -13.5361328125, -12.90380859375, -12.271484375, -11.63916015625, -11.0068359375, -10.37451171875, -9.7421875, -9.10986328125, -8.4775390625, -7.84521484375, -7.212890625, -6.58056640625, -5.9482421875, -5.31591796875, -4.68359375, -4.05126953125, -3.4189453125, -2.78662109375, -2.154296875, -1.52197265625, -0.8896484375, -0.25732421875, 0.375, 1.00732421875, 1.6396484375, 2.27197265625, 2.904296875, 3.53662109375, 4.1689453125, 4.80126953125, 5.43359375, 6.06591796875, 6.6982421875, 7.33056640625, 7.962890625, 8.59521484375, 9.2275390625, 9.85986328125, 10.4921875, 11.12451171875, 11.7568359375, 12.38916015625, 13.021484375, 13.65380859375, 14.2861328125, 14.91845703125, 15.55078125, 16.18310546875, 16.8154296875, 17.44775390625, 18.080078125, 18.71240234375, 19.3447265625, 19.97705078125, 20.609375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 4.0, 4.0, 6.0, 5.0, 5.0, 14.0, 8.0, 8.0, 18.0, 16.0, 18.0, 18.0, 27.0, 21.0, 34.0, 24.0, 27.0, 39.0, 30.0, 32.0, 30.0, 31.0, 32.0, 50.0, 45.0, 36.0, 38.0, 36.0, 36.0, 37.0, 26.0, 29.0, 27.0, 22.0, 21.0, 17.0, 17.0, 17.0, 18.0, 14.0, 14.0, 12.0, 4.0, 6.0, 6.0, 8.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0], "bins": [-21.421875, -20.817626953125, -20.21337890625, -19.609130859375, -19.0048828125, -18.400634765625, -17.79638671875, -17.192138671875, -16.587890625, -15.983642578125, -15.37939453125, -14.775146484375, -14.1708984375, -13.566650390625, -12.96240234375, -12.358154296875, -11.75390625, -11.149658203125, -10.54541015625, -9.941162109375, -9.3369140625, -8.732666015625, -8.12841796875, -7.524169921875, -6.919921875, -6.315673828125, -5.71142578125, -5.107177734375, -4.5029296875, -3.898681640625, -3.29443359375, -2.690185546875, -2.0859375, -1.481689453125, -0.87744140625, -0.273193359375, 0.3310546875, 0.935302734375, 1.53955078125, 2.143798828125, 2.748046875, 3.352294921875, 3.95654296875, 4.560791015625, 5.1650390625, 5.769287109375, 6.37353515625, 6.977783203125, 7.58203125, 8.186279296875, 8.79052734375, 9.394775390625, 9.9990234375, 10.603271484375, 11.20751953125, 11.811767578125, 12.416015625, 13.020263671875, 13.62451171875, 14.228759765625, 14.8330078125, 15.437255859375, 16.04150390625, 16.645751953125, 17.25]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 1.0, 9.0, 12.0, 26.0, 32.0, 65.0, 100.0, 176.0, 258.0, 431.0, 714.0, 1044.0, 1850.0, 3100.0, 5028.0, 8010.0, 12865.0, 20428.0, 32121.0, 49316.0, 74010.0, 109254.0, 154155.0, 211060.0, 273754.0, 336481.0, 388162.0, 417711.0, 417678.0, 388335.0, 334896.0, 272860.0, 210132.0, 153096.0, 108718.0, 73707.0, 49244.0, 31965.0, 20032.0, 12831.0, 8052.0, 4948.0, 3030.0, 1863.0, 1096.0, 645.0, 396.0, 234.0, 142.0, 95.0, 49.0, 35.0, 23.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.296875, -14.8187255859375, -14.340576171875, -13.8624267578125, -13.38427734375, -12.9061279296875, -12.427978515625, -11.9498291015625, -11.4716796875, -10.9935302734375, -10.515380859375, -10.0372314453125, -9.55908203125, -9.0809326171875, -8.602783203125, -8.1246337890625, -7.646484375, -7.1683349609375, -6.690185546875, -6.2120361328125, -5.73388671875, -5.2557373046875, -4.777587890625, -4.2994384765625, -3.8212890625, -3.3431396484375, -2.864990234375, -2.3868408203125, -1.90869140625, -1.4305419921875, -0.952392578125, -0.4742431640625, 0.00390625, 0.4820556640625, 0.960205078125, 1.4383544921875, 1.91650390625, 2.3946533203125, 2.872802734375, 3.3509521484375, 3.8291015625, 4.3072509765625, 4.785400390625, 5.2635498046875, 5.74169921875, 6.2198486328125, 6.697998046875, 7.1761474609375, 7.654296875, 8.1324462890625, 8.610595703125, 9.0887451171875, 9.56689453125, 10.0450439453125, 10.523193359375, 11.0013427734375, 11.4794921875, 11.9576416015625, 12.435791015625, 12.9139404296875, 13.39208984375, 13.8702392578125, 14.348388671875, 14.8265380859375, 15.3046875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 12.0, 9.0, 16.0, 17.0, 17.0, 19.0, 38.0, 37.0, 46.0, 53.0, 53.0, 76.0, 103.0, 108.0, 101.0, 116.0, 151.0, 173.0, 174.0, 178.0, 191.0, 177.0, 201.0, 179.0, 202.0, 191.0, 204.0, 161.0, 166.0, 120.0, 111.0, 109.0, 100.0, 83.0, 76.0, 56.0, 41.0, 36.0, 35.0, 25.0, 28.0, 16.0, 12.0, 15.0, 6.0, 4.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.4609375, -8.181884765625, -7.90283203125, -7.623779296875, -7.3447265625, -7.065673828125, -6.78662109375, -6.507568359375, -6.228515625, -5.949462890625, -5.67041015625, -5.391357421875, -5.1123046875, -4.833251953125, -4.55419921875, -4.275146484375, -3.99609375, -3.717041015625, -3.43798828125, -3.158935546875, -2.8798828125, -2.600830078125, -2.32177734375, -2.042724609375, -1.763671875, -1.484619140625, -1.20556640625, -0.926513671875, -0.6474609375, -0.368408203125, -0.08935546875, 0.189697265625, 0.46875, 0.747802734375, 1.02685546875, 1.305908203125, 1.5849609375, 1.864013671875, 2.14306640625, 2.422119140625, 2.701171875, 2.980224609375, 3.25927734375, 3.538330078125, 3.8173828125, 4.096435546875, 4.37548828125, 4.654541015625, 4.93359375, 5.212646484375, 5.49169921875, 5.770751953125, 6.0498046875, 6.328857421875, 6.60791015625, 6.886962890625, 7.166015625, 7.445068359375, 7.72412109375, 8.003173828125, 8.2822265625, 8.561279296875, 8.84033203125, 9.119384765625, 9.3984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 10.0, 5.0, 9.0, 11.0, 19.0, 21.0, 21.0, 35.0, 25.0, 39.0, 36.0, 36.0, 26.0, 41.0, 48.0, 48.0, 53.0, 40.0, 34.0, 40.0, 41.0, 37.0, 46.0, 40.0, 18.0, 26.0, 33.0, 21.0, 24.0, 15.0, 17.0, 15.0, 12.0, 10.0, 11.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-21.126115798950195, -20.4793758392334, -19.8326358795166, -19.185895919799805, -18.539154052734375, -17.892414093017578, -17.24567413330078, -16.598934173583984, -15.952194213867188, -15.30545425415039, -14.658714294433594, -14.01197338104248, -13.365233421325684, -12.718493461608887, -12.071752548217773, -11.425012588500977, -10.77827262878418, -10.131532669067383, -9.484792709350586, -8.838051795959473, -8.191311836242676, -7.544571876525879, -6.897831439971924, -6.251091003417969, -5.604351043701172, -4.957611083984375, -4.31087064743042, -3.664130449295044, -3.017390251159668, -2.370650053024292, -1.723909854888916, -1.077169418334961, -0.43042945861816406, 0.21631073951721191, 0.8630509376525879, 1.5097911357879639, 2.15653133392334, 2.803271532058716, 3.450011730194092, 4.096752166748047, 4.743492126464844, 5.390232086181641, 6.036972522735596, 6.683712959289551, 7.330452919006348, 7.9771928787231445, 8.623933792114258, 9.270673751831055, 9.917413711547852, 10.564153671264648, 11.210893630981445, 11.857634544372559, 12.504374504089355, 13.151114463806152, 13.797855377197266, 14.444595336914062, 15.09133529663086, 15.738075256347656, 16.384815216064453, 17.03155517578125, 17.678295135498047, 18.325037002563477, 18.971776962280273, 19.61851692199707, 20.265256881713867]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 10.0, 9.0, 11.0, 8.0, 11.0, 24.0, 13.0, 26.0, 17.0, 25.0, 18.0, 24.0, 25.0, 41.0, 29.0, 43.0, 29.0, 42.0, 39.0, 40.0, 37.0, 41.0, 32.0, 45.0, 40.0, 28.0, 37.0, 25.0, 27.0, 19.0, 19.0, 19.0, 22.0, 23.0, 16.0, 12.0, 10.0, 3.0, 15.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.80310821533203, -21.084636688232422, -20.366165161132812, -19.647693634033203, -18.929222106933594, -18.210750579833984, -17.492279052734375, -16.7738094329834, -16.05533790588379, -15.33686637878418, -14.61839485168457, -13.899923324584961, -13.181452751159668, -12.462981224060059, -11.74450969696045, -11.026039123535156, -10.30756664276123, -9.589095115661621, -8.870623588562012, -8.152153015136719, -7.433681488037109, -6.7152099609375, -5.996738433837891, -5.2782673835754395, -4.55979585647583, -3.8413245677948, -3.1228532791137695, -2.40438175201416, -1.6859104633331299, -0.9674391746520996, -0.24896764755249023, 0.46950340270996094, 1.1879749298095703, 1.9064462184906006, 2.624917507171631, 3.3433890342712402, 4.061860084533691, 4.780331611633301, 5.49880313873291, 6.217274188995361, 6.935745716094971, 7.65421724319458, 8.372688293457031, 9.09115982055664, 9.80963134765625, 10.52810287475586, 11.246574401855469, 11.965044975280762, 12.683516502380371, 13.40198802947998, 14.12045955657959, 14.838930130004883, 15.557401657104492, 16.2758731842041, 16.99434471130371, 17.71281623840332, 18.43128776550293, 19.14975929260254, 19.86823081970215, 20.586702346801758, 21.305173873901367, 22.023643493652344, 22.742115020751953, 23.460586547851562, 24.179058074951172]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 14.0, 11.0, 27.0, 26.0, 61.0, 90.0, 109.0, 166.0, 250.0, 352.0, 547.0, 869.0, 1259.0, 1806.0, 2772.0, 4325.0, 6395.0, 10046.0, 15854.0, 25526.0, 40587.0, 65603.0, 105128.0, 160218.0, 198920.0, 148289.0, 96195.0, 60895.0, 37424.0, 23056.0, 14639.0, 9431.0, 6009.0, 3939.0, 2510.0, 1722.0, 1145.0, 738.0, 506.0, 359.0, 240.0, 138.0, 114.0, 74.0, 56.0, 34.0, 28.0, 13.0, 10.0, 11.0, 2.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0], "bins": [-3.58203125, -3.467987060546875, -3.35394287109375, -3.239898681640625, -3.1258544921875, -3.011810302734375, -2.89776611328125, -2.783721923828125, -2.669677734375, -2.555633544921875, -2.44158935546875, -2.327545166015625, -2.2135009765625, -2.099456787109375, -1.98541259765625, -1.871368408203125, -1.75732421875, -1.643280029296875, -1.52923583984375, -1.415191650390625, -1.3011474609375, -1.187103271484375, -1.07305908203125, -0.959014892578125, -0.844970703125, -0.730926513671875, -0.61688232421875, -0.502838134765625, -0.3887939453125, -0.274749755859375, -0.16070556640625, -0.046661376953125, 0.0673828125, 0.181427001953125, 0.29547119140625, 0.409515380859375, 0.5235595703125, 0.637603759765625, 0.75164794921875, 0.865692138671875, 0.979736328125, 1.093780517578125, 1.20782470703125, 1.321868896484375, 1.4359130859375, 1.549957275390625, 1.66400146484375, 1.778045654296875, 1.89208984375, 2.006134033203125, 2.12017822265625, 2.234222412109375, 2.3482666015625, 2.462310791015625, 2.57635498046875, 2.690399169921875, 2.804443359375, 2.918487548828125, 3.03253173828125, 3.146575927734375, 3.2606201171875, 3.374664306640625, 3.48870849609375, 3.602752685546875, 3.716796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 14.0, 12.0, 11.0, 11.0, 11.0, 16.0, 20.0, 18.0, 20.0, 18.0, 25.0, 30.0, 37.0, 39.0, 32.0, 38.0, 46.0, 50.0, 46.0, 33.0, 41.0, 32.0, 34.0, 38.0, 28.0, 27.0, 31.0, 25.0, 30.0, 19.0, 17.0, 14.0, 16.0, 22.0, 11.0, 11.0, 13.0, 10.0, 9.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.125, -23.384765625, -22.64453125, -21.904296875, -21.1640625, -20.423828125, -19.68359375, -18.943359375, -18.203125, -17.462890625, -16.72265625, -15.982421875, -15.2421875, -14.501953125, -13.76171875, -13.021484375, -12.28125, -11.541015625, -10.80078125, -10.060546875, -9.3203125, -8.580078125, -7.83984375, -7.099609375, -6.359375, -5.619140625, -4.87890625, -4.138671875, -3.3984375, -2.658203125, -1.91796875, -1.177734375, -0.4375, 0.302734375, 1.04296875, 1.783203125, 2.5234375, 3.263671875, 4.00390625, 4.744140625, 5.484375, 6.224609375, 6.96484375, 7.705078125, 8.4453125, 9.185546875, 9.92578125, 10.666015625, 11.40625, 12.146484375, 12.88671875, 13.626953125, 14.3671875, 15.107421875, 15.84765625, 16.587890625, 17.328125, 18.068359375, 18.80859375, 19.548828125, 20.2890625, 21.029296875, 21.76953125, 22.509765625, 23.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 14.0, 17.0, 26.0, 35.0, 51.0, 66.0, 112.0, 141.0, 228.0, 355.0, 489.0, 757.0, 1174.0, 1667.0, 2470.0, 3514.0, 5169.0, 7876.0, 11737.0, 18082.0, 27845.0, 43850.0, 68515.0, 107996.0, 159745.0, 187166.0, 140707.0, 92761.0, 58604.0, 37129.0, 23685.0, 15580.0, 10253.0, 6564.0, 4581.0, 3098.0, 2118.0, 1390.0, 995.0, 630.0, 444.0, 297.0, 195.0, 146.0, 108.0, 69.0, 31.0, 35.0, 20.0, 9.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.95703125, -2.86553955078125, -2.7740478515625, -2.68255615234375, -2.591064453125, -2.49957275390625, -2.4080810546875, -2.31658935546875, -2.22509765625, -2.13360595703125, -2.0421142578125, -1.95062255859375, -1.859130859375, -1.76763916015625, -1.6761474609375, -1.58465576171875, -1.4931640625, -1.40167236328125, -1.3101806640625, -1.21868896484375, -1.127197265625, -1.03570556640625, -0.9442138671875, -0.85272216796875, -0.76123046875, -0.66973876953125, -0.5782470703125, -0.48675537109375, -0.395263671875, -0.30377197265625, -0.2122802734375, -0.12078857421875, -0.029296875, 0.06219482421875, 0.1536865234375, 0.24517822265625, 0.336669921875, 0.42816162109375, 0.5196533203125, 0.61114501953125, 0.70263671875, 0.79412841796875, 0.8856201171875, 0.97711181640625, 1.068603515625, 1.16009521484375, 1.2515869140625, 1.34307861328125, 1.4345703125, 1.52606201171875, 1.6175537109375, 1.70904541015625, 1.800537109375, 1.89202880859375, 1.9835205078125, 2.07501220703125, 2.16650390625, 2.25799560546875, 2.3494873046875, 2.44097900390625, 2.532470703125, 2.62396240234375, 2.7154541015625, 2.80694580078125, 2.8984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 8.0, 10.0, 8.0, 8.0, 14.0, 7.0, 15.0, 17.0, 23.0, 17.0, 33.0, 38.0, 33.0, 35.0, 29.0, 40.0, 41.0, 35.0, 25.0, 41.0, 41.0, 40.0, 36.0, 31.0, 42.0, 32.0, 31.0, 36.0, 31.0, 35.0, 29.0, 17.0, 17.0, 11.0, 16.0, 13.0, 11.0, 12.0, 9.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.59375, -16.082763671875, -15.57177734375, -15.060791015625, -14.5498046875, -14.038818359375, -13.52783203125, -13.016845703125, -12.505859375, -11.994873046875, -11.48388671875, -10.972900390625, -10.4619140625, -9.950927734375, -9.43994140625, -8.928955078125, -8.41796875, -7.906982421875, -7.39599609375, -6.885009765625, -6.3740234375, -5.863037109375, -5.35205078125, -4.841064453125, -4.330078125, -3.819091796875, -3.30810546875, -2.797119140625, -2.2861328125, -1.775146484375, -1.26416015625, -0.753173828125, -0.2421875, 0.268798828125, 0.77978515625, 1.290771484375, 1.8017578125, 2.312744140625, 2.82373046875, 3.334716796875, 3.845703125, 4.356689453125, 4.86767578125, 5.378662109375, 5.8896484375, 6.400634765625, 6.91162109375, 7.422607421875, 7.93359375, 8.444580078125, 8.95556640625, 9.466552734375, 9.9775390625, 10.488525390625, 10.99951171875, 11.510498046875, 12.021484375, 12.532470703125, 13.04345703125, 13.554443359375, 14.0654296875, 14.576416015625, 15.08740234375, 15.598388671875, 16.109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 13.0, 19.0, 16.0, 25.0, 36.0, 60.0, 106.0, 146.0, 206.0, 334.0, 479.0, 735.0, 1133.0, 1757.0, 2678.0, 4264.0, 6947.0, 11512.0, 19793.0, 35705.0, 69547.0, 147186.0, 304683.0, 224853.0, 100260.0, 49953.0, 26933.0, 15217.0, 8880.0, 5412.0, 3341.0, 2222.0, 1374.0, 973.0, 594.0, 380.0, 266.0, 190.0, 102.0, 54.0, 45.0, 38.0, 38.0, 12.0, 9.0, 6.0, 5.0, 9.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238525390625, -0.23077011108398438, -0.22301483154296875, -0.21525955200195312, -0.2075042724609375, -0.19974899291992188, -0.19199371337890625, -0.18423843383789062, -0.176483154296875, -0.16872787475585938, -0.16097259521484375, -0.15321731567382812, -0.1454620361328125, -0.13770675659179688, -0.12995147705078125, -0.12219619750976562, -0.11444091796875, -0.10668563842773438, -0.09893035888671875, -0.09117507934570312, -0.0834197998046875, -0.07566452026367188, -0.06790924072265625, -0.060153961181640625, -0.052398681640625, -0.044643402099609375, -0.03688812255859375, -0.029132843017578125, -0.0213775634765625, -0.013622283935546875, -0.00586700439453125, 0.001888275146484375, 0.0096435546875, 0.017398834228515625, 0.02515411376953125, 0.032909393310546875, 0.0406646728515625, 0.048419952392578125, 0.05617523193359375, 0.06393051147460938, 0.071685791015625, 0.07944107055664062, 0.08719635009765625, 0.09495162963867188, 0.1027069091796875, 0.11046218872070312, 0.11821746826171875, 0.12597274780273438, 0.13372802734375, 0.14148330688476562, 0.14923858642578125, 0.15699386596679688, 0.1647491455078125, 0.17250442504882812, 0.18025970458984375, 0.18801498413085938, 0.195770263671875, 0.20352554321289062, 0.21128082275390625, 0.21903610229492188, 0.2267913818359375, 0.23454666137695312, 0.24230194091796875, 0.2500572204589844, 0.2578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 8.0, 20.0, 25.0, 30.0, 42.0, 49.0, 61.0, 78.0, 77.0, 80.0, 69.0, 94.0, 68.0, 63.0, 50.0, 42.0, 32.0, 24.0, 14.0, 17.0, 11.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.003545761108398e-05, -6.810110062360764e-05, -6.616674363613129e-05, -6.423238664865494e-05, -6.229802966117859e-05, -6.036367267370224e-05, -5.842931568622589e-05, -5.649495869874954e-05, -5.456060171127319e-05, -5.2626244723796844e-05, -5.0691887736320496e-05, -4.875753074884415e-05, -4.68231737613678e-05, -4.488881677389145e-05, -4.29544597864151e-05, -4.102010279893875e-05, -3.90857458114624e-05, -3.7151388823986053e-05, -3.5217031836509705e-05, -3.3282674849033356e-05, -3.134831786155701e-05, -2.9413960874080658e-05, -2.747960388660431e-05, -2.554524689912796e-05, -2.361088991165161e-05, -2.1676532924175262e-05, -1.9742175936698914e-05, -1.7807818949222565e-05, -1.5873461961746216e-05, -1.3939104974269867e-05, -1.2004747986793518e-05, -1.007039099931717e-05, -8.13603401184082e-06, -6.2016770243644714e-06, -4.2673200368881226e-06, -2.3329630494117737e-06, -3.986060619354248e-07, 1.535750925540924e-06, 3.470107913017273e-06, 5.404464900493622e-06, 7.338821887969971e-06, 9.27317887544632e-06, 1.1207535862922668e-05, 1.3141892850399017e-05, 1.5076249837875366e-05, 1.7010606825351715e-05, 1.8944963812828064e-05, 2.0879320800304413e-05, 2.2813677787780762e-05, 2.474803477525711e-05, 2.668239176273346e-05, 2.861674875020981e-05, 3.055110573768616e-05, 3.2485462725162506e-05, 3.4419819712638855e-05, 3.6354176700115204e-05, 3.828853368759155e-05, 4.02228906750679e-05, 4.215724766254425e-05, 4.40916046500206e-05, 4.602596163749695e-05, 4.79603186249733e-05, 4.9894675612449646e-05, 5.1829032599925995e-05, 5.3763389587402344e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 14.0, 18.0, 29.0, 40.0, 65.0, 101.0, 132.0, 251.0, 343.0, 578.0, 915.0, 1585.0, 2556.0, 4337.0, 7466.0, 13301.0, 25208.0, 48274.0, 96985.0, 226977.0, 346002.0, 134811.0, 64973.0, 32871.0, 17587.0, 9423.0, 5485.0, 3180.0, 1872.0, 1193.0, 722.0, 482.0, 295.0, 148.0, 101.0, 78.0, 51.0, 26.0, 28.0, 20.0, 8.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9523696899414062, -0.9228057861328125, -0.8932418823242188, -0.863677978515625, -0.8341140747070312, -0.8045501708984375, -0.7749862670898438, -0.74542236328125, -0.7158584594726562, -0.6862945556640625, -0.6567306518554688, -0.627166748046875, -0.5976028442382812, -0.5680389404296875, -0.5384750366210938, -0.5089111328125, -0.47934722900390625, -0.4497833251953125, -0.42021942138671875, -0.390655517578125, -0.36109161376953125, -0.3315277099609375, -0.30196380615234375, -0.27239990234375, -0.24283599853515625, -0.2132720947265625, -0.18370819091796875, -0.154144287109375, -0.12458038330078125, -0.0950164794921875, -0.06545257568359375, -0.035888671875, -0.00632476806640625, 0.0232391357421875, 0.05280303955078125, 0.082366943359375, 0.11193084716796875, 0.1414947509765625, 0.17105865478515625, 0.20062255859375, 0.23018646240234375, 0.2597503662109375, 0.28931427001953125, 0.318878173828125, 0.34844207763671875, 0.3780059814453125, 0.40756988525390625, 0.4371337890625, 0.46669769287109375, 0.4962615966796875, 0.5258255004882812, 0.555389404296875, 0.5849533081054688, 0.6145172119140625, 0.6440811157226562, 0.67364501953125, 0.7032089233398438, 0.7327728271484375, 0.7623367309570312, 0.791900634765625, 0.8214645385742188, 0.8510284423828125, 0.8805923461914062, 0.91015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 8.0, 4.0, 7.0, 7.0, 10.0, 14.0, 14.0, 22.0, 20.0, 25.0, 32.0, 30.0, 42.0, 39.0, 47.0, 46.0, 38.0, 48.0, 51.0, 49.0, 38.0, 35.0, 52.0, 56.0, 41.0, 39.0, 31.0, 33.0, 22.0, 12.0, 13.0, 13.0, 16.0, 10.0, 6.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.438232421875, -0.4240760803222656, -0.40991973876953125, -0.3957633972167969, -0.3816070556640625, -0.3674507141113281, -0.35329437255859375, -0.3391380310058594, -0.324981689453125, -0.3108253479003906, -0.29666900634765625, -0.2825126647949219, -0.2683563232421875, -0.2541999816894531, -0.24004364013671875, -0.22588729858398438, -0.21173095703125, -0.19757461547851562, -0.18341827392578125, -0.16926193237304688, -0.1551055908203125, -0.14094924926757812, -0.12679290771484375, -0.11263656616210938, -0.098480224609375, -0.08432388305664062, -0.07016754150390625, -0.056011199951171875, -0.0418548583984375, -0.027698516845703125, -0.01354217529296875, 0.000614166259765625, 0.0147705078125, 0.028926849365234375, 0.04308319091796875, 0.057239532470703125, 0.0713958740234375, 0.08555221557617188, 0.09970855712890625, 0.11386489868164062, 0.128021240234375, 0.14217758178710938, 0.15633392333984375, 0.17049026489257812, 0.1846466064453125, 0.19880294799804688, 0.21295928955078125, 0.22711563110351562, 0.24127197265625, 0.2554283142089844, 0.26958465576171875, 0.2837409973144531, 0.2978973388671875, 0.3120536804199219, 0.32621002197265625, 0.3403663635253906, 0.354522705078125, 0.3686790466308594, 0.38283538818359375, 0.3969917297363281, 0.4111480712890625, 0.4253044128417969, 0.43946075439453125, 0.4536170959472656, 0.4677734375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 9.0, 6.0, 10.0, 13.0, 15.0, 24.0, 19.0, 31.0, 31.0, 39.0, 34.0, 27.0, 34.0, 42.0, 40.0, 41.0, 54.0, 44.0, 37.0, 40.0, 35.0, 45.0, 38.0, 39.0, 26.0, 26.0, 29.0, 21.0, 20.0, 18.0, 20.0, 18.0, 13.0, 9.0, 11.0, 7.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-19.849225997924805, -19.220840454101562, -18.592456817626953, -17.96407127380371, -17.33568572998047, -16.70730209350586, -16.078916549682617, -15.450531005859375, -14.82214641571045, -14.193761825561523, -13.565376281738281, -12.936991691589355, -12.30860710144043, -11.680221557617188, -11.051836967468262, -10.423452377319336, -9.795066833496094, -9.166682243347168, -8.538296699523926, -7.909912109375, -7.281527042388916, -6.653141975402832, -6.024757385253906, -5.396372318267822, -4.767987251281738, -4.139602184295654, -3.5112173557281494, -2.8828325271606445, -2.2544474601745605, -1.6260623931884766, -0.9976775646209717, -0.3692927360534668, 0.2590904235839844, 0.8874753713607788, 1.5158603191375732, 2.144245147705078, 2.772630214691162, 3.401015281677246, 4.029399871826172, 4.657784938812256, 5.28617000579834, 5.914555072784424, 6.542940139770508, 7.171324729919434, 7.799709796905518, 8.428094863891602, 9.056479454040527, 9.684864044189453, 10.313249588012695, 10.941634178161621, 11.570019721984863, 12.198404312133789, 12.826789855957031, 13.455174446105957, 14.083559036254883, 14.711944580078125, 15.34032917022705, 15.968713760375977, 16.59709930419922, 17.22548484802246, 17.85386848449707, 18.482254028320312, 19.110639572143555, 19.739023208618164, 20.367408752441406]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 9.0, 11.0, 8.0, 12.0, 19.0, 19.0, 19.0, 21.0, 24.0, 19.0, 24.0, 23.0, 39.0, 33.0, 30.0, 42.0, 33.0, 46.0, 37.0, 42.0, 38.0, 33.0, 50.0, 39.0, 29.0, 34.0, 26.0, 28.0, 18.0, 21.0, 18.0, 20.0, 22.0, 24.0, 11.0, 6.0, 6.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.98387336730957, -21.26636505126953, -20.548858642578125, -19.831350326538086, -19.11384391784668, -18.39633560180664, -17.678829193115234, -16.961320877075195, -16.243812561035156, -15.526305198669434, -14.808797836303711, -14.091289520263672, -13.373783111572266, -12.656274795532227, -11.938767433166504, -11.221260070800781, -10.503753662109375, -9.786246299743652, -9.06873893737793, -8.35123062133789, -7.633723735809326, -6.9162163734436035, -6.198708534240723, -5.481201171875, -4.763693809509277, -4.046186447143555, -3.328678846359253, -2.611171245574951, -1.8936638832092285, -1.1761565208435059, -0.458648681640625, 0.25885868072509766, 0.9763660430908203, 1.6938735246658325, 2.4113810062408447, 3.1288886070251465, 3.846395969390869, 4.563903331756592, 5.281411170959473, 5.998918533325195, 6.716425895690918, 7.433933258056641, 8.151440620422363, 8.868947982788086, 9.586456298828125, 10.303962707519531, 11.02147102355957, 11.738978385925293, 12.456485748291016, 13.173993110656738, 13.891500473022461, 14.6090087890625, 15.326515197753906, 16.044023513793945, 16.761531829833984, 17.47903823852539, 18.196544647216797, 18.914052963256836, 19.631559371948242, 20.34906768798828, 21.066574096679688, 21.784082412719727, 22.501590728759766, 23.219097137451172, 23.93660545349121]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 8.0, 7.0, 19.0, 19.0, 42.0, 71.0, 118.0, 236.0, 365.0, 624.0, 1067.0, 1687.0, 2768.0, 4462.0, 7312.0, 11736.0, 18616.0, 28219.0, 41838.0, 59384.0, 79773.0, 99219.0, 113428.0, 119214.0, 112266.0, 97195.0, 77658.0, 57081.0, 40445.0, 27137.0, 17482.0, 11012.0, 7077.0, 4341.0, 2618.0, 1633.0, 945.0, 568.0, 347.0, 206.0, 122.0, 83.0, 50.0, 31.0, 14.0, 7.0, 6.0, 6.0, 5.0, 0.0, 3.0], "bins": [-18.734375, -18.2203369140625, -17.706298828125, -17.1922607421875, -16.67822265625, -16.1641845703125, -15.650146484375, -15.1361083984375, -14.6220703125, -14.1080322265625, -13.593994140625, -13.0799560546875, -12.56591796875, -12.0518798828125, -11.537841796875, -11.0238037109375, -10.509765625, -9.9957275390625, -9.481689453125, -8.9676513671875, -8.45361328125, -7.9395751953125, -7.425537109375, -6.9114990234375, -6.3974609375, -5.8834228515625, -5.369384765625, -4.8553466796875, -4.34130859375, -3.8272705078125, -3.313232421875, -2.7991943359375, -2.28515625, -1.7711181640625, -1.257080078125, -0.7430419921875, -0.22900390625, 0.2850341796875, 0.799072265625, 1.3131103515625, 1.8271484375, 2.3411865234375, 2.855224609375, 3.3692626953125, 3.88330078125, 4.3973388671875, 4.911376953125, 5.4254150390625, 5.939453125, 6.4534912109375, 6.967529296875, 7.4815673828125, 7.99560546875, 8.5096435546875, 9.023681640625, 9.5377197265625, 10.0517578125, 10.5657958984375, 11.079833984375, 11.5938720703125, 12.10791015625, 12.6219482421875, 13.135986328125, 13.6500244140625, 14.1640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 4.0, 7.0, 11.0, 10.0, 7.0, 11.0, 17.0, 11.0, 19.0, 28.0, 27.0, 21.0, 22.0, 33.0, 24.0, 33.0, 25.0, 39.0, 41.0, 39.0, 29.0, 40.0, 45.0, 46.0, 30.0, 44.0, 32.0, 27.0, 35.0, 35.0, 28.0, 21.0, 23.0, 16.0, 11.0, 19.0, 11.0, 15.0, 14.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.3125, -19.612060546875, -18.91162109375, -18.211181640625, -17.5107421875, -16.810302734375, -16.10986328125, -15.409423828125, -14.708984375, -14.008544921875, -13.30810546875, -12.607666015625, -11.9072265625, -11.206787109375, -10.50634765625, -9.805908203125, -9.10546875, -8.405029296875, -7.70458984375, -7.004150390625, -6.3037109375, -5.603271484375, -4.90283203125, -4.202392578125, -3.501953125, -2.801513671875, -2.10107421875, -1.400634765625, -0.7001953125, 0.000244140625, 0.70068359375, 1.401123046875, 2.1015625, 2.802001953125, 3.50244140625, 4.202880859375, 4.9033203125, 5.603759765625, 6.30419921875, 7.004638671875, 7.705078125, 8.405517578125, 9.10595703125, 9.806396484375, 10.5068359375, 11.207275390625, 11.90771484375, 12.608154296875, 13.30859375, 14.009033203125, 14.70947265625, 15.409912109375, 16.1103515625, 16.810791015625, 17.51123046875, 18.211669921875, 18.912109375, 19.612548828125, 20.31298828125, 21.013427734375, 21.7138671875, 22.414306640625, 23.11474609375, 23.815185546875, 24.515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 11.0, 22.0, 30.0, 42.0, 71.0, 117.0, 169.0, 256.0, 429.0, 638.0, 915.0, 1465.0, 2260.0, 3470.0, 5485.0, 8128.0, 12055.0, 18730.0, 26956.0, 38183.0, 53059.0, 69752.0, 86045.0, 98688.0, 106550.0, 105550.0, 97731.0, 82868.0, 66641.0, 50193.0, 36482.0, 25556.0, 17157.0, 11332.0, 7532.0, 4944.0, 3202.0, 1979.0, 1362.0, 828.0, 596.0, 385.0, 243.0, 156.0, 117.0, 60.0, 43.0, 21.0, 19.0, 13.0, 6.0, 5.0, 5.0, 1.0, 1.0], "bins": [-15.875, -15.4068603515625, -14.938720703125, -14.4705810546875, -14.00244140625, -13.5343017578125, -13.066162109375, -12.5980224609375, -12.1298828125, -11.6617431640625, -11.193603515625, -10.7254638671875, -10.25732421875, -9.7891845703125, -9.321044921875, -8.8529052734375, -8.384765625, -7.9166259765625, -7.448486328125, -6.9803466796875, -6.51220703125, -6.0440673828125, -5.575927734375, -5.1077880859375, -4.6396484375, -4.1715087890625, -3.703369140625, -3.2352294921875, -2.76708984375, -2.2989501953125, -1.830810546875, -1.3626708984375, -0.89453125, -0.4263916015625, 0.041748046875, 0.5098876953125, 0.97802734375, 1.4461669921875, 1.914306640625, 2.3824462890625, 2.8505859375, 3.3187255859375, 3.786865234375, 4.2550048828125, 4.72314453125, 5.1912841796875, 5.659423828125, 6.1275634765625, 6.595703125, 7.0638427734375, 7.531982421875, 8.0001220703125, 8.46826171875, 8.9364013671875, 9.404541015625, 9.8726806640625, 10.3408203125, 10.8089599609375, 11.277099609375, 11.7452392578125, 12.21337890625, 12.6815185546875, 13.149658203125, 13.6177978515625, 14.0859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 3.0, 2.0, 6.0, 11.0, 9.0, 11.0, 15.0, 16.0, 16.0, 15.0, 19.0, 28.0, 23.0, 27.0, 34.0, 37.0, 34.0, 23.0, 49.0, 37.0, 40.0, 35.0, 48.0, 49.0, 47.0, 36.0, 29.0, 40.0, 35.0, 27.0, 21.0, 25.0, 27.0, 19.0, 19.0, 13.0, 11.0, 9.0, 5.0, 11.0, 9.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-15.03125, -14.5692138671875, -14.107177734375, -13.6451416015625, -13.18310546875, -12.7210693359375, -12.259033203125, -11.7969970703125, -11.3349609375, -10.8729248046875, -10.410888671875, -9.9488525390625, -9.48681640625, -9.0247802734375, -8.562744140625, -8.1007080078125, -7.638671875, -7.1766357421875, -6.714599609375, -6.2525634765625, -5.79052734375, -5.3284912109375, -4.866455078125, -4.4044189453125, -3.9423828125, -3.4803466796875, -3.018310546875, -2.5562744140625, -2.09423828125, -1.6322021484375, -1.170166015625, -0.7081298828125, -0.24609375, 0.2159423828125, 0.677978515625, 1.1400146484375, 1.60205078125, 2.0640869140625, 2.526123046875, 2.9881591796875, 3.4501953125, 3.9122314453125, 4.374267578125, 4.8363037109375, 5.29833984375, 5.7603759765625, 6.222412109375, 6.6844482421875, 7.146484375, 7.6085205078125, 8.070556640625, 8.5325927734375, 8.99462890625, 9.4566650390625, 9.918701171875, 10.3807373046875, 10.8427734375, 11.3048095703125, 11.766845703125, 12.2288818359375, 12.69091796875, 13.1529541015625, 13.614990234375, 14.0770263671875, 14.5390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 16.0, 21.0, 30.0, 38.0, 45.0, 73.0, 119.0, 215.0, 316.0, 494.0, 850.0, 1389.0, 2432.0, 4428.0, 7691.0, 13415.0, 23351.0, 39997.0, 65015.0, 98583.0, 133225.0, 153567.0, 150099.0, 124701.0, 89074.0, 57653.0, 34368.0, 20235.0, 11372.0, 6723.0, 3690.0, 2043.0, 1306.0, 736.0, 443.0, 276.0, 181.0, 121.0, 89.0, 45.0, 29.0, 13.0, 13.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94921875, -5.7564697265625, -5.563720703125, -5.3709716796875, -5.17822265625, -4.9854736328125, -4.792724609375, -4.5999755859375, -4.4072265625, -4.2144775390625, -4.021728515625, -3.8289794921875, -3.63623046875, -3.4434814453125, -3.250732421875, -3.0579833984375, -2.865234375, -2.6724853515625, -2.479736328125, -2.2869873046875, -2.09423828125, -1.9014892578125, -1.708740234375, -1.5159912109375, -1.3232421875, -1.1304931640625, -0.937744140625, -0.7449951171875, -0.55224609375, -0.3594970703125, -0.166748046875, 0.0260009765625, 0.21875, 0.4114990234375, 0.604248046875, 0.7969970703125, 0.98974609375, 1.1824951171875, 1.375244140625, 1.5679931640625, 1.7607421875, 1.9534912109375, 2.146240234375, 2.3389892578125, 2.53173828125, 2.7244873046875, 2.917236328125, 3.1099853515625, 3.302734375, 3.4954833984375, 3.688232421875, 3.8809814453125, 4.07373046875, 4.2664794921875, 4.459228515625, 4.6519775390625, 4.8447265625, 5.0374755859375, 5.230224609375, 5.4229736328125, 5.61572265625, 5.8084716796875, 6.001220703125, 6.1939697265625, 6.38671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 13.0, 12.0, 26.0, 21.0, 20.0, 17.0, 27.0, 27.0, 33.0, 36.0, 35.0, 43.0, 56.0, 50.0, 49.0, 51.0, 50.0, 44.0, 43.0, 50.0, 29.0, 40.0, 33.0, 30.0, 30.0, 21.0, 22.0, 15.0, 16.0, 8.0, 7.0, 9.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006279945373535156, -0.0006105229258537292, -0.0005930513143539429, -0.0005755797028541565, -0.0005581080913543701, -0.0005406364798545837, -0.0005231648683547974, -0.000505693256855011, -0.0004882216453552246, -0.00047075003385543823, -0.00045327842235565186, -0.0004358068108558655, -0.0004183351993560791, -0.0004008635878562927, -0.00038339197635650635, -0.00036592036485671997, -0.0003484487533569336, -0.0003309771418571472, -0.00031350553035736084, -0.00029603391885757446, -0.0002785623073577881, -0.0002610906958580017, -0.00024361908435821533, -0.00022614747285842896, -0.00020867586135864258, -0.0001912042498588562, -0.00017373263835906982, -0.00015626102685928345, -0.00013878941535949707, -0.0001213178038597107, -0.00010384619235992432, -8.637458086013794e-05, -6.890296936035156e-05, -5.1431357860565186e-05, -3.395974636077881e-05, -1.648813486099243e-05, 9.834766387939453e-07, 1.8455088138580322e-05, 3.59266996383667e-05, 5.3398311138153076e-05, 7.086992263793945e-05, 8.834153413772583e-05, 0.00010581314563751221, 0.00012328475713729858, 0.00014075636863708496, 0.00015822798013687134, 0.00017569959163665771, 0.0001931712031364441, 0.00021064281463623047, 0.00022811442613601685, 0.0002455860376358032, 0.0002630576491355896, 0.000280529260635376, 0.00029800087213516235, 0.00031547248363494873, 0.0003329440951347351, 0.0003504157066345215, 0.00036788731813430786, 0.00038535892963409424, 0.0004028305411338806, 0.000420302152633667, 0.00043777376413345337, 0.00045524537563323975, 0.0004727169871330261, 0.0004901885986328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 13.0, 21.0, 27.0, 43.0, 62.0, 85.0, 118.0, 193.0, 321.0, 473.0, 767.0, 1142.0, 1844.0, 2634.0, 4317.0, 6758.0, 10840.0, 16929.0, 26247.0, 39628.0, 57388.0, 78305.0, 101292.0, 118408.0, 124724.0, 117330.0, 99163.0, 76372.0, 55585.0, 38138.0, 24984.0, 15974.0, 10300.0, 6575.0, 4192.0, 2618.0, 1717.0, 1019.0, 719.0, 473.0, 291.0, 166.0, 116.0, 75.0, 55.0, 35.0, 30.0, 8.0, 15.0, 6.0, 6.0, 4.0, 4.0, 3.0], "bins": [-5.6875, -5.52239990234375, -5.3572998046875, -5.19219970703125, -5.027099609375, -4.86199951171875, -4.6968994140625, -4.53179931640625, -4.36669921875, -4.20159912109375, -4.0364990234375, -3.87139892578125, -3.706298828125, -3.54119873046875, -3.3760986328125, -3.21099853515625, -3.0458984375, -2.88079833984375, -2.7156982421875, -2.55059814453125, -2.385498046875, -2.22039794921875, -2.0552978515625, -1.89019775390625, -1.72509765625, -1.55999755859375, -1.3948974609375, -1.22979736328125, -1.064697265625, -0.89959716796875, -0.7344970703125, -0.56939697265625, -0.404296875, -0.23919677734375, -0.0740966796875, 0.09100341796875, 0.256103515625, 0.42120361328125, 0.5863037109375, 0.75140380859375, 0.91650390625, 1.08160400390625, 1.2467041015625, 1.41180419921875, 1.576904296875, 1.74200439453125, 1.9071044921875, 2.07220458984375, 2.2373046875, 2.40240478515625, 2.5675048828125, 2.73260498046875, 2.897705078125, 3.06280517578125, 3.2279052734375, 3.39300537109375, 3.55810546875, 3.72320556640625, 3.8883056640625, 4.05340576171875, 4.218505859375, 4.38360595703125, 4.5487060546875, 4.71380615234375, 4.87890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 9.0, 10.0, 10.0, 13.0, 11.0, 24.0, 19.0, 32.0, 37.0, 28.0, 23.0, 26.0, 49.0, 48.0, 37.0, 39.0, 47.0, 40.0, 42.0, 41.0, 44.0, 47.0, 40.0, 36.0, 35.0, 17.0, 31.0, 16.0, 28.0, 17.0, 13.0, 16.0, 18.0, 10.0, 8.0, 2.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.431640625, -2.360595703125, -2.28955078125, -2.218505859375, -2.1474609375, -2.076416015625, -2.00537109375, -1.934326171875, -1.86328125, -1.792236328125, -1.72119140625, -1.650146484375, -1.5791015625, -1.508056640625, -1.43701171875, -1.365966796875, -1.294921875, -1.223876953125, -1.15283203125, -1.081787109375, -1.0107421875, -0.939697265625, -0.86865234375, -0.797607421875, -0.7265625, -0.655517578125, -0.58447265625, -0.513427734375, -0.4423828125, -0.371337890625, -0.30029296875, -0.229248046875, -0.158203125, -0.087158203125, -0.01611328125, 0.054931640625, 0.1259765625, 0.197021484375, 0.26806640625, 0.339111328125, 0.41015625, 0.481201171875, 0.55224609375, 0.623291015625, 0.6943359375, 0.765380859375, 0.83642578125, 0.907470703125, 0.978515625, 1.049560546875, 1.12060546875, 1.191650390625, 1.2626953125, 1.333740234375, 1.40478515625, 1.475830078125, 1.546875, 1.617919921875, 1.68896484375, 1.760009765625, 1.8310546875, 1.902099609375, 1.97314453125, 2.044189453125, 2.115234375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 10.0, 4.0, 3.0, 6.0, 8.0, 11.0, 14.0, 12.0, 22.0, 27.0, 22.0, 30.0, 33.0, 27.0, 29.0, 31.0, 47.0, 49.0, 44.0, 54.0, 34.0, 44.0, 56.0, 37.0, 36.0, 31.0, 36.0, 32.0, 29.0, 17.0, 26.0, 22.0, 18.0, 20.0, 17.0, 15.0, 8.0, 14.0, 6.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.69333839416504, -19.070175170898438, -18.44701385498047, -17.823850631713867, -17.2006893157959, -16.577526092529297, -15.954364776611328, -15.331201553344727, -14.708040237426758, -14.084877967834473, -13.461715698242188, -12.838553428649902, -12.215391159057617, -11.592228889465332, -10.969066619873047, -10.345903396606445, -9.72274112701416, -9.099578857421875, -8.47641658782959, -7.853254318237305, -7.2300920486450195, -6.606929779052734, -5.983767032623291, -5.360604763031006, -4.737442493438721, -4.1142802238464355, -3.4911179542541504, -2.867955446243286, -2.244793176651001, -1.6216309070587158, -0.9984683990478516, -0.3753061294555664, 0.24785614013671875, 0.8710184693336487, 1.4941807985305786, 2.1173431873321533, 2.7405054569244385, 3.3636677265167236, 3.986830234527588, 4.609992504119873, 5.233154773712158, 5.856317043304443, 6.4794793128967285, 7.102642059326172, 7.725804328918457, 8.348966598510742, 8.972128868103027, 9.595291137695312, 10.218453407287598, 10.841615676879883, 11.464777946472168, 12.087940216064453, 12.711102485656738, 13.334264755249023, 13.957427978515625, 14.580589294433594, 15.203752517700195, 15.82691478729248, 16.450077056884766, 17.073240280151367, 17.696401596069336, 18.319564819335938, 18.942726135253906, 19.565889358520508, 20.189050674438477]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 11.0, 6.0, 15.0, 15.0, 15.0, 15.0, 21.0, 15.0, 19.0, 23.0, 30.0, 26.0, 31.0, 45.0, 31.0, 35.0, 44.0, 47.0, 41.0, 43.0, 35.0, 36.0, 32.0, 35.0, 35.0, 29.0, 29.0, 27.0, 27.0, 23.0, 29.0, 9.0, 20.0, 18.0, 11.0, 10.0, 15.0, 8.0, 4.0, 7.0, 1.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.66383934020996, -21.906023025512695, -21.14820671081543, -20.390392303466797, -19.63257598876953, -18.874759674072266, -18.116943359375, -17.359127044677734, -16.60131072998047, -15.843494415283203, -15.085679054260254, -14.327862739562988, -13.570047378540039, -12.812231063842773, -12.054414749145508, -11.296598434448242, -10.53878402709961, -9.780967712402344, -9.023152351379395, -8.265336036682129, -7.5075201988220215, -6.749704360961914, -5.991888046264648, -5.234072208404541, -4.476256370544434, -3.718440532684326, -2.9606244564056396, -2.202808380126953, -1.4449925422668457, -0.6871767044067383, 0.07063961029052734, 0.8284554481506348, 1.5862712860107422, 2.3440871238708496, 3.101903200149536, 3.8597192764282227, 4.61753511428833, 5.3753509521484375, 6.133167266845703, 6.8909831047058105, 7.648798942565918, 8.406615257263184, 9.164430618286133, 9.922246932983398, 10.680063247680664, 11.437878608703613, 12.195694923400879, 12.953510284423828, 13.711326599121094, 14.46914291381836, 15.226958274841309, 15.984774589538574, 16.742589950561523, 17.50040626525879, 18.258222579956055, 19.01603889465332, 19.773853302001953, 20.53166961669922, 21.289485931396484, 22.04730224609375, 22.805116653442383, 23.56293296813965, 24.320749282836914, 25.07856559753418, 25.836381912231445]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 15.0, 27.0, 44.0, 64.0, 110.0, 189.0, 293.0, 463.0, 667.0, 1067.0, 1716.0, 2626.0, 4184.0, 6432.0, 9971.0, 15678.0, 23948.0, 37188.0, 56319.0, 84469.0, 124540.0, 178942.0, 248936.0, 328801.0, 404343.0, 457729.0, 467615.0, 433900.0, 364196.0, 284770.0, 209687.0, 149072.0, 101443.0, 67792.0, 45039.0, 29052.0, 18841.0, 12241.0, 8050.0, 4934.0, 3250.0, 2050.0, 1289.0, 869.0, 522.0, 310.0, 245.0, 137.0, 79.0, 53.0, 33.0, 22.0, 9.0, 6.0, 6.0, 3.0, 1.0], "bins": [-15.734375, -15.2608642578125, -14.787353515625, -14.3138427734375, -13.84033203125, -13.3668212890625, -12.893310546875, -12.4197998046875, -11.9462890625, -11.4727783203125, -10.999267578125, -10.5257568359375, -10.05224609375, -9.5787353515625, -9.105224609375, -8.6317138671875, -8.158203125, -7.6846923828125, -7.211181640625, -6.7376708984375, -6.26416015625, -5.7906494140625, -5.317138671875, -4.8436279296875, -4.3701171875, -3.8966064453125, -3.423095703125, -2.9495849609375, -2.47607421875, -2.0025634765625, -1.529052734375, -1.0555419921875, -0.58203125, -0.1085205078125, 0.364990234375, 0.8385009765625, 1.31201171875, 1.7855224609375, 2.259033203125, 2.7325439453125, 3.2060546875, 3.6795654296875, 4.153076171875, 4.6265869140625, 5.10009765625, 5.5736083984375, 6.047119140625, 6.5206298828125, 6.994140625, 7.4676513671875, 7.941162109375, 8.4146728515625, 8.88818359375, 9.3616943359375, 9.835205078125, 10.3087158203125, 10.7822265625, 11.2557373046875, 11.729248046875, 12.2027587890625, 12.67626953125, 13.1497802734375, 13.623291015625, 14.0968017578125, 14.5703125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 3.0, 10.0, 10.0, 10.0, 12.0, 13.0, 13.0, 13.0, 24.0, 27.0, 16.0, 22.0, 25.0, 44.0, 25.0, 38.0, 39.0, 38.0, 46.0, 49.0, 41.0, 44.0, 27.0, 40.0, 35.0, 32.0, 29.0, 36.0, 29.0, 20.0, 16.0, 21.0, 18.0, 20.0, 8.0, 19.0, 15.0, 13.0, 13.0, 5.0, 10.0, 1.0, 6.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.0625, -17.504150390625, -16.94580078125, -16.387451171875, -15.8291015625, -15.270751953125, -14.71240234375, -14.154052734375, -13.595703125, -13.037353515625, -12.47900390625, -11.920654296875, -11.3623046875, -10.803955078125, -10.24560546875, -9.687255859375, -9.12890625, -8.570556640625, -8.01220703125, -7.453857421875, -6.8955078125, -6.337158203125, -5.77880859375, -5.220458984375, -4.662109375, -4.103759765625, -3.54541015625, -2.987060546875, -2.4287109375, -1.870361328125, -1.31201171875, -0.753662109375, -0.1953125, 0.363037109375, 0.92138671875, 1.479736328125, 2.0380859375, 2.596435546875, 3.15478515625, 3.713134765625, 4.271484375, 4.829833984375, 5.38818359375, 5.946533203125, 6.5048828125, 7.063232421875, 7.62158203125, 8.179931640625, 8.73828125, 9.296630859375, 9.85498046875, 10.413330078125, 10.9716796875, 11.530029296875, 12.08837890625, 12.646728515625, 13.205078125, 13.763427734375, 14.32177734375, 14.880126953125, 15.4384765625, 15.996826171875, 16.55517578125, 17.113525390625, 17.671875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 10.0, 9.0, 16.0, 22.0, 40.0, 89.0, 126.0, 246.0, 419.0, 710.0, 1204.0, 2172.0, 3750.0, 6410.0, 11174.0, 19314.0, 32394.0, 53622.0, 85925.0, 133262.0, 196391.0, 273441.0, 357475.0, 430821.0, 473545.0, 474782.0, 433361.0, 361686.0, 280432.0, 200981.0, 136814.0, 88936.0, 54850.0, 33433.0, 19774.0, 11322.0, 6571.0, 3775.0, 2136.0, 1230.0, 694.0, 385.0, 221.0, 127.0, 85.0, 54.0, 30.0, 15.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9453125, -14.4476318359375, -13.949951171875, -13.4522705078125, -12.95458984375, -12.4569091796875, -11.959228515625, -11.4615478515625, -10.9638671875, -10.4661865234375, -9.968505859375, -9.4708251953125, -8.97314453125, -8.4754638671875, -7.977783203125, -7.4801025390625, -6.982421875, -6.4847412109375, -5.987060546875, -5.4893798828125, -4.99169921875, -4.4940185546875, -3.996337890625, -3.4986572265625, -3.0009765625, -2.5032958984375, -2.005615234375, -1.5079345703125, -1.01025390625, -0.5125732421875, -0.014892578125, 0.4827880859375, 0.98046875, 1.4781494140625, 1.975830078125, 2.4735107421875, 2.97119140625, 3.4688720703125, 3.966552734375, 4.4642333984375, 4.9619140625, 5.4595947265625, 5.957275390625, 6.4549560546875, 6.95263671875, 7.4503173828125, 7.947998046875, 8.4456787109375, 8.943359375, 9.4410400390625, 9.938720703125, 10.4364013671875, 10.93408203125, 11.4317626953125, 11.929443359375, 12.4271240234375, 12.9248046875, 13.4224853515625, 13.920166015625, 14.4178466796875, 14.91552734375, 15.4132080078125, 15.910888671875, 16.4085693359375, 16.90625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 6.0, 5.0, 15.0, 11.0, 15.0, 23.0, 30.0, 39.0, 42.0, 48.0, 66.0, 102.0, 91.0, 106.0, 105.0, 144.0, 150.0, 159.0, 184.0, 195.0, 178.0, 201.0, 207.0, 226.0, 207.0, 183.0, 189.0, 168.0, 142.0, 154.0, 107.0, 107.0, 76.0, 61.0, 73.0, 55.0, 37.0, 31.0, 35.0, 27.0, 13.0, 17.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.0234375, -8.7467041015625, -8.469970703125, -8.1932373046875, -7.91650390625, -7.6397705078125, -7.363037109375, -7.0863037109375, -6.8095703125, -6.5328369140625, -6.256103515625, -5.9793701171875, -5.70263671875, -5.4259033203125, -5.149169921875, -4.8724365234375, -4.595703125, -4.3189697265625, -4.042236328125, -3.7655029296875, -3.48876953125, -3.2120361328125, -2.935302734375, -2.6585693359375, -2.3818359375, -2.1051025390625, -1.828369140625, -1.5516357421875, -1.27490234375, -0.9981689453125, -0.721435546875, -0.4447021484375, -0.16796875, 0.1087646484375, 0.385498046875, 0.6622314453125, 0.93896484375, 1.2156982421875, 1.492431640625, 1.7691650390625, 2.0458984375, 2.3226318359375, 2.599365234375, 2.8760986328125, 3.15283203125, 3.4295654296875, 3.706298828125, 3.9830322265625, 4.259765625, 4.5364990234375, 4.813232421875, 5.0899658203125, 5.36669921875, 5.6434326171875, 5.920166015625, 6.1968994140625, 6.4736328125, 6.7503662109375, 7.027099609375, 7.3038330078125, 7.58056640625, 7.8572998046875, 8.134033203125, 8.4107666015625, 8.6875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 9.0, 10.0, 14.0, 16.0, 18.0, 30.0, 25.0, 33.0, 29.0, 49.0, 45.0, 47.0, 53.0, 45.0, 53.0, 71.0, 53.0, 45.0, 49.0, 40.0, 31.0, 37.0, 22.0, 34.0, 25.0, 18.0, 20.0, 23.0, 13.0, 10.0, 7.0, 5.0, 1.0, 9.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.792701721191406, -18.082082748413086, -17.371461868286133, -16.660842895507812, -15.950222969055176, -15.239603042602539, -14.528984069824219, -13.818364143371582, -13.107744216918945, -12.397124290466309, -11.686504364013672, -10.975885391235352, -10.265265464782715, -9.554645538330078, -8.844026565551758, -8.133406639099121, -7.422786712646484, -6.712166786193848, -6.001547336578369, -5.290927886962891, -4.580307960510254, -3.8696882724761963, -3.1590685844421387, -2.44844913482666, -1.7378292083740234, -1.0272095203399658, -0.3165898323059082, 0.3940298557281494, 1.104649543762207, 1.8152692317962646, 2.5258889198303223, 3.236508369445801, 3.9471282958984375, 4.657748222351074, 5.368367671966553, 6.078987121582031, 6.789607048034668, 7.500226974487305, 8.210845947265625, 8.921465873718262, 9.632085800170898, 10.342705726623535, 11.053325653076172, 11.763944625854492, 12.474564552307129, 13.185184478759766, 13.895803451538086, 14.606423377990723, 15.31704330444336, 16.02766227722168, 16.738283157348633, 17.448902130126953, 18.159523010253906, 18.870141983032227, 19.580760955810547, 20.2913818359375, 21.00200080871582, 21.71261978149414, 22.423240661621094, 23.133859634399414, 23.844478607177734, 24.555099487304688, 25.265718460083008, 25.976337432861328, 26.68695831298828]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 15.0, 11.0, 13.0, 16.0, 27.0, 24.0, 24.0, 32.0, 34.0, 44.0, 49.0, 34.0, 40.0, 46.0, 56.0, 39.0, 43.0, 33.0, 41.0, 33.0, 35.0, 36.0, 40.0, 22.0, 24.0, 24.0, 22.0, 21.0, 15.0, 12.0, 8.0, 9.0, 7.0, 6.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.516550064086914, -20.770729064941406, -20.02490997314453, -19.279088973999023, -18.533267974853516, -17.78744888305664, -17.041627883911133, -16.295806884765625, -15.54998779296875, -14.804167747497559, -14.058347702026367, -13.31252670288086, -12.566706657409668, -11.820886611938477, -11.075065612792969, -10.329245567321777, -9.583425521850586, -8.837605476379395, -8.091785430908203, -7.345964431762695, -6.600144386291504, -5.8543243408203125, -5.108503818511963, -4.362683296203613, -3.616863250732422, -2.8710429668426514, -2.125222682952881, -1.3794023990631104, -0.6335821151733398, 0.11223816871643066, 0.8580584526062012, 1.6038789749145508, 2.349700927734375, 3.0955212116241455, 3.841341495513916, 4.587162017822266, 5.332982063293457, 6.078802108764648, 6.824622631072998, 7.570443153381348, 8.316263198852539, 9.06208324432373, 9.807903289794922, 10.55372428894043, 11.299544334411621, 12.045364379882812, 12.79118537902832, 13.537005424499512, 14.282825469970703, 15.028645515441895, 15.774465560913086, 16.520286560058594, 17.26610565185547, 18.011926651000977, 18.757747650146484, 19.50356674194336, 20.249387741088867, 20.995208740234375, 21.74102783203125, 22.486848831176758, 23.232669830322266, 23.97848892211914, 24.72430992126465, 25.470130920410156, 26.21595001220703]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 10.0, 24.0, 35.0, 43.0, 77.0, 112.0, 163.0, 253.0, 371.0, 593.0, 861.0, 1298.0, 2087.0, 3070.0, 4839.0, 7475.0, 11773.0, 18250.0, 28870.0, 44508.0, 69316.0, 106399.0, 156577.0, 186002.0, 140415.0, 93920.0, 61312.0, 38982.0, 25378.0, 16252.0, 10553.0, 6598.0, 4296.0, 2734.0, 1787.0, 1159.0, 740.0, 480.0, 317.0, 205.0, 125.0, 95.0, 53.0, 40.0, 33.0, 29.0, 14.0, 15.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.8494873046875, -2.755615234375, -2.6617431640625, -2.56787109375, -2.4739990234375, -2.380126953125, -2.2862548828125, -2.1923828125, -2.0985107421875, -2.004638671875, -1.9107666015625, -1.81689453125, -1.7230224609375, -1.629150390625, -1.5352783203125, -1.44140625, -1.3475341796875, -1.253662109375, -1.1597900390625, -1.06591796875, -0.9720458984375, -0.878173828125, -0.7843017578125, -0.6904296875, -0.5965576171875, -0.502685546875, -0.4088134765625, -0.31494140625, -0.2210693359375, -0.127197265625, -0.0333251953125, 0.060546875, 0.1544189453125, 0.248291015625, 0.3421630859375, 0.43603515625, 0.5299072265625, 0.623779296875, 0.7176513671875, 0.8115234375, 0.9053955078125, 0.999267578125, 1.0931396484375, 1.18701171875, 1.2808837890625, 1.374755859375, 1.4686279296875, 1.5625, 1.6563720703125, 1.750244140625, 1.8441162109375, 1.93798828125, 2.0318603515625, 2.125732421875, 2.2196044921875, 2.3134765625, 2.4073486328125, 2.501220703125, 2.5950927734375, 2.68896484375, 2.7828369140625, 2.876708984375, 2.9705810546875, 3.064453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 8.0, 13.0, 8.0, 8.0, 13.0, 17.0, 14.0, 19.0, 20.0, 26.0, 28.0, 31.0, 40.0, 33.0, 48.0, 45.0, 42.0, 44.0, 55.0, 44.0, 41.0, 45.0, 45.0, 35.0, 34.0, 25.0, 20.0, 40.0, 27.0, 25.0, 20.0, 10.0, 17.0, 12.0, 7.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -22.206787109375, -21.42919921875, -20.651611328125, -19.8740234375, -19.096435546875, -18.31884765625, -17.541259765625, -16.763671875, -15.986083984375, -15.20849609375, -14.430908203125, -13.6533203125, -12.875732421875, -12.09814453125, -11.320556640625, -10.54296875, -9.765380859375, -8.98779296875, -8.210205078125, -7.4326171875, -6.655029296875, -5.87744140625, -5.099853515625, -4.322265625, -3.544677734375, -2.76708984375, -1.989501953125, -1.2119140625, -0.434326171875, 0.34326171875, 1.120849609375, 1.8984375, 2.676025390625, 3.45361328125, 4.231201171875, 5.0087890625, 5.786376953125, 6.56396484375, 7.341552734375, 8.119140625, 8.896728515625, 9.67431640625, 10.451904296875, 11.2294921875, 12.007080078125, 12.78466796875, 13.562255859375, 14.33984375, 15.117431640625, 15.89501953125, 16.672607421875, 17.4501953125, 18.227783203125, 19.00537109375, 19.782958984375, 20.560546875, 21.338134765625, 22.11572265625, 22.893310546875, 23.6708984375, 24.448486328125, 25.22607421875, 26.003662109375, 26.78125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 11.0, 13.0, 16.0, 29.0, 62.0, 65.0, 119.0, 143.0, 217.0, 315.0, 504.0, 701.0, 1022.0, 1412.0, 1942.0, 3040.0, 4200.0, 6212.0, 9318.0, 14261.0, 21584.0, 33063.0, 52240.0, 81266.0, 126684.0, 181011.0, 173621.0, 118904.0, 76389.0, 48291.0, 30706.0, 20094.0, 13078.0, 8897.0, 6053.0, 4043.0, 2730.0, 1961.0, 1320.0, 972.0, 593.0, 464.0, 307.0, 232.0, 153.0, 97.0, 70.0, 41.0, 32.0, 26.0, 18.0, 7.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.638671875, -2.5533447265625, -2.468017578125, -2.3826904296875, -2.29736328125, -2.2120361328125, -2.126708984375, -2.0413818359375, -1.9560546875, -1.8707275390625, -1.785400390625, -1.7000732421875, -1.61474609375, -1.5294189453125, -1.444091796875, -1.3587646484375, -1.2734375, -1.1881103515625, -1.102783203125, -1.0174560546875, -0.93212890625, -0.8468017578125, -0.761474609375, -0.6761474609375, -0.5908203125, -0.5054931640625, -0.420166015625, -0.3348388671875, -0.24951171875, -0.1641845703125, -0.078857421875, 0.0064697265625, 0.091796875, 0.1771240234375, 0.262451171875, 0.3477783203125, 0.43310546875, 0.5184326171875, 0.603759765625, 0.6890869140625, 0.7744140625, 0.8597412109375, 0.945068359375, 1.0303955078125, 1.11572265625, 1.2010498046875, 1.286376953125, 1.3717041015625, 1.45703125, 1.5423583984375, 1.627685546875, 1.7130126953125, 1.79833984375, 1.8836669921875, 1.968994140625, 2.0543212890625, 2.1396484375, 2.2249755859375, 2.310302734375, 2.3956298828125, 2.48095703125, 2.5662841796875, 2.651611328125, 2.7369384765625, 2.822265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 8.0, 3.0, 9.0, 10.0, 12.0, 11.0, 17.0, 12.0, 14.0, 12.0, 19.0, 23.0, 25.0, 31.0, 33.0, 28.0, 37.0, 36.0, 33.0, 26.0, 44.0, 50.0, 37.0, 36.0, 43.0, 41.0, 40.0, 15.0, 34.0, 24.0, 30.0, 33.0, 27.0, 20.0, 16.0, 21.0, 22.0, 12.0, 11.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-14.65625, -14.21142578125, -13.7666015625, -13.32177734375, -12.876953125, -12.43212890625, -11.9873046875, -11.54248046875, -11.09765625, -10.65283203125, -10.2080078125, -9.76318359375, -9.318359375, -8.87353515625, -8.4287109375, -7.98388671875, -7.5390625, -7.09423828125, -6.6494140625, -6.20458984375, -5.759765625, -5.31494140625, -4.8701171875, -4.42529296875, -3.98046875, -3.53564453125, -3.0908203125, -2.64599609375, -2.201171875, -1.75634765625, -1.3115234375, -0.86669921875, -0.421875, 0.02294921875, 0.4677734375, 0.91259765625, 1.357421875, 1.80224609375, 2.2470703125, 2.69189453125, 3.13671875, 3.58154296875, 4.0263671875, 4.47119140625, 4.916015625, 5.36083984375, 5.8056640625, 6.25048828125, 6.6953125, 7.14013671875, 7.5849609375, 8.02978515625, 8.474609375, 8.91943359375, 9.3642578125, 9.80908203125, 10.25390625, 10.69873046875, 11.1435546875, 11.58837890625, 12.033203125, 12.47802734375, 12.9228515625, 13.36767578125, 13.8125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 14.0, 18.0, 35.0, 47.0, 75.0, 99.0, 148.0, 223.0, 359.0, 491.0, 795.0, 1143.0, 1891.0, 3013.0, 4949.0, 8500.0, 15153.0, 28527.0, 58683.0, 134774.0, 331318.0, 257400.0, 101036.0, 45880.0, 23170.0, 12241.0, 7131.0, 4232.0, 2503.0, 1561.0, 1042.0, 683.0, 481.0, 309.0, 191.0, 129.0, 95.0, 61.0, 40.0, 31.0, 22.0, 15.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2255859375, -0.21850013732910156, -0.21141433715820312, -0.2043285369873047, -0.19724273681640625, -0.1901569366455078, -0.18307113647460938, -0.17598533630371094, -0.1688995361328125, -0.16181373596191406, -0.15472793579101562, -0.1476421356201172, -0.14055633544921875, -0.1334705352783203, -0.12638473510742188, -0.11929893493652344, -0.112213134765625, -0.10512733459472656, -0.09804153442382812, -0.09095573425292969, -0.08386993408203125, -0.07678413391113281, -0.06969833374023438, -0.06261253356933594, -0.0555267333984375, -0.04844093322753906, -0.041355133056640625, -0.03426933288574219, -0.02718353271484375, -0.020097732543945312, -0.013011932373046875, -0.0059261322021484375, 0.00115966796875, 0.008245468139648438, 0.015331268310546875, 0.022417068481445312, 0.02950286865234375, 0.03658866882324219, 0.043674468994140625, 0.05076026916503906, 0.0578460693359375, 0.06493186950683594, 0.07201766967773438, 0.07910346984863281, 0.08618927001953125, 0.09327507019042969, 0.10036087036132812, 0.10744667053222656, 0.114532470703125, 0.12161827087402344, 0.12870407104492188, 0.1357898712158203, 0.14287567138671875, 0.1499614715576172, 0.15704727172851562, 0.16413307189941406, 0.1712188720703125, 0.17830467224121094, 0.18539047241210938, 0.1924762725830078, 0.19956207275390625, 0.2066478729248047, 0.21373367309570312, 0.22081947326660156, 0.2279052734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 7.0, 6.0, 6.0, 6.0, 5.0, 14.0, 6.0, 16.0, 15.0, 17.0, 26.0, 16.0, 23.0, 17.0, 36.0, 40.0, 37.0, 48.0, 48.0, 56.0, 48.0, 46.0, 39.0, 45.0, 39.0, 43.0, 25.0, 41.0, 37.0, 29.0, 30.0, 22.0, 22.0, 17.0, 10.0, 12.0, 13.0, 6.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.5928020477294922e-05, -2.5063753128051758e-05, -2.4199485778808594e-05, -2.333521842956543e-05, -2.2470951080322266e-05, -2.16066837310791e-05, -2.0742416381835938e-05, -1.9878149032592773e-05, -1.901388168334961e-05, -1.8149614334106445e-05, -1.728534698486328e-05, -1.6421079635620117e-05, -1.5556812286376953e-05, -1.4692544937133789e-05, -1.3828277587890625e-05, -1.2964010238647461e-05, -1.2099742889404297e-05, -1.1235475540161133e-05, -1.0371208190917969e-05, -9.506940841674805e-06, -8.64267349243164e-06, -7.778406143188477e-06, -6.9141387939453125e-06, -6.0498714447021484e-06, -5.185604095458984e-06, -4.32133674621582e-06, -3.4570693969726562e-06, -2.592802047729492e-06, -1.7285346984863281e-06, -8.642673492431641e-07, 0.0, 8.642673492431641e-07, 1.7285346984863281e-06, 2.592802047729492e-06, 3.4570693969726562e-06, 4.32133674621582e-06, 5.185604095458984e-06, 6.0498714447021484e-06, 6.9141387939453125e-06, 7.778406143188477e-06, 8.64267349243164e-06, 9.506940841674805e-06, 1.0371208190917969e-05, 1.1235475540161133e-05, 1.2099742889404297e-05, 1.2964010238647461e-05, 1.3828277587890625e-05, 1.4692544937133789e-05, 1.5556812286376953e-05, 1.6421079635620117e-05, 1.728534698486328e-05, 1.8149614334106445e-05, 1.901388168334961e-05, 1.9878149032592773e-05, 2.0742416381835938e-05, 2.16066837310791e-05, 2.2470951080322266e-05, 2.333521842956543e-05, 2.4199485778808594e-05, 2.5063753128051758e-05, 2.5928020477294922e-05, 2.6792287826538086e-05, 2.765655517578125e-05, 2.8520822525024414e-05, 2.9385089874267578e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 12.0, 15.0, 33.0, 27.0, 60.0, 97.0, 124.0, 222.0, 332.0, 434.0, 628.0, 908.0, 1330.0, 2007.0, 2885.0, 4248.0, 6269.0, 8792.0, 12554.0, 18469.0, 27754.0, 42550.0, 68448.0, 117158.0, 228273.0, 207990.0, 109193.0, 64280.0, 40553.0, 26452.0, 17738.0, 11963.0, 8289.0, 5741.0, 4004.0, 2737.0, 1904.0, 1292.0, 916.0, 572.0, 460.0, 314.0, 177.0, 104.0, 77.0, 47.0, 42.0, 28.0, 16.0, 19.0, 10.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.446533203125, -0.43297576904296875, -0.4194183349609375, -0.40586090087890625, -0.392303466796875, -0.37874603271484375, -0.3651885986328125, -0.35163116455078125, -0.33807373046875, -0.32451629638671875, -0.3109588623046875, -0.29740142822265625, -0.283843994140625, -0.27028656005859375, -0.2567291259765625, -0.24317169189453125, -0.2296142578125, -0.21605682373046875, -0.2024993896484375, -0.18894195556640625, -0.175384521484375, -0.16182708740234375, -0.1482696533203125, -0.13471221923828125, -0.12115478515625, -0.10759735107421875, -0.0940399169921875, -0.08048248291015625, -0.066925048828125, -0.05336761474609375, -0.0398101806640625, -0.02625274658203125, -0.0126953125, 0.00086212158203125, 0.0144195556640625, 0.02797698974609375, 0.041534423828125, 0.05509185791015625, 0.0686492919921875, 0.08220672607421875, 0.09576416015625, 0.10932159423828125, 0.1228790283203125, 0.13643646240234375, 0.149993896484375, 0.16355133056640625, 0.1771087646484375, 0.19066619873046875, 0.2042236328125, 0.21778106689453125, 0.2313385009765625, 0.24489593505859375, 0.258453369140625, 0.27201080322265625, 0.2855682373046875, 0.29912567138671875, 0.31268310546875, 0.32624053955078125, 0.3397979736328125, 0.35335540771484375, 0.366912841796875, 0.38047027587890625, 0.3940277099609375, 0.40758514404296875, 0.421142578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 7.0, 5.0, 5.0, 10.0, 8.0, 10.0, 17.0, 18.0, 23.0, 14.0, 32.0, 19.0, 25.0, 34.0, 40.0, 38.0, 42.0, 61.0, 55.0, 62.0, 64.0, 53.0, 48.0, 42.0, 39.0, 37.0, 32.0, 24.0, 18.0, 24.0, 11.0, 10.0, 12.0, 9.0, 7.0, 9.0, 9.0, 5.0, 8.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31591796875, -0.3057594299316406, -0.29560089111328125, -0.2854423522949219, -0.2752838134765625, -0.2651252746582031, -0.25496673583984375, -0.24480819702148438, -0.234649658203125, -0.22449111938476562, -0.21433258056640625, -0.20417404174804688, -0.1940155029296875, -0.18385696411132812, -0.17369842529296875, -0.16353988647460938, -0.15338134765625, -0.14322280883789062, -0.13306427001953125, -0.12290573120117188, -0.1127471923828125, -0.10258865356445312, -0.09243011474609375, -0.08227157592773438, -0.072113037109375, -0.061954498291015625, -0.05179595947265625, -0.041637420654296875, -0.0314788818359375, -0.021320343017578125, -0.01116180419921875, -0.001003265380859375, 0.0091552734375, 0.019313812255859375, 0.02947235107421875, 0.039630889892578125, 0.0497894287109375, 0.059947967529296875, 0.07010650634765625, 0.08026504516601562, 0.090423583984375, 0.10058212280273438, 0.11074066162109375, 0.12089920043945312, 0.1310577392578125, 0.14121627807617188, 0.15137481689453125, 0.16153335571289062, 0.17169189453125, 0.18185043334960938, 0.19200897216796875, 0.20216751098632812, 0.2123260498046875, 0.22248458862304688, 0.23264312744140625, 0.24280166625976562, 0.252960205078125, 0.2631187438964844, 0.27327728271484375, 0.2834358215332031, 0.2935943603515625, 0.3037528991699219, 0.31391143798828125, 0.3240699768066406, 0.334228515625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 10.0, 14.0, 15.0, 20.0, 21.0, 28.0, 36.0, 20.0, 45.0, 37.0, 56.0, 51.0, 36.0, 62.0, 52.0, 58.0, 56.0, 49.0, 45.0, 38.0, 24.0, 36.0, 30.0, 23.0, 30.0, 19.0, 18.0, 14.0, 13.0, 10.0, 8.0, 2.0, 2.0, 8.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.86077308654785, -18.159896850585938, -17.459020614624023, -16.75814437866211, -16.057270050048828, -15.356392860412598, -14.655517578125, -13.954641342163086, -13.253765106201172, -12.552888870239258, -11.852012634277344, -11.151137351989746, -10.450261116027832, -9.749384880065918, -9.04850959777832, -8.347633361816406, -7.646757125854492, -6.945880889892578, -6.245005130767822, -5.544129371643066, -4.843253135681152, -4.142376899719238, -3.4415011405944824, -2.7406253814697266, -2.0397491455078125, -1.3388731479644775, -0.6379971504211426, 0.06287884712219238, 0.7637548446655273, 1.4646308422088623, 2.1655068397521973, 2.866382598876953, 3.5672607421875, 4.268136978149414, 4.96901273727417, 5.669888496398926, 6.37076473236084, 7.071640968322754, 7.77251672744751, 8.473392486572266, 9.17426872253418, 9.875144958496094, 10.576021194458008, 11.276896476745605, 11.97777271270752, 12.678648948669434, 13.379524230957031, 14.080400466918945, 14.78127670288086, 15.482152938842773, 16.183029174804688, 16.8839054107666, 17.584781646728516, 18.285655975341797, 18.98653221130371, 19.687408447265625, 20.38828468322754, 21.089160919189453, 21.790037155151367, 22.49091339111328, 23.191787719726562, 23.892663955688477, 24.59354019165039, 25.294416427612305, 25.99529266357422]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 6.0, 1.0, 5.0, 5.0, 3.0, 5.0, 7.0, 8.0, 12.0, 8.0, 15.0, 11.0, 16.0, 12.0, 31.0, 23.0, 25.0, 28.0, 35.0, 47.0, 42.0, 40.0, 37.0, 48.0, 50.0, 49.0, 36.0, 38.0, 36.0, 31.0, 38.0, 38.0, 34.0, 25.0, 25.0, 27.0, 18.0, 20.0, 17.0, 9.0, 11.0, 5.0, 11.0, 6.0, 4.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.182872772216797, -20.446439743041992, -19.710006713867188, -18.973573684692383, -18.237140655517578, -17.500707626342773, -16.76427459716797, -16.027841567993164, -15.29140853881836, -14.554975509643555, -13.81854248046875, -13.082109451293945, -12.34567642211914, -11.609243392944336, -10.872810363769531, -10.136377334594727, -9.399944305419922, -8.663511276245117, -7.9270782470703125, -7.190645217895508, -6.454212188720703, -5.717779159545898, -4.981346130371094, -4.244913101196289, -3.5084800720214844, -2.7720470428466797, -2.035614013671875, -1.2991809844970703, -0.5627479553222656, 0.17368507385253906, 0.9101181030273438, 1.6465511322021484, 2.3829822540283203, 3.119415283203125, 3.8558483123779297, 4.592281341552734, 5.328714370727539, 6.065147399902344, 6.801580429077148, 7.538013458251953, 8.274446487426758, 9.010879516601562, 9.747312545776367, 10.483745574951172, 11.220178604125977, 11.956611633300781, 12.693044662475586, 13.42947769165039, 14.165910720825195, 14.90234375, 15.638776779174805, 16.37520980834961, 17.111642837524414, 17.84807586669922, 18.584508895874023, 19.320941925048828, 20.057374954223633, 20.793807983398438, 21.530241012573242, 22.266674041748047, 23.00310707092285, 23.739540100097656, 24.47597312927246, 25.212406158447266, 25.94883918762207]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 20.0, 25.0, 37.0, 57.0, 98.0, 178.0, 247.0, 394.0, 649.0, 1027.0, 1659.0, 2770.0, 4603.0, 7236.0, 11435.0, 17936.0, 27040.0, 39738.0, 55693.0, 74439.0, 92567.0, 107601.0, 114535.0, 111181.0, 98611.0, 82102.0, 62401.0, 45753.0, 31510.0, 20776.0, 13536.0, 8540.0, 5393.0, 3375.0, 2088.0, 1272.0, 787.0, 479.0, 271.0, 194.0, 115.0, 58.0, 41.0, 38.0, 13.0, 6.0, 14.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-14.890625, -14.4486083984375, -14.006591796875, -13.5645751953125, -13.12255859375, -12.6805419921875, -12.238525390625, -11.7965087890625, -11.3544921875, -10.9124755859375, -10.470458984375, -10.0284423828125, -9.58642578125, -9.1444091796875, -8.702392578125, -8.2603759765625, -7.818359375, -7.3763427734375, -6.934326171875, -6.4923095703125, -6.05029296875, -5.6082763671875, -5.166259765625, -4.7242431640625, -4.2822265625, -3.8402099609375, -3.398193359375, -2.9561767578125, -2.51416015625, -2.0721435546875, -1.630126953125, -1.1881103515625, -0.74609375, -0.3040771484375, 0.137939453125, 0.5799560546875, 1.02197265625, 1.4639892578125, 1.906005859375, 2.3480224609375, 2.7900390625, 3.2320556640625, 3.674072265625, 4.1160888671875, 4.55810546875, 5.0001220703125, 5.442138671875, 5.8841552734375, 6.326171875, 6.7681884765625, 7.210205078125, 7.6522216796875, 8.09423828125, 8.5362548828125, 8.978271484375, 9.4202880859375, 9.8623046875, 10.3043212890625, 10.746337890625, 11.1883544921875, 11.63037109375, 12.0723876953125, 12.514404296875, 12.9564208984375, 13.3984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 5.0, 13.0, 7.0, 11.0, 8.0, 9.0, 12.0, 19.0, 23.0, 18.0, 24.0, 44.0, 38.0, 35.0, 33.0, 37.0, 48.0, 40.0, 47.0, 47.0, 47.0, 43.0, 37.0, 51.0, 31.0, 37.0, 45.0, 27.0, 25.0, 24.0, 18.0, 25.0, 16.0, 10.0, 7.0, 5.0, 6.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.3974609375, -20.638671875, -19.8798828125, -19.12109375, -18.3623046875, -17.603515625, -16.8447265625, -16.0859375, -15.3271484375, -14.568359375, -13.8095703125, -13.05078125, -12.2919921875, -11.533203125, -10.7744140625, -10.015625, -9.2568359375, -8.498046875, -7.7392578125, -6.98046875, -6.2216796875, -5.462890625, -4.7041015625, -3.9453125, -3.1865234375, -2.427734375, -1.6689453125, -0.91015625, -0.1513671875, 0.607421875, 1.3662109375, 2.125, 2.8837890625, 3.642578125, 4.4013671875, 5.16015625, 5.9189453125, 6.677734375, 7.4365234375, 8.1953125, 8.9541015625, 9.712890625, 10.4716796875, 11.23046875, 11.9892578125, 12.748046875, 13.5068359375, 14.265625, 15.0244140625, 15.783203125, 16.5419921875, 17.30078125, 18.0595703125, 18.818359375, 19.5771484375, 20.3359375, 21.0947265625, 21.853515625, 22.6123046875, 23.37109375, 24.1298828125, 24.888671875, 25.6474609375, 26.40625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 14.0, 12.0, 31.0, 39.0, 74.0, 140.0, 231.0, 335.0, 594.0, 1044.0, 1840.0, 3051.0, 5523.0, 9330.0, 15938.0, 25908.0, 40623.0, 60761.0, 85115.0, 108571.0, 125831.0, 130328.0, 120180.0, 99736.0, 74615.0, 51912.0, 34234.0, 21305.0, 13066.0, 7658.0, 4367.0, 2619.0, 1397.0, 907.0, 465.0, 308.0, 182.0, 102.0, 60.0, 49.0, 24.0, 12.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9453125, -15.4359130859375, -14.926513671875, -14.4171142578125, -13.90771484375, -13.3983154296875, -12.888916015625, -12.3795166015625, -11.8701171875, -11.3607177734375, -10.851318359375, -10.3419189453125, -9.83251953125, -9.3231201171875, -8.813720703125, -8.3043212890625, -7.794921875, -7.2855224609375, -6.776123046875, -6.2667236328125, -5.75732421875, -5.2479248046875, -4.738525390625, -4.2291259765625, -3.7197265625, -3.2103271484375, -2.700927734375, -2.1915283203125, -1.68212890625, -1.1727294921875, -0.663330078125, -0.1539306640625, 0.35546875, 0.8648681640625, 1.374267578125, 1.8836669921875, 2.39306640625, 2.9024658203125, 3.411865234375, 3.9212646484375, 4.4306640625, 4.9400634765625, 5.449462890625, 5.9588623046875, 6.46826171875, 6.9776611328125, 7.487060546875, 7.9964599609375, 8.505859375, 9.0152587890625, 9.524658203125, 10.0340576171875, 10.54345703125, 11.0528564453125, 11.562255859375, 12.0716552734375, 12.5810546875, 13.0904541015625, 13.599853515625, 14.1092529296875, 14.61865234375, 15.1280517578125, 15.637451171875, 16.1468505859375, 16.65625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 2.0, 6.0, 8.0, 6.0, 9.0, 16.0, 17.0, 22.0, 24.0, 29.0, 35.0, 31.0, 31.0, 37.0, 40.0, 34.0, 39.0, 57.0, 70.0, 38.0, 58.0, 40.0, 58.0, 43.0, 32.0, 28.0, 29.0, 30.0, 17.0, 22.0, 22.0, 17.0, 21.0, 6.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.078125, -14.576171875, -14.07421875, -13.572265625, -13.0703125, -12.568359375, -12.06640625, -11.564453125, -11.0625, -10.560546875, -10.05859375, -9.556640625, -9.0546875, -8.552734375, -8.05078125, -7.548828125, -7.046875, -6.544921875, -6.04296875, -5.541015625, -5.0390625, -4.537109375, -4.03515625, -3.533203125, -3.03125, -2.529296875, -2.02734375, -1.525390625, -1.0234375, -0.521484375, -0.01953125, 0.482421875, 0.984375, 1.486328125, 1.98828125, 2.490234375, 2.9921875, 3.494140625, 3.99609375, 4.498046875, 5.0, 5.501953125, 6.00390625, 6.505859375, 7.0078125, 7.509765625, 8.01171875, 8.513671875, 9.015625, 9.517578125, 10.01953125, 10.521484375, 11.0234375, 11.525390625, 12.02734375, 12.529296875, 13.03125, 13.533203125, 14.03515625, 14.537109375, 15.0390625, 15.541015625, 16.04296875, 16.544921875, 17.046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 1.0, 8.0, 10.0, 4.0, 16.0, 26.0, 28.0, 43.0, 95.0, 112.0, 163.0, 233.0, 396.0, 567.0, 893.0, 1432.0, 2227.0, 3745.0, 6000.0, 9513.0, 15970.0, 25210.0, 39537.0, 58931.0, 83810.0, 109098.0, 128086.0, 132881.0, 121052.0, 98340.0, 72460.0, 50113.0, 33233.0, 20562.0, 12797.0, 8069.0, 4681.0, 2989.0, 1865.0, 1193.0, 762.0, 473.0, 340.0, 185.0, 147.0, 82.0, 63.0, 43.0, 34.0, 14.0, 11.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.62109375, -4.473388671875, -4.32568359375, -4.177978515625, -4.0302734375, -3.882568359375, -3.73486328125, -3.587158203125, -3.439453125, -3.291748046875, -3.14404296875, -2.996337890625, -2.8486328125, -2.700927734375, -2.55322265625, -2.405517578125, -2.2578125, -2.110107421875, -1.96240234375, -1.814697265625, -1.6669921875, -1.519287109375, -1.37158203125, -1.223876953125, -1.076171875, -0.928466796875, -0.78076171875, -0.633056640625, -0.4853515625, -0.337646484375, -0.18994140625, -0.042236328125, 0.10546875, 0.253173828125, 0.40087890625, 0.548583984375, 0.6962890625, 0.843994140625, 0.99169921875, 1.139404296875, 1.287109375, 1.434814453125, 1.58251953125, 1.730224609375, 1.8779296875, 2.025634765625, 2.17333984375, 2.321044921875, 2.46875, 2.616455078125, 2.76416015625, 2.911865234375, 3.0595703125, 3.207275390625, 3.35498046875, 3.502685546875, 3.650390625, 3.798095703125, 3.94580078125, 4.093505859375, 4.2412109375, 4.388916015625, 4.53662109375, 4.684326171875, 4.83203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 0.0, 9.0, 9.0, 12.0, 18.0, 17.0, 20.0, 25.0, 22.0, 27.0, 42.0, 48.0, 42.0, 54.0, 61.0, 39.0, 55.0, 49.0, 58.0, 56.0, 56.0, 47.0, 37.0, 38.0, 23.0, 23.0, 23.0, 18.0, 13.0, 15.0, 11.0, 11.0, 6.0, 4.0, 7.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0005578994750976562, -0.0005419217050075531, -0.00052594393491745, -0.0005099661648273468, -0.0004939883947372437, -0.0004780106246471405, -0.00046203285455703735, -0.0004460550844669342, -0.00043007731437683105, -0.0004140995442867279, -0.00039812177419662476, -0.0003821440041065216, -0.00036616623401641846, -0.0003501884639263153, -0.00033421069383621216, -0.000318232923746109, -0.00030225515365600586, -0.0002862773835659027, -0.00027029961347579956, -0.0002543218433856964, -0.00023834407329559326, -0.0002223663032054901, -0.00020638853311538696, -0.0001904107630252838, -0.00017443299293518066, -0.00015845522284507751, -0.00014247745275497437, -0.00012649968266487122, -0.00011052191257476807, -9.454414248466492e-05, -7.856637239456177e-05, -6.258860230445862e-05, -4.661083221435547e-05, -3.063306212425232e-05, -1.465529203414917e-05, 1.3224780559539795e-06, 1.730024814605713e-05, 3.327801823616028e-05, 4.925578832626343e-05, 6.523355841636658e-05, 8.121132850646973e-05, 9.718909859657288e-05, 0.00011316686868667603, 0.00012914463877677917, 0.00014512240886688232, 0.00016110017895698547, 0.00017707794904708862, 0.00019305571913719177, 0.00020903348922729492, 0.00022501125931739807, 0.00024098902940750122, 0.00025696679949760437, 0.0002729445695877075, 0.00028892233967781067, 0.0003049001097679138, 0.00032087787985801697, 0.0003368556499481201, 0.00035283342003822327, 0.0003688111901283264, 0.00038478896021842957, 0.0004007667303085327, 0.00041674450039863586, 0.000432722270488739, 0.00044870004057884216, 0.0004646778106689453]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 7.0, 9.0, 13.0, 24.0, 39.0, 69.0, 111.0, 210.0, 313.0, 531.0, 816.0, 1353.0, 2246.0, 3666.0, 6511.0, 11058.0, 18681.0, 31340.0, 51177.0, 78292.0, 110493.0, 137719.0, 148045.0, 136344.0, 109034.0, 76406.0, 49451.0, 30356.0, 18063.0, 10619.0, 6238.0, 3717.0, 2216.0, 1345.0, 801.0, 475.0, 297.0, 159.0, 122.0, 70.0, 50.0, 25.0, 21.0, 6.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.49542236328125, -5.3150634765625, -5.13470458984375, -4.954345703125, -4.77398681640625, -4.5936279296875, -4.41326904296875, -4.23291015625, -4.05255126953125, -3.8721923828125, -3.69183349609375, -3.511474609375, -3.33111572265625, -3.1507568359375, -2.97039794921875, -2.7900390625, -2.60968017578125, -2.4293212890625, -2.24896240234375, -2.068603515625, -1.88824462890625, -1.7078857421875, -1.52752685546875, -1.34716796875, -1.16680908203125, -0.9864501953125, -0.80609130859375, -0.625732421875, -0.44537353515625, -0.2650146484375, -0.08465576171875, 0.095703125, 0.27606201171875, 0.4564208984375, 0.63677978515625, 0.817138671875, 0.99749755859375, 1.1778564453125, 1.35821533203125, 1.53857421875, 1.71893310546875, 1.8992919921875, 2.07965087890625, 2.260009765625, 2.44036865234375, 2.6207275390625, 2.80108642578125, 2.9814453125, 3.16180419921875, 3.3421630859375, 3.52252197265625, 3.702880859375, 3.88323974609375, 4.0635986328125, 4.24395751953125, 4.42431640625, 4.60467529296875, 4.7850341796875, 4.96539306640625, 5.145751953125, 5.32611083984375, 5.5064697265625, 5.68682861328125, 5.8671875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 8.0, 9.0, 16.0, 17.0, 22.0, 22.0, 34.0, 31.0, 41.0, 61.0, 56.0, 50.0, 60.0, 54.0, 84.0, 62.0, 65.0, 56.0, 51.0, 37.0, 27.0, 27.0, 23.0, 21.0, 15.0, 15.0, 10.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.288360595703125, -2.18414306640625, -2.079925537109375, -1.9757080078125, -1.871490478515625, -1.76727294921875, -1.663055419921875, -1.558837890625, -1.454620361328125, -1.35040283203125, -1.246185302734375, -1.1419677734375, -1.037750244140625, -0.93353271484375, -0.829315185546875, -0.72509765625, -0.620880126953125, -0.51666259765625, -0.412445068359375, -0.3082275390625, -0.204010009765625, -0.09979248046875, 0.004425048828125, 0.108642578125, 0.212860107421875, 0.31707763671875, 0.421295166015625, 0.5255126953125, 0.629730224609375, 0.73394775390625, 0.838165283203125, 0.9423828125, 1.046600341796875, 1.15081787109375, 1.255035400390625, 1.3592529296875, 1.463470458984375, 1.56768798828125, 1.671905517578125, 1.776123046875, 1.880340576171875, 1.98455810546875, 2.088775634765625, 2.1929931640625, 2.297210693359375, 2.40142822265625, 2.505645751953125, 2.60986328125, 2.714080810546875, 2.81829833984375, 2.922515869140625, 3.0267333984375, 3.130950927734375, 3.23516845703125, 3.339385986328125, 3.443603515625, 3.547821044921875, 3.65203857421875, 3.756256103515625, 3.8604736328125, 3.964691162109375, 4.06890869140625, 4.173126220703125, 4.27734375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 3.0, 6.0, 8.0, 11.0, 23.0, 19.0, 28.0, 26.0, 22.0, 18.0, 32.0, 32.0, 43.0, 42.0, 40.0, 46.0, 54.0, 47.0, 41.0, 52.0, 53.0, 32.0, 40.0, 34.0, 37.0, 28.0, 28.0, 20.0, 29.0, 18.0, 20.0, 15.0, 15.0, 7.0, 4.0, 7.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-17.382543563842773, -16.76424217224121, -16.14594078063965, -15.52763843536377, -14.90933609008789, -14.291034698486328, -13.672733306884766, -13.054431915283203, -12.436129570007324, -11.817828178405762, -11.199525833129883, -10.58122444152832, -9.962923049926758, -9.344620704650879, -8.726319313049316, -8.108016967773438, -7.489715576171875, -6.871413707733154, -6.253111839294434, -5.634810447692871, -5.01650857925415, -4.39820671081543, -3.779905080795288, -3.1616034507751465, -2.543301582336426, -1.9249998331069946, -1.3066980838775635, -0.6883963346481323, -0.07009458541870117, 0.5482072830200195, 1.1665089130401611, 1.7848105430603027, 2.4031124114990234, 3.021414279937744, 3.6397159099578857, 4.258017539978027, 4.876319408416748, 5.494621276855469, 6.112922668457031, 6.731224536895752, 7.349526405334473, 7.967828273773193, 8.586130142211914, 9.204431533813477, 9.822732925415039, 10.441035270690918, 11.05933666229248, 11.67763900756836, 12.295940399169922, 12.914241790771484, 13.532544136047363, 14.150845527648926, 14.769147872924805, 15.387449264526367, 16.00575065612793, 16.624052047729492, 17.242355346679688, 17.86065673828125, 18.478958129882812, 19.097261428833008, 19.71556282043457, 20.333864212036133, 20.952165603637695, 21.570466995239258, 22.18876838684082]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 18.0, 4.0, 12.0, 11.0, 11.0, 16.0, 16.0, 15.0, 20.0, 25.0, 36.0, 30.0, 47.0, 48.0, 48.0, 39.0, 47.0, 33.0, 30.0, 56.0, 51.0, 33.0, 35.0, 30.0, 41.0, 29.0, 27.0, 18.0, 25.0, 29.0, 25.0, 23.0, 17.0, 10.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.262420654296875, -23.506309509277344, -22.750198364257812, -21.99408531188965, -21.237974166870117, -20.481863021850586, -19.725749969482422, -18.96963882446289, -18.21352767944336, -17.457416534423828, -16.701305389404297, -15.945192337036133, -15.189081192016602, -14.43297004699707, -13.676857948303223, -12.920745849609375, -12.164634704589844, -11.408523559570312, -10.652411460876465, -9.896299362182617, -9.140188217163086, -8.384077072143555, -7.627964973449707, -6.871853351593018, -6.115741729736328, -5.359630107879639, -4.603518486022949, -3.8474068641662598, -3.0912952423095703, -2.335183620452881, -1.5790719985961914, -0.822960376739502, -0.06684684753417969, 0.6892647743225098, 1.4453763961791992, 2.2014880180358887, 2.957599639892578, 3.7137112617492676, 4.469822883605957, 5.2259345054626465, 5.982046127319336, 6.738157749176025, 7.494269371032715, 8.250381469726562, 9.006492614746094, 9.762603759765625, 10.518715858459473, 11.27482795715332, 12.030939102172852, 12.787050247192383, 13.54316234588623, 14.299274444580078, 15.05538558959961, 15.81149673461914, 16.567607879638672, 17.323720932006836, 18.079832077026367, 18.8359432220459, 19.592056274414062, 20.348167419433594, 21.104278564453125, 21.860389709472656, 22.616500854492188, 23.37261390686035, 24.128725051879883]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 19.0, 25.0, 50.0, 69.0, 111.0, 198.0, 282.0, 489.0, 912.0, 1322.0, 2281.0, 3505.0, 5801.0, 9377.0, 15022.0, 24234.0, 37952.0, 59206.0, 90666.0, 137251.0, 199301.0, 277145.0, 362930.0, 437987.0, 480758.0, 475340.0, 425482.0, 346039.0, 261072.0, 185642.0, 127163.0, 83288.0, 53664.0, 33941.0, 21299.0, 13293.0, 8169.0, 5065.0, 3134.0, 1901.0, 1113.0, 682.0, 418.0, 252.0, 156.0, 103.0, 62.0, 46.0, 31.0, 17.0, 11.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-15.1015625, -14.6424560546875, -14.183349609375, -13.7242431640625, -13.26513671875, -12.8060302734375, -12.346923828125, -11.8878173828125, -11.4287109375, -10.9696044921875, -10.510498046875, -10.0513916015625, -9.59228515625, -9.1331787109375, -8.674072265625, -8.2149658203125, -7.755859375, -7.2967529296875, -6.837646484375, -6.3785400390625, -5.91943359375, -5.4603271484375, -5.001220703125, -4.5421142578125, -4.0830078125, -3.6239013671875, -3.164794921875, -2.7056884765625, -2.24658203125, -1.7874755859375, -1.328369140625, -0.8692626953125, -0.41015625, 0.0489501953125, 0.508056640625, 0.9671630859375, 1.42626953125, 1.8853759765625, 2.344482421875, 2.8035888671875, 3.2626953125, 3.7218017578125, 4.180908203125, 4.6400146484375, 5.09912109375, 5.5582275390625, 6.017333984375, 6.4764404296875, 6.935546875, 7.3946533203125, 7.853759765625, 8.3128662109375, 8.77197265625, 9.2310791015625, 9.690185546875, 10.1492919921875, 10.6083984375, 11.0675048828125, 11.526611328125, 11.9857177734375, 12.44482421875, 12.9039306640625, 13.363037109375, 13.8221435546875, 14.28125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 2.0, 9.0, 6.0, 12.0, 8.0, 13.0, 6.0, 10.0, 14.0, 16.0, 23.0, 33.0, 23.0, 31.0, 28.0, 38.0, 37.0, 48.0, 34.0, 44.0, 58.0, 39.0, 44.0, 43.0, 39.0, 31.0, 45.0, 28.0, 33.0, 29.0, 29.0, 20.0, 30.0, 17.0, 20.0, 14.0, 11.0, 7.0, 7.0, 1.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.390625, -16.81396484375, -16.2373046875, -15.66064453125, -15.083984375, -14.50732421875, -13.9306640625, -13.35400390625, -12.77734375, -12.20068359375, -11.6240234375, -11.04736328125, -10.470703125, -9.89404296875, -9.3173828125, -8.74072265625, -8.1640625, -7.58740234375, -7.0107421875, -6.43408203125, -5.857421875, -5.28076171875, -4.7041015625, -4.12744140625, -3.55078125, -2.97412109375, -2.3974609375, -1.82080078125, -1.244140625, -0.66748046875, -0.0908203125, 0.48583984375, 1.0625, 1.63916015625, 2.2158203125, 2.79248046875, 3.369140625, 3.94580078125, 4.5224609375, 5.09912109375, 5.67578125, 6.25244140625, 6.8291015625, 7.40576171875, 7.982421875, 8.55908203125, 9.1357421875, 9.71240234375, 10.2890625, 10.86572265625, 11.4423828125, 12.01904296875, 12.595703125, 13.17236328125, 13.7490234375, 14.32568359375, 14.90234375, 15.47900390625, 16.0556640625, 16.63232421875, 17.208984375, 17.78564453125, 18.3623046875, 18.93896484375, 19.515625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 7.0, 2.0, 8.0, 7.0, 14.0, 26.0, 50.0, 80.0, 101.0, 137.0, 265.0, 445.0, 762.0, 1266.0, 2015.0, 3409.0, 5493.0, 9170.0, 15056.0, 24284.0, 38661.0, 60722.0, 90923.0, 134255.0, 189047.0, 252133.0, 319002.0, 380012.0, 420544.0, 430301.0, 410113.0, 362120.0, 299282.0, 231723.0, 170890.0, 119857.0, 80918.0, 53350.0, 33845.0, 21218.0, 12836.0, 7940.0, 4631.0, 2887.0, 1736.0, 1049.0, 645.0, 407.0, 229.0, 160.0, 94.0, 56.0, 40.0, 22.0, 18.0, 16.0, 6.0, 5.0, 4.0, 2.0], "bins": [-14.109375, -13.686279296875, -13.26318359375, -12.840087890625, -12.4169921875, -11.993896484375, -11.57080078125, -11.147705078125, -10.724609375, -10.301513671875, -9.87841796875, -9.455322265625, -9.0322265625, -8.609130859375, -8.18603515625, -7.762939453125, -7.33984375, -6.916748046875, -6.49365234375, -6.070556640625, -5.6474609375, -5.224365234375, -4.80126953125, -4.378173828125, -3.955078125, -3.531982421875, -3.10888671875, -2.685791015625, -2.2626953125, -1.839599609375, -1.41650390625, -0.993408203125, -0.5703125, -0.147216796875, 0.27587890625, 0.698974609375, 1.1220703125, 1.545166015625, 1.96826171875, 2.391357421875, 2.814453125, 3.237548828125, 3.66064453125, 4.083740234375, 4.5068359375, 4.929931640625, 5.35302734375, 5.776123046875, 6.19921875, 6.622314453125, 7.04541015625, 7.468505859375, 7.8916015625, 8.314697265625, 8.73779296875, 9.160888671875, 9.583984375, 10.007080078125, 10.43017578125, 10.853271484375, 11.2763671875, 11.699462890625, 12.12255859375, 12.545654296875, 12.96875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 9.0, 12.0, 19.0, 13.0, 27.0, 31.0, 54.0, 43.0, 52.0, 74.0, 88.0, 108.0, 99.0, 137.0, 159.0, 145.0, 188.0, 203.0, 202.0, 219.0, 240.0, 200.0, 223.0, 204.0, 187.0, 170.0, 129.0, 144.0, 127.0, 97.0, 96.0, 82.0, 61.0, 49.0, 38.0, 28.0, 21.0, 24.0, 16.0, 13.0, 16.0, 9.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.254150390625, -7.98486328125, -7.715576171875, -7.4462890625, -7.177001953125, -6.90771484375, -6.638427734375, -6.369140625, -6.099853515625, -5.83056640625, -5.561279296875, -5.2919921875, -5.022705078125, -4.75341796875, -4.484130859375, -4.21484375, -3.945556640625, -3.67626953125, -3.406982421875, -3.1376953125, -2.868408203125, -2.59912109375, -2.329833984375, -2.060546875, -1.791259765625, -1.52197265625, -1.252685546875, -0.9833984375, -0.714111328125, -0.44482421875, -0.175537109375, 0.09375, 0.363037109375, 0.63232421875, 0.901611328125, 1.1708984375, 1.440185546875, 1.70947265625, 1.978759765625, 2.248046875, 2.517333984375, 2.78662109375, 3.055908203125, 3.3251953125, 3.594482421875, 3.86376953125, 4.133056640625, 4.40234375, 4.671630859375, 4.94091796875, 5.210205078125, 5.4794921875, 5.748779296875, 6.01806640625, 6.287353515625, 6.556640625, 6.825927734375, 7.09521484375, 7.364501953125, 7.6337890625, 7.903076171875, 8.17236328125, 8.441650390625, 8.7109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 13.0, 15.0, 17.0, 18.0, 22.0, 27.0, 24.0, 22.0, 35.0, 38.0, 61.0, 59.0, 65.0, 54.0, 54.0, 60.0, 48.0, 50.0, 43.0, 38.0, 31.0, 35.0, 33.0, 24.0, 19.0, 19.0, 14.0, 13.0, 10.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.391103744506836, -16.73643684387207, -16.081768035888672, -15.427101135253906, -14.772433280944824, -14.117765426635742, -13.463098526000977, -12.808430671691895, -12.153762817382812, -11.49909496307373, -10.844427108764648, -10.189760208129883, -9.5350923538208, -8.880424499511719, -8.225757598876953, -7.571089744567871, -6.916421890258789, -6.261754035949707, -5.607086658477783, -4.952419281005859, -4.297751426696777, -3.6430838108062744, -2.9884161949157715, -2.3337488174438477, -1.6790809631347656, -1.0244133472442627, -0.36974573135375977, 0.28492188453674316, 0.9395895004272461, 1.594257116317749, 2.248924732208252, 2.903592109680176, 3.558259963989258, 4.21292781829834, 4.867595195770264, 5.5222625732421875, 6.1769304275512695, 6.831598281860352, 7.486265659332275, 8.1409330368042, 8.795600891113281, 9.450268745422363, 10.104936599731445, 10.759603500366211, 11.414271354675293, 12.068939208984375, 12.72360610961914, 13.378273963928223, 14.032941818237305, 14.687609672546387, 15.342277526855469, 15.996944427490234, 16.651611328125, 17.3062801361084, 17.960947036743164, 18.615615844726562, 19.270282745361328, 19.924949645996094, 20.579618453979492, 21.234285354614258, 21.888954162597656, 22.543621063232422, 23.198287963867188, 23.852954864501953, 24.50762367248535]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 5.0, 12.0, 12.0, 11.0, 10.0, 12.0, 17.0, 21.0, 23.0, 17.0, 28.0, 35.0, 36.0, 39.0, 26.0, 43.0, 46.0, 33.0, 42.0, 32.0, 43.0, 43.0, 28.0, 37.0, 45.0, 46.0, 34.0, 36.0, 25.0, 22.0, 28.0, 19.0, 21.0, 12.0, 15.0, 13.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.653776168823242, -18.978042602539062, -18.30230712890625, -17.62657356262207, -16.95083999633789, -16.27510643005371, -15.599371910095215, -14.923637390136719, -14.247903823852539, -13.57217025756836, -12.896435737609863, -12.220701217651367, -11.544967651367188, -10.869234085083008, -10.193499565124512, -9.517765045166016, -8.842031478881836, -8.166297912597656, -7.49056339263916, -6.814829349517822, -6.139095306396484, -5.4633612632751465, -4.787627220153809, -4.111893177032471, -3.436159133911133, -2.760425090789795, -2.084691047668457, -1.4089570045471191, -0.7332229614257812, -0.05748891830444336, 0.6182451248168945, 1.2939791679382324, 1.9697151184082031, 2.645449161529541, 3.321183204650879, 3.996917247772217, 4.672651290893555, 5.348385334014893, 6.0241193771362305, 6.699853420257568, 7.375587463378906, 8.051321029663086, 8.727055549621582, 9.402790069580078, 10.078523635864258, 10.754257202148438, 11.429991722106934, 12.10572624206543, 12.78145980834961, 13.457193374633789, 14.132927894592285, 14.808662414550781, 15.484395980834961, 16.16012954711914, 16.835865020751953, 17.511598587036133, 18.187332153320312, 18.863065719604492, 19.538799285888672, 20.214534759521484, 20.890268325805664, 21.566001892089844, 22.241737365722656, 22.917470932006836, 23.593204498291016]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 4.0, 3.0, 8.0, 17.0, 26.0, 32.0, 48.0, 84.0, 106.0, 167.0, 208.0, 331.0, 463.0, 693.0, 990.0, 1431.0, 2159.0, 3156.0, 4638.0, 6816.0, 10047.0, 15383.0, 22235.0, 33401.0, 49836.0, 74654.0, 107590.0, 149401.0, 163078.0, 127550.0, 89593.0, 60281.0, 40792.0, 27121.0, 18195.0, 12147.0, 8459.0, 5603.0, 3713.0, 2549.0, 1827.0, 1150.0, 807.0, 538.0, 390.0, 256.0, 187.0, 131.0, 92.0, 61.0, 41.0, 23.0, 16.0, 23.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0], "bins": [-2.375, -2.30133056640625, -2.2276611328125, -2.15399169921875, -2.080322265625, -2.00665283203125, -1.9329833984375, -1.85931396484375, -1.78564453125, -1.71197509765625, -1.6383056640625, -1.56463623046875, -1.490966796875, -1.41729736328125, -1.3436279296875, -1.26995849609375, -1.1962890625, -1.12261962890625, -1.0489501953125, -0.97528076171875, -0.901611328125, -0.82794189453125, -0.7542724609375, -0.68060302734375, -0.60693359375, -0.53326416015625, -0.4595947265625, -0.38592529296875, -0.312255859375, -0.23858642578125, -0.1649169921875, -0.09124755859375, -0.017578125, 0.05609130859375, 0.1297607421875, 0.20343017578125, 0.277099609375, 0.35076904296875, 0.4244384765625, 0.49810791015625, 0.57177734375, 0.64544677734375, 0.7191162109375, 0.79278564453125, 0.866455078125, 0.94012451171875, 1.0137939453125, 1.08746337890625, 1.1611328125, 1.23480224609375, 1.3084716796875, 1.38214111328125, 1.455810546875, 1.52947998046875, 1.6031494140625, 1.67681884765625, 1.75048828125, 1.82415771484375, 1.8978271484375, 1.97149658203125, 2.045166015625, 2.11883544921875, 2.1925048828125, 2.26617431640625, 2.33984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 3.0, 4.0, 8.0, 8.0, 12.0, 10.0, 15.0, 18.0, 10.0, 17.0, 25.0, 27.0, 39.0, 34.0, 37.0, 46.0, 32.0, 38.0, 44.0, 50.0, 48.0, 45.0, 42.0, 30.0, 51.0, 48.0, 40.0, 34.0, 34.0, 27.0, 31.0, 17.0, 18.0, 11.0, 14.0, 14.0, 5.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.21875, -20.466796875, -19.71484375, -18.962890625, -18.2109375, -17.458984375, -16.70703125, -15.955078125, -15.203125, -14.451171875, -13.69921875, -12.947265625, -12.1953125, -11.443359375, -10.69140625, -9.939453125, -9.1875, -8.435546875, -7.68359375, -6.931640625, -6.1796875, -5.427734375, -4.67578125, -3.923828125, -3.171875, -2.419921875, -1.66796875, -0.916015625, -0.1640625, 0.587890625, 1.33984375, 2.091796875, 2.84375, 3.595703125, 4.34765625, 5.099609375, 5.8515625, 6.603515625, 7.35546875, 8.107421875, 8.859375, 9.611328125, 10.36328125, 11.115234375, 11.8671875, 12.619140625, 13.37109375, 14.123046875, 14.875, 15.626953125, 16.37890625, 17.130859375, 17.8828125, 18.634765625, 19.38671875, 20.138671875, 20.890625, 21.642578125, 22.39453125, 23.146484375, 23.8984375, 24.650390625, 25.40234375, 26.154296875, 26.90625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 10.0, 11.0, 12.0, 23.0, 37.0, 66.0, 97.0, 130.0, 186.0, 262.0, 445.0, 603.0, 953.0, 1322.0, 1936.0, 2893.0, 4356.0, 6610.0, 10519.0, 16504.0, 26828.0, 44233.0, 74289.0, 121823.0, 185033.0, 198271.0, 135473.0, 83165.0, 50402.0, 29939.0, 18537.0, 11381.0, 7490.0, 4837.0, 3185.0, 2193.0, 1442.0, 979.0, 656.0, 469.0, 320.0, 199.0, 150.0, 90.0, 68.0, 47.0, 20.0, 22.0, 11.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.697265625, -2.61328125, -2.529296875, -2.4453125, -2.361328125, -2.27734375, -2.193359375, -2.109375, -2.025390625, -1.94140625, -1.857421875, -1.7734375, -1.689453125, -1.60546875, -1.521484375, -1.4375, -1.353515625, -1.26953125, -1.185546875, -1.1015625, -1.017578125, -0.93359375, -0.849609375, -0.765625, -0.681640625, -0.59765625, -0.513671875, -0.4296875, -0.345703125, -0.26171875, -0.177734375, -0.09375, -0.009765625, 0.07421875, 0.158203125, 0.2421875, 0.326171875, 0.41015625, 0.494140625, 0.578125, 0.662109375, 0.74609375, 0.830078125, 0.9140625, 0.998046875, 1.08203125, 1.166015625, 1.25, 1.333984375, 1.41796875, 1.501953125, 1.5859375, 1.669921875, 1.75390625, 1.837890625, 1.921875, 2.005859375, 2.08984375, 2.173828125, 2.2578125, 2.341796875, 2.42578125, 2.509765625, 2.59375, 2.677734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 9.0, 5.0, 6.0, 10.0, 7.0, 17.0, 13.0, 20.0, 13.0, 26.0, 26.0, 25.0, 25.0, 33.0, 36.0, 40.0, 36.0, 28.0, 42.0, 49.0, 46.0, 55.0, 43.0, 46.0, 45.0, 36.0, 43.0, 28.0, 21.0, 23.0, 30.0, 28.0, 19.0, 20.0, 10.0, 8.0, 12.0, 5.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-15.3515625, -14.8994140625, -14.447265625, -13.9951171875, -13.54296875, -13.0908203125, -12.638671875, -12.1865234375, -11.734375, -11.2822265625, -10.830078125, -10.3779296875, -9.92578125, -9.4736328125, -9.021484375, -8.5693359375, -8.1171875, -7.6650390625, -7.212890625, -6.7607421875, -6.30859375, -5.8564453125, -5.404296875, -4.9521484375, -4.5, -4.0478515625, -3.595703125, -3.1435546875, -2.69140625, -2.2392578125, -1.787109375, -1.3349609375, -0.8828125, -0.4306640625, 0.021484375, 0.4736328125, 0.92578125, 1.3779296875, 1.830078125, 2.2822265625, 2.734375, 3.1865234375, 3.638671875, 4.0908203125, 4.54296875, 4.9951171875, 5.447265625, 5.8994140625, 6.3515625, 6.8037109375, 7.255859375, 7.7080078125, 8.16015625, 8.6123046875, 9.064453125, 9.5166015625, 9.96875, 10.4208984375, 10.873046875, 11.3251953125, 11.77734375, 12.2294921875, 12.681640625, 13.1337890625, 13.5859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 19.0, 19.0, 32.0, 51.0, 65.0, 111.0, 139.0, 227.0, 298.0, 476.0, 713.0, 1032.0, 1389.0, 2007.0, 3028.0, 4337.0, 6568.0, 10057.0, 16017.0, 25545.0, 43926.0, 79489.0, 154201.0, 277444.0, 191564.0, 94850.0, 51952.0, 30283.0, 18328.0, 11559.0, 7368.0, 4834.0, 3358.0, 2207.0, 1518.0, 1101.0, 777.0, 519.0, 362.0, 256.0, 160.0, 116.0, 83.0, 56.0, 29.0, 27.0, 13.0, 11.0, 17.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11810302734375, -0.11424922943115234, -0.11039543151855469, -0.10654163360595703, -0.10268783569335938, -0.09883403778076172, -0.09498023986816406, -0.0911264419555664, -0.08727264404296875, -0.0834188461303711, -0.07956504821777344, -0.07571125030517578, -0.07185745239257812, -0.06800365447998047, -0.06414985656738281, -0.060296058654785156, -0.0564422607421875, -0.052588462829589844, -0.04873466491699219, -0.04488086700439453, -0.041027069091796875, -0.03717327117919922, -0.03331947326660156, -0.029465675354003906, -0.02561187744140625, -0.021758079528808594, -0.017904281616210938, -0.014050483703613281, -0.010196685791015625, -0.006342887878417969, -0.0024890899658203125, 0.0013647079467773438, 0.005218505859375, 0.009072303771972656, 0.012926101684570312, 0.01677989959716797, 0.020633697509765625, 0.02448749542236328, 0.028341293334960938, 0.032195091247558594, 0.03604888916015625, 0.039902687072753906, 0.04375648498535156, 0.04761028289794922, 0.051464080810546875, 0.05531787872314453, 0.05917167663574219, 0.06302547454833984, 0.0668792724609375, 0.07073307037353516, 0.07458686828613281, 0.07844066619873047, 0.08229446411132812, 0.08614826202392578, 0.09000205993652344, 0.0938558578491211, 0.09770965576171875, 0.1015634536743164, 0.10541725158691406, 0.10927104949951172, 0.11312484741210938, 0.11697864532470703, 0.12083244323730469, 0.12468624114990234, 0.1285400390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 6.0, 10.0, 8.0, 12.0, 10.0, 11.0, 17.0, 22.0, 24.0, 32.0, 32.0, 34.0, 46.0, 45.0, 49.0, 43.0, 57.0, 30.0, 44.0, 48.0, 51.0, 33.0, 35.0, 37.0, 27.0, 36.0, 35.0, 23.0, 28.0, 27.0, 17.0, 14.0, 13.0, 8.0, 9.0, 7.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9609928131103516e-05, -1.8880702555179596e-05, -1.8151476979255676e-05, -1.7422251403331757e-05, -1.6693025827407837e-05, -1.5963800251483917e-05, -1.5234574675559998e-05, -1.4505349099636078e-05, -1.3776123523712158e-05, -1.3046897947788239e-05, -1.2317672371864319e-05, -1.15884467959404e-05, -1.085922122001648e-05, -1.012999564409256e-05, -9.40077006816864e-06, -8.67154449224472e-06, -7.9423189163208e-06, -7.213093340396881e-06, -6.4838677644729614e-06, -5.754642188549042e-06, -5.025416612625122e-06, -4.296191036701202e-06, -3.5669654607772827e-06, -2.837739884853363e-06, -2.1085143089294434e-06, -1.3792887330055237e-06, -6.50063157081604e-07, 7.916241884231567e-08, 8.083879947662354e-07, 1.537613570690155e-06, 2.2668391466140747e-06, 2.9960647225379944e-06, 3.725290298461914e-06, 4.454515874385834e-06, 5.183741450309753e-06, 5.912967026233673e-06, 6.642192602157593e-06, 7.3714181780815125e-06, 8.100643754005432e-06, 8.829869329929352e-06, 9.559094905853271e-06, 1.0288320481777191e-05, 1.101754605770111e-05, 1.174677163362503e-05, 1.247599720954895e-05, 1.320522278547287e-05, 1.393444836139679e-05, 1.466367393732071e-05, 1.539289951324463e-05, 1.612212508916855e-05, 1.6851350665092468e-05, 1.7580576241016388e-05, 1.8309801816940308e-05, 1.9039027392864227e-05, 1.9768252968788147e-05, 2.0497478544712067e-05, 2.1226704120635986e-05, 2.1955929696559906e-05, 2.2685155272483826e-05, 2.3414380848407745e-05, 2.4143606424331665e-05, 2.4872832000255585e-05, 2.5602057576179504e-05, 2.6331283152103424e-05, 2.7060508728027344e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 7.0, 15.0, 25.0, 32.0, 46.0, 67.0, 106.0, 154.0, 229.0, 324.0, 496.0, 804.0, 1333.0, 2028.0, 3080.0, 4841.0, 7854.0, 12327.0, 19440.0, 31695.0, 52558.0, 91879.0, 174781.0, 278941.0, 155076.0, 82982.0, 48384.0, 29294.0, 18198.0, 11540.0, 7210.0, 4637.0, 2947.0, 1823.0, 1179.0, 775.0, 512.0, 304.0, 225.0, 137.0, 81.0, 63.0, 42.0, 28.0, 19.0, 12.0, 11.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.277099609375, -0.2679901123046875, -0.258880615234375, -0.2497711181640625, -0.24066162109375, -0.2315521240234375, -0.222442626953125, -0.2133331298828125, -0.2042236328125, -0.1951141357421875, -0.186004638671875, -0.1768951416015625, -0.16778564453125, -0.1586761474609375, -0.149566650390625, -0.1404571533203125, -0.13134765625, -0.1222381591796875, -0.113128662109375, -0.1040191650390625, -0.09490966796875, -0.0858001708984375, -0.076690673828125, -0.0675811767578125, -0.0584716796875, -0.0493621826171875, -0.040252685546875, -0.0311431884765625, -0.02203369140625, -0.0129241943359375, -0.003814697265625, 0.0052947998046875, 0.014404296875, 0.0235137939453125, 0.032623291015625, 0.0417327880859375, 0.05084228515625, 0.0599517822265625, 0.069061279296875, 0.0781707763671875, 0.0872802734375, 0.0963897705078125, 0.105499267578125, 0.1146087646484375, 0.12371826171875, 0.1328277587890625, 0.141937255859375, 0.1510467529296875, 0.16015625, 0.1692657470703125, 0.178375244140625, 0.1874847412109375, 0.19659423828125, 0.2057037353515625, 0.214813232421875, 0.2239227294921875, 0.2330322265625, 0.2421417236328125, 0.251251220703125, 0.2603607177734375, 0.26947021484375, 0.2785797119140625, 0.287689208984375, 0.2967987060546875, 0.305908203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 1.0, 2.0, 5.0, 6.0, 4.0, 3.0, 10.0, 11.0, 12.0, 15.0, 23.0, 19.0, 34.0, 29.0, 36.0, 58.0, 54.0, 56.0, 60.0, 71.0, 47.0, 79.0, 58.0, 45.0, 48.0, 36.0, 27.0, 18.0, 23.0, 14.0, 16.0, 16.0, 5.0, 13.0, 10.0, 8.0, 2.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2027587890625, -0.19663238525390625, -0.1905059814453125, -0.18437957763671875, -0.178253173828125, -0.17212677001953125, -0.1660003662109375, -0.15987396240234375, -0.15374755859375, -0.14762115478515625, -0.1414947509765625, -0.13536834716796875, -0.129241943359375, -0.12311553955078125, -0.1169891357421875, -0.11086273193359375, -0.104736328125, -0.09860992431640625, -0.0924835205078125, -0.08635711669921875, -0.080230712890625, -0.07410430908203125, -0.0679779052734375, -0.06185150146484375, -0.05572509765625, -0.04959869384765625, -0.0434722900390625, -0.03734588623046875, -0.031219482421875, -0.02509307861328125, -0.0189666748046875, -0.01284027099609375, -0.0067138671875, -0.00058746337890625, 0.0055389404296875, 0.01166534423828125, 0.017791748046875, 0.02391815185546875, 0.0300445556640625, 0.03617095947265625, 0.04229736328125, 0.04842376708984375, 0.0545501708984375, 0.06067657470703125, 0.066802978515625, 0.07292938232421875, 0.0790557861328125, 0.08518218994140625, 0.09130859375, 0.09743499755859375, 0.1035614013671875, 0.10968780517578125, 0.115814208984375, 0.12194061279296875, 0.1280670166015625, 0.13419342041015625, 0.14031982421875, 0.14644622802734375, 0.1525726318359375, 0.15869903564453125, 0.164825439453125, 0.17095184326171875, 0.1770782470703125, 0.18320465087890625, 0.1893310546875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 2.0, 14.0, 11.0, 16.0, 14.0, 17.0, 31.0, 29.0, 24.0, 26.0, 36.0, 46.0, 62.0, 63.0, 62.0, 49.0, 59.0, 56.0, 47.0, 49.0, 40.0, 33.0, 27.0, 35.0, 37.0, 26.0, 13.0, 16.0, 8.0, 13.0, 10.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.597570419311523, -16.947839736938477, -16.298107147216797, -15.64837646484375, -14.998645782470703, -14.348915100097656, -13.699183464050293, -13.04945182800293, -12.399721145629883, -11.749990463256836, -11.100258827209473, -10.45052719116211, -9.800796508789062, -9.151065826416016, -8.501334190368652, -7.851603031158447, -7.201871871948242, -6.552140712738037, -5.902409553527832, -5.252678394317627, -4.602947235107422, -3.953216075897217, -3.3034849166870117, -2.6537537574768066, -2.0040225982666016, -1.3542914390563965, -0.7045602798461914, -0.05482912063598633, 0.5949020385742188, 1.2446331977844238, 1.894364356994629, 2.544095516204834, 3.193826675415039, 3.843557834625244, 4.493288993835449, 5.143020153045654, 5.792751312255859, 6.4424824714660645, 7.0922136306762695, 7.741944789886475, 8.39167594909668, 9.041406631469727, 9.69113826751709, 10.340869903564453, 10.9906005859375, 11.640331268310547, 12.29006290435791, 12.939794540405273, 13.58952522277832, 14.239255905151367, 14.88898754119873, 15.538719177246094, 16.18844985961914, 16.838180541992188, 17.487911224365234, 18.137643814086914, 18.78737449645996, 19.437105178833008, 20.086837768554688, 20.736568450927734, 21.38629913330078, 22.036029815673828, 22.685760498046875, 23.335493087768555, 23.9852237701416]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 3.0, 6.0, 4.0, 5.0, 12.0, 11.0, 12.0, 10.0, 12.0, 15.0, 21.0, 23.0, 15.0, 32.0, 32.0, 35.0, 39.0, 29.0, 40.0, 46.0, 33.0, 38.0, 40.0, 38.0, 43.0, 29.0, 36.0, 45.0, 48.0, 35.0, 35.0, 25.0, 23.0, 30.0, 16.0, 22.0, 13.0, 14.0, 14.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.7023983001709, -19.03127098083496, -18.360143661499023, -17.689016342163086, -17.01789093017578, -16.346763610839844, -15.675636291503906, -15.004508972167969, -14.333381652832031, -13.662254333496094, -12.991127014160156, -12.320000648498535, -11.648873329162598, -10.97774600982666, -10.306619644165039, -9.635492324829102, -8.964365005493164, -8.293237686157227, -7.622110843658447, -6.950984001159668, -6.2798566818237305, -5.608729362487793, -4.937602519989014, -4.266475677490234, -3.595348358154297, -2.9242212772369385, -2.25309419631958, -1.5819671154022217, -0.9108400344848633, -0.23971295356750488, 0.4314141273498535, 1.1025409698486328, 1.7736663818359375, 2.444793462753296, 3.1159205436706543, 3.7870476245880127, 4.458174705505371, 5.129302024841309, 5.800428867340088, 6.471555709838867, 7.142683029174805, 7.813810348510742, 8.48493766784668, 9.1560640335083, 9.827191352844238, 10.498318672180176, 11.169445037841797, 11.840572357177734, 12.511699676513672, 13.18282699584961, 13.853954315185547, 14.525080680847168, 15.196208000183105, 15.867335319519043, 16.538461685180664, 17.2095890045166, 17.88071632385254, 18.551843643188477, 19.222970962524414, 19.89409828186035, 20.565223693847656, 21.236351013183594, 21.90747833251953, 22.57860565185547, 23.249732971191406]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 11.0, 19.0, 21.0, 33.0, 62.0, 96.0, 114.0, 193.0, 297.0, 489.0, 697.0, 1037.0, 1685.0, 2510.0, 3636.0, 5448.0, 8186.0, 11719.0, 17131.0, 24032.0, 33268.0, 44214.0, 56486.0, 69161.0, 81381.0, 89816.0, 94140.0, 92767.0, 86058.0, 76079.0, 63255.0, 50963.0, 38677.0, 29093.0, 20813.0, 14437.0, 10159.0, 6882.0, 4477.0, 3139.0, 2055.0, 1311.0, 872.0, 552.0, 366.0, 260.0, 174.0, 105.0, 70.0, 40.0, 29.0, 18.0, 9.0, 12.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.87158203125, -9.5400390625, -9.20849609375, -8.876953125, -8.54541015625, -8.2138671875, -7.88232421875, -7.55078125, -7.21923828125, -6.8876953125, -6.55615234375, -6.224609375, -5.89306640625, -5.5615234375, -5.22998046875, -4.8984375, -4.56689453125, -4.2353515625, -3.90380859375, -3.572265625, -3.24072265625, -2.9091796875, -2.57763671875, -2.24609375, -1.91455078125, -1.5830078125, -1.25146484375, -0.919921875, -0.58837890625, -0.2568359375, 0.07470703125, 0.40625, 0.73779296875, 1.0693359375, 1.40087890625, 1.732421875, 2.06396484375, 2.3955078125, 2.72705078125, 3.05859375, 3.39013671875, 3.7216796875, 4.05322265625, 4.384765625, 4.71630859375, 5.0478515625, 5.37939453125, 5.7109375, 6.04248046875, 6.3740234375, 6.70556640625, 7.037109375, 7.36865234375, 7.7001953125, 8.03173828125, 8.36328125, 8.69482421875, 9.0263671875, 9.35791015625, 9.689453125, 10.02099609375, 10.3525390625, 10.68408203125, 11.015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 6.0, 11.0, 6.0, 11.0, 16.0, 11.0, 10.0, 18.0, 21.0, 33.0, 30.0, 33.0, 25.0, 31.0, 33.0, 42.0, 40.0, 42.0, 46.0, 36.0, 44.0, 37.0, 48.0, 41.0, 41.0, 39.0, 36.0, 32.0, 30.0, 21.0, 31.0, 16.0, 18.0, 13.0, 8.0, 15.0, 10.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.96875, -19.2666015625, -18.564453125, -17.8623046875, -17.16015625, -16.4580078125, -15.755859375, -15.0537109375, -14.3515625, -13.6494140625, -12.947265625, -12.2451171875, -11.54296875, -10.8408203125, -10.138671875, -9.4365234375, -8.734375, -8.0322265625, -7.330078125, -6.6279296875, -5.92578125, -5.2236328125, -4.521484375, -3.8193359375, -3.1171875, -2.4150390625, -1.712890625, -1.0107421875, -0.30859375, 0.3935546875, 1.095703125, 1.7978515625, 2.5, 3.2021484375, 3.904296875, 4.6064453125, 5.30859375, 6.0107421875, 6.712890625, 7.4150390625, 8.1171875, 8.8193359375, 9.521484375, 10.2236328125, 10.92578125, 11.6279296875, 12.330078125, 13.0322265625, 13.734375, 14.4365234375, 15.138671875, 15.8408203125, 16.54296875, 17.2451171875, 17.947265625, 18.6494140625, 19.3515625, 20.0537109375, 20.755859375, 21.4580078125, 22.16015625, 22.8623046875, 23.564453125, 24.2666015625, 24.96875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 5.0, 13.0, 11.0, 14.0, 25.0, 47.0, 60.0, 101.0, 162.0, 290.0, 413.0, 664.0, 1065.0, 1746.0, 2694.0, 4240.0, 6452.0, 10136.0, 15128.0, 22585.0, 32309.0, 44710.0, 59785.0, 76515.0, 91959.0, 102172.0, 106156.0, 102578.0, 90686.0, 75383.0, 59514.0, 44631.0, 31594.0, 21980.0, 15002.0, 9832.0, 6478.0, 4163.0, 2787.0, 1631.0, 1053.0, 672.0, 405.0, 261.0, 142.0, 124.0, 58.0, 48.0, 29.0, 22.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.4296875, -11.0546875, -10.6796875, -10.3046875, -9.9296875, -9.5546875, -9.1796875, -8.8046875, -8.4296875, -8.0546875, -7.6796875, -7.3046875, -6.9296875, -6.5546875, -6.1796875, -5.8046875, -5.4296875, -5.0546875, -4.6796875, -4.3046875, -3.9296875, -3.5546875, -3.1796875, -2.8046875, -2.4296875, -2.0546875, -1.6796875, -1.3046875, -0.9296875, -0.5546875, -0.1796875, 0.1953125, 0.5703125, 0.9453125, 1.3203125, 1.6953125, 2.0703125, 2.4453125, 2.8203125, 3.1953125, 3.5703125, 3.9453125, 4.3203125, 4.6953125, 5.0703125, 5.4453125, 5.8203125, 6.1953125, 6.5703125, 6.9453125, 7.3203125, 7.6953125, 8.0703125, 8.4453125, 8.8203125, 9.1953125, 9.5703125, 9.9453125, 10.3203125, 10.6953125, 11.0703125, 11.4453125, 11.8203125, 12.1953125, 12.5703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 8.0, 15.0, 11.0, 12.0, 18.0, 20.0, 19.0, 12.0, 38.0, 30.0, 26.0, 24.0, 28.0, 39.0, 37.0, 35.0, 56.0, 61.0, 36.0, 38.0, 39.0, 48.0, 36.0, 39.0, 41.0, 23.0, 27.0, 16.0, 23.0, 28.0, 21.0, 14.0, 17.0, 14.0, 9.0, 9.0, 8.0, 6.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.4375, -14.0103759765625, -13.583251953125, -13.1561279296875, -12.72900390625, -12.3018798828125, -11.874755859375, -11.4476318359375, -11.0205078125, -10.5933837890625, -10.166259765625, -9.7391357421875, -9.31201171875, -8.8848876953125, -8.457763671875, -8.0306396484375, -7.603515625, -7.1763916015625, -6.749267578125, -6.3221435546875, -5.89501953125, -5.4678955078125, -5.040771484375, -4.6136474609375, -4.1865234375, -3.7593994140625, -3.332275390625, -2.9051513671875, -2.47802734375, -2.0509033203125, -1.623779296875, -1.1966552734375, -0.76953125, -0.3424072265625, 0.084716796875, 0.5118408203125, 0.93896484375, 1.3660888671875, 1.793212890625, 2.2203369140625, 2.6474609375, 3.0745849609375, 3.501708984375, 3.9288330078125, 4.35595703125, 4.7830810546875, 5.210205078125, 5.6373291015625, 6.064453125, 6.4915771484375, 6.918701171875, 7.3458251953125, 7.77294921875, 8.2000732421875, 8.627197265625, 9.0543212890625, 9.4814453125, 9.9085693359375, 10.335693359375, 10.7628173828125, 11.18994140625, 11.6170654296875, 12.044189453125, 12.4713134765625, 12.8984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 16.0, 29.0, 42.0, 52.0, 75.0, 122.0, 191.0, 342.0, 534.0, 800.0, 1353.0, 2161.0, 3532.0, 5730.0, 9421.0, 15118.0, 23927.0, 36197.0, 53478.0, 74127.0, 95623.0, 113529.0, 121854.0, 118506.0, 104404.0, 83998.0, 62255.0, 43320.0, 29220.0, 18432.0, 11658.0, 7060.0, 4402.0, 2623.0, 1632.0, 1081.0, 653.0, 374.0, 228.0, 171.0, 109.0, 63.0, 44.0, 23.0, 17.0, 16.0, 2.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.9459228515625, -3.821533203125, -3.6971435546875, -3.57275390625, -3.4483642578125, -3.323974609375, -3.1995849609375, -3.0751953125, -2.9508056640625, -2.826416015625, -2.7020263671875, -2.57763671875, -2.4532470703125, -2.328857421875, -2.2044677734375, -2.080078125, -1.9556884765625, -1.831298828125, -1.7069091796875, -1.58251953125, -1.4581298828125, -1.333740234375, -1.2093505859375, -1.0849609375, -0.9605712890625, -0.836181640625, -0.7117919921875, -0.58740234375, -0.4630126953125, -0.338623046875, -0.2142333984375, -0.08984375, 0.0345458984375, 0.158935546875, 0.2833251953125, 0.40771484375, 0.5321044921875, 0.656494140625, 0.7808837890625, 0.9052734375, 1.0296630859375, 1.154052734375, 1.2784423828125, 1.40283203125, 1.5272216796875, 1.651611328125, 1.7760009765625, 1.900390625, 2.0247802734375, 2.149169921875, 2.2735595703125, 2.39794921875, 2.5223388671875, 2.646728515625, 2.7711181640625, 2.8955078125, 3.0198974609375, 3.144287109375, 3.2686767578125, 3.39306640625, 3.5174560546875, 3.641845703125, 3.7662353515625, 3.890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 11.0, 11.0, 18.0, 18.0, 21.0, 14.0, 18.0, 16.0, 34.0, 37.0, 25.0, 27.0, 34.0, 29.0, 33.0, 40.0, 34.0, 44.0, 44.0, 30.0, 36.0, 33.0, 34.0, 45.0, 30.0, 36.0, 29.0, 31.0, 30.0, 21.0, 16.0, 15.0, 11.0, 14.0, 12.0, 9.0, 9.0, 9.0, 5.0, 11.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00035834312438964844, -0.00034697726368904114, -0.00033561140298843384, -0.00032424554228782654, -0.00031287968158721924, -0.00030151382088661194, -0.00029014796018600464, -0.00027878209948539734, -0.00026741623878479004, -0.00025605037808418274, -0.00024468451738357544, -0.00023331865668296814, -0.00022195279598236084, -0.00021058693528175354, -0.00019922107458114624, -0.00018785521388053894, -0.00017648935317993164, -0.00016512349247932434, -0.00015375763177871704, -0.00014239177107810974, -0.00013102591037750244, -0.00011966004967689514, -0.00010829418897628784, -9.692832827568054e-05, -8.556246757507324e-05, -7.419660687446594e-05, -6.283074617385864e-05, -5.146488547325134e-05, -4.009902477264404e-05, -2.8733164072036743e-05, -1.7367303371429443e-05, -6.0014426708221436e-06, 5.364418029785156e-06, 1.6730278730392456e-05, 2.8096139430999756e-05, 3.9462000131607056e-05, 5.0827860832214355e-05, 6.219372153282166e-05, 7.355958223342896e-05, 8.492544293403625e-05, 9.629130363464355e-05, 0.00010765716433525085, 0.00011902302503585815, 0.00013038888573646545, 0.00014175474643707275, 0.00015312060713768005, 0.00016448646783828735, 0.00017585232853889465, 0.00018721818923950195, 0.00019858404994010925, 0.00020994991064071655, 0.00022131577134132385, 0.00023268163204193115, 0.00024404749274253845, 0.00025541335344314575, 0.00026677921414375305, 0.00027814507484436035, 0.00028951093554496765, 0.00030087679624557495, 0.00031224265694618225, 0.00032360851764678955, 0.00033497437834739685, 0.00034634023904800415, 0.00035770609974861145, 0.00036907196044921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 7.0, 8.0, 11.0, 16.0, 31.0, 38.0, 60.0, 99.0, 188.0, 278.0, 509.0, 747.0, 1299.0, 2258.0, 3480.0, 5880.0, 9471.0, 15621.0, 24944.0, 39148.0, 57979.0, 81350.0, 105684.0, 123655.0, 129844.0, 121090.0, 100797.0, 76097.0, 53569.0, 35221.0, 22827.0, 14195.0, 8670.0, 5373.0, 3183.0, 1941.0, 1172.0, 705.0, 387.0, 269.0, 165.0, 122.0, 54.0, 34.0, 31.0, 21.0, 10.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0], "bins": [-4.76953125, -4.630859375, -4.4921875, -4.353515625, -4.21484375, -4.076171875, -3.9375, -3.798828125, -3.66015625, -3.521484375, -3.3828125, -3.244140625, -3.10546875, -2.966796875, -2.828125, -2.689453125, -2.55078125, -2.412109375, -2.2734375, -2.134765625, -1.99609375, -1.857421875, -1.71875, -1.580078125, -1.44140625, -1.302734375, -1.1640625, -1.025390625, -0.88671875, -0.748046875, -0.609375, -0.470703125, -0.33203125, -0.193359375, -0.0546875, 0.083984375, 0.22265625, 0.361328125, 0.5, 0.638671875, 0.77734375, 0.916015625, 1.0546875, 1.193359375, 1.33203125, 1.470703125, 1.609375, 1.748046875, 1.88671875, 2.025390625, 2.1640625, 2.302734375, 2.44140625, 2.580078125, 2.71875, 2.857421875, 2.99609375, 3.134765625, 3.2734375, 3.412109375, 3.55078125, 3.689453125, 3.828125, 3.966796875, 4.10546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 5.0, 3.0, 3.0, 5.0, 9.0, 14.0, 15.0, 22.0, 24.0, 27.0, 30.0, 32.0, 37.0, 37.0, 45.0, 50.0, 48.0, 56.0, 50.0, 57.0, 50.0, 48.0, 45.0, 38.0, 45.0, 32.0, 32.0, 20.0, 25.0, 13.0, 19.0, 13.0, 7.0, 8.0, 8.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-2.533203125, -2.46221923828125, -2.3912353515625, -2.32025146484375, -2.249267578125, -2.17828369140625, -2.1072998046875, -2.03631591796875, -1.96533203125, -1.89434814453125, -1.8233642578125, -1.75238037109375, -1.681396484375, -1.61041259765625, -1.5394287109375, -1.46844482421875, -1.3974609375, -1.32647705078125, -1.2554931640625, -1.18450927734375, -1.113525390625, -1.04254150390625, -0.9715576171875, -0.90057373046875, -0.82958984375, -0.75860595703125, -0.6876220703125, -0.61663818359375, -0.545654296875, -0.47467041015625, -0.4036865234375, -0.33270263671875, -0.26171875, -0.19073486328125, -0.1197509765625, -0.04876708984375, 0.022216796875, 0.09320068359375, 0.1641845703125, 0.23516845703125, 0.30615234375, 0.37713623046875, 0.4481201171875, 0.51910400390625, 0.590087890625, 0.66107177734375, 0.7320556640625, 0.80303955078125, 0.8740234375, 0.94500732421875, 1.0159912109375, 1.08697509765625, 1.157958984375, 1.22894287109375, 1.2999267578125, 1.37091064453125, 1.44189453125, 1.51287841796875, 1.5838623046875, 1.65484619140625, 1.725830078125, 1.79681396484375, 1.8677978515625, 1.93878173828125, 2.009765625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 7.0, 8.0, 16.0, 20.0, 18.0, 16.0, 22.0, 28.0, 28.0, 22.0, 40.0, 46.0, 60.0, 56.0, 70.0, 55.0, 45.0, 57.0, 44.0, 43.0, 36.0, 47.0, 38.0, 32.0, 16.0, 18.0, 19.0, 13.0, 12.0, 9.0, 12.0, 6.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.87759780883789, -17.261014938354492, -16.644432067871094, -16.027851104736328, -15.41126823425293, -14.794685363769531, -14.17810344696045, -13.561521530151367, -12.944938659667969, -12.32835578918457, -11.711773872375488, -11.095191955566406, -10.478609085083008, -9.86202621459961, -9.245444297790527, -8.628862380981445, -8.012279510498047, -7.395697116851807, -6.779114723205566, -6.162532329559326, -5.545949935913086, -4.929367542266846, -4.3127851486206055, -3.6962027549743652, -3.079620361328125, -2.4630379676818848, -1.8464555740356445, -1.2298731803894043, -0.6132907867431641, 0.003291606903076172, 0.6198740005493164, 1.2364563941955566, 1.853036880493164, 2.4696192741394043, 3.0862016677856445, 3.7027840614318848, 4.319366455078125, 4.935948848724365, 5.5525312423706055, 6.169113636016846, 6.785696029663086, 7.402278423309326, 8.018860816955566, 8.635442733764648, 9.252025604248047, 9.868608474731445, 10.485190391540527, 11.10177230834961, 11.718355178833008, 12.334938049316406, 12.951519966125488, 13.56810188293457, 14.184684753417969, 14.801267623901367, 15.41784954071045, 16.03443145751953, 16.65101432800293, 17.267597198486328, 17.884178161621094, 18.500761032104492, 19.11734390258789, 19.73392677307129, 20.350509643554688, 20.967090606689453, 21.58367347717285]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 10.0, 4.0, 10.0, 5.0, 9.0, 17.0, 14.0, 16.0, 24.0, 28.0, 19.0, 40.0, 35.0, 32.0, 37.0, 35.0, 44.0, 46.0, 37.0, 45.0, 49.0, 43.0, 44.0, 45.0, 37.0, 51.0, 25.0, 35.0, 25.0, 33.0, 23.0, 10.0, 20.0, 13.0, 13.0, 4.0, 10.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.188093185424805, -20.439037322998047, -19.689983367919922, -18.940929412841797, -18.19187355041504, -17.44281768798828, -16.693763732910156, -15.944708824157715, -15.195653915405273, -14.446599006652832, -13.69754409790039, -12.94848918914795, -12.199434280395508, -11.450379371643066, -10.701324462890625, -9.952269554138184, -9.203214645385742, -8.4541597366333, -7.705104827880859, -6.956049919128418, -6.206995010375977, -5.457940101623535, -4.708885192871094, -3.9598302841186523, -3.210775375366211, -2.4617204666137695, -1.7126655578613281, -0.9636106491088867, -0.2145557403564453, 0.5344991683959961, 1.2835540771484375, 2.032608985900879, 2.7816638946533203, 3.5307188034057617, 4.279773712158203, 5.0288286209106445, 5.777883529663086, 6.526938438415527, 7.275993347167969, 8.02504825592041, 8.774103164672852, 9.523158073425293, 10.272212982177734, 11.021267890930176, 11.770322799682617, 12.519377708435059, 13.2684326171875, 14.017487525939941, 14.766542434692383, 15.515597343444824, 16.264652252197266, 17.01370620727539, 17.76276206970215, 18.511817932128906, 19.26087188720703, 20.009925842285156, 20.758981704711914, 21.508037567138672, 22.257091522216797, 23.006145477294922, 23.75520133972168, 24.504257202148438, 25.253311157226562, 26.002365112304688, 26.751420974731445]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 21.0, 43.0, 88.0, 141.0, 221.0, 392.0, 677.0, 1208.0, 2004.0, 3428.0, 5857.0, 9886.0, 16433.0, 26843.0, 44531.0, 71433.0, 111984.0, 170088.0, 246885.0, 335215.0, 422519.0, 483200.0, 498440.0, 461718.0, 387230.0, 296850.0, 213058.0, 143953.0, 92761.0, 58143.0, 35848.0, 21844.0, 12836.0, 7564.0, 4523.0, 2692.0, 1519.0, 908.0, 550.0, 283.0, 198.0, 99.0, 50.0, 42.0, 38.0, 16.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.078125, -12.61572265625, -12.1533203125, -11.69091796875, -11.228515625, -10.76611328125, -10.3037109375, -9.84130859375, -9.37890625, -8.91650390625, -8.4541015625, -7.99169921875, -7.529296875, -7.06689453125, -6.6044921875, -6.14208984375, -5.6796875, -5.21728515625, -4.7548828125, -4.29248046875, -3.830078125, -3.36767578125, -2.9052734375, -2.44287109375, -1.98046875, -1.51806640625, -1.0556640625, -0.59326171875, -0.130859375, 0.33154296875, 0.7939453125, 1.25634765625, 1.71875, 2.18115234375, 2.6435546875, 3.10595703125, 3.568359375, 4.03076171875, 4.4931640625, 4.95556640625, 5.41796875, 5.88037109375, 6.3427734375, 6.80517578125, 7.267578125, 7.72998046875, 8.1923828125, 8.65478515625, 9.1171875, 9.57958984375, 10.0419921875, 10.50439453125, 10.966796875, 11.42919921875, 11.8916015625, 12.35400390625, 12.81640625, 13.27880859375, 13.7412109375, 14.20361328125, 14.666015625, 15.12841796875, 15.5908203125, 16.05322265625, 16.515625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 7.0, 2.0, 2.0, 8.0, 10.0, 12.0, 14.0, 10.0, 20.0, 10.0, 23.0, 26.0, 25.0, 30.0, 29.0, 25.0, 48.0, 36.0, 40.0, 46.0, 29.0, 42.0, 38.0, 47.0, 45.0, 47.0, 47.0, 38.0, 28.0, 28.0, 28.0, 23.0, 28.0, 18.0, 21.0, 16.0, 16.0, 14.0, 6.0, 6.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.42919921875, -14.8740234375, -14.31884765625, -13.763671875, -13.20849609375, -12.6533203125, -12.09814453125, -11.54296875, -10.98779296875, -10.4326171875, -9.87744140625, -9.322265625, -8.76708984375, -8.2119140625, -7.65673828125, -7.1015625, -6.54638671875, -5.9912109375, -5.43603515625, -4.880859375, -4.32568359375, -3.7705078125, -3.21533203125, -2.66015625, -2.10498046875, -1.5498046875, -0.99462890625, -0.439453125, 0.11572265625, 0.6708984375, 1.22607421875, 1.78125, 2.33642578125, 2.8916015625, 3.44677734375, 4.001953125, 4.55712890625, 5.1123046875, 5.66748046875, 6.22265625, 6.77783203125, 7.3330078125, 7.88818359375, 8.443359375, 8.99853515625, 9.5537109375, 10.10888671875, 10.6640625, 11.21923828125, 11.7744140625, 12.32958984375, 12.884765625, 13.43994140625, 13.9951171875, 14.55029296875, 15.10546875, 15.66064453125, 16.2158203125, 16.77099609375, 17.326171875, 17.88134765625, 18.4365234375, 18.99169921875, 19.546875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 19.0, 22.0, 39.0, 82.0, 139.0, 228.0, 371.0, 638.0, 1051.0, 1935.0, 3169.0, 5239.0, 8793.0, 14568.0, 23535.0, 37055.0, 56486.0, 85766.0, 125699.0, 176328.0, 234622.0, 297052.0, 353579.0, 396352.0, 415716.0, 405658.0, 370512.0, 316642.0, 254329.0, 193064.0, 140389.0, 97281.0, 65276.0, 42497.0, 27260.0, 17028.0, 10357.0, 6312.0, 3719.0, 2229.0, 1316.0, 811.0, 420.0, 300.0, 183.0, 93.0, 58.0, 38.0, 9.0, 9.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.3472900390625, -11.944580078125, -11.5418701171875, -11.13916015625, -10.7364501953125, -10.333740234375, -9.9310302734375, -9.5283203125, -9.1256103515625, -8.722900390625, -8.3201904296875, -7.91748046875, -7.5147705078125, -7.112060546875, -6.7093505859375, -6.306640625, -5.9039306640625, -5.501220703125, -5.0985107421875, -4.69580078125, -4.2930908203125, -3.890380859375, -3.4876708984375, -3.0849609375, -2.6822509765625, -2.279541015625, -1.8768310546875, -1.47412109375, -1.0714111328125, -0.668701171875, -0.2659912109375, 0.13671875, 0.5394287109375, 0.942138671875, 1.3448486328125, 1.74755859375, 2.1502685546875, 2.552978515625, 2.9556884765625, 3.3583984375, 3.7611083984375, 4.163818359375, 4.5665283203125, 4.96923828125, 5.3719482421875, 5.774658203125, 6.1773681640625, 6.580078125, 6.9827880859375, 7.385498046875, 7.7882080078125, 8.19091796875, 8.5936279296875, 8.996337890625, 9.3990478515625, 9.8017578125, 10.2044677734375, 10.607177734375, 11.0098876953125, 11.41259765625, 11.8153076171875, 12.218017578125, 12.6207275390625, 13.0234375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 6.0, 15.0, 10.0, 13.0, 10.0, 23.0, 32.0, 32.0, 39.0, 62.0, 85.0, 66.0, 99.0, 97.0, 104.0, 129.0, 158.0, 170.0, 186.0, 167.0, 208.0, 195.0, 202.0, 194.0, 205.0, 171.0, 177.0, 173.0, 150.0, 135.0, 105.0, 102.0, 89.0, 88.0, 80.0, 59.0, 49.0, 39.0, 39.0, 27.0, 19.0, 21.0, 12.0, 7.0, 13.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.403564453125, -7.16259765625, -6.921630859375, -6.6806640625, -6.439697265625, -6.19873046875, -5.957763671875, -5.716796875, -5.475830078125, -5.23486328125, -4.993896484375, -4.7529296875, -4.511962890625, -4.27099609375, -4.030029296875, -3.7890625, -3.548095703125, -3.30712890625, -3.066162109375, -2.8251953125, -2.584228515625, -2.34326171875, -2.102294921875, -1.861328125, -1.620361328125, -1.37939453125, -1.138427734375, -0.8974609375, -0.656494140625, -0.41552734375, -0.174560546875, 0.06640625, 0.307373046875, 0.54833984375, 0.789306640625, 1.0302734375, 1.271240234375, 1.51220703125, 1.753173828125, 1.994140625, 2.235107421875, 2.47607421875, 2.717041015625, 2.9580078125, 3.198974609375, 3.43994140625, 3.680908203125, 3.921875, 4.162841796875, 4.40380859375, 4.644775390625, 4.8857421875, 5.126708984375, 5.36767578125, 5.608642578125, 5.849609375, 6.090576171875, 6.33154296875, 6.572509765625, 6.8134765625, 7.054443359375, 7.29541015625, 7.536376953125, 7.77734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 9.0, 7.0, 20.0, 19.0, 28.0, 28.0, 38.0, 44.0, 30.0, 50.0, 49.0, 63.0, 71.0, 71.0, 71.0, 69.0, 54.0, 45.0, 40.0, 37.0, 38.0, 28.0, 17.0, 23.0, 12.0, 11.0, 10.0, 1.0, 4.0, 6.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.934795379638672, -19.184358596801758, -18.433923721313477, -17.683486938476562, -16.93305206298828, -16.182615280151367, -15.432178497314453, -14.681742668151855, -13.931306838989258, -13.18087100982666, -12.430435180664062, -11.679998397827148, -10.92956256866455, -10.179126739501953, -9.428689956665039, -8.678254127502441, -7.927818298339844, -7.177382469177246, -6.42694616317749, -5.676509857177734, -4.926074028015137, -4.175638198852539, -3.425201892852783, -2.6747655868530273, -1.9243297576904297, -1.173893690109253, -0.42345762252807617, 0.3269784450531006, 1.0774145126342773, 1.827850580215454, 2.578286647796631, 3.3287229537963867, 4.079156875610352, 4.829592704772949, 5.580029010772705, 6.330465316772461, 7.080901145935059, 7.831336975097656, 8.58177375793457, 9.332209587097168, 10.082645416259766, 10.833081245422363, 11.583517074584961, 12.333953857421875, 13.084389686584473, 13.83482551574707, 14.585262298583984, 15.335698127746582, 16.08613395690918, 16.836570739746094, 17.587005615234375, 18.33744239807129, 19.087879180908203, 19.838314056396484, 20.5887508392334, 21.339187622070312, 22.089622497558594, 22.840059280395508, 23.59049415588379, 24.340930938720703, 25.091365814208984, 25.8418025970459, 26.592239379882812, 27.342674255371094, 28.093111038208008]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 6.0, 6.0, 6.0, 8.0, 16.0, 18.0, 12.0, 13.0, 17.0, 31.0, 31.0, 28.0, 28.0, 40.0, 32.0, 44.0, 34.0, 34.0, 23.0, 44.0, 43.0, 39.0, 54.0, 43.0, 37.0, 42.0, 35.0, 28.0, 29.0, 33.0, 21.0, 20.0, 22.0, 19.0, 9.0, 10.0, 13.0, 7.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.133386611938477, -19.46126937866211, -18.78915023803711, -18.117033004760742, -17.444915771484375, -16.772796630859375, -16.100679397583008, -15.42856216430664, -14.756443977355957, -14.084325790405273, -13.412208557128906, -12.740090370178223, -12.067972183227539, -11.395854949951172, -10.723736763000488, -10.051618576049805, -9.379501342773438, -8.707383155822754, -8.035265922546387, -7.363147735595703, -6.691030025482178, -6.018912315368652, -5.346794128417969, -4.674676418304443, -4.002558708190918, -3.3304409980773926, -2.658323049545288, -1.9862051010131836, -1.3140873908996582, -0.6419696807861328, 0.03014850616455078, 0.7022662162780762, 1.3743839263916016, 2.046501636505127, 2.7186195850372314, 3.390737533569336, 4.062855243682861, 4.734972953796387, 5.40709114074707, 6.079208850860596, 6.751326560974121, 7.4234442710876465, 8.095561981201172, 8.767680168151855, 9.439798355102539, 10.111915588378906, 10.78403377532959, 11.456151962280273, 12.12826919555664, 12.800387382507324, 13.472504615783691, 14.144622802734375, 14.816740036010742, 15.488858222961426, 16.16097640991211, 16.833093643188477, 17.505210876464844, 18.17732810974121, 18.84944725036621, 19.521564483642578, 20.193681716918945, 20.865798950195312, 21.537918090820312, 22.21003532409668, 22.88215446472168]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 16.0, 19.0, 30.0, 36.0, 65.0, 89.0, 141.0, 211.0, 366.0, 576.0, 967.0, 1595.0, 2719.0, 4678.0, 8094.0, 14379.0, 24947.0, 44576.0, 79729.0, 143520.0, 229249.0, 209950.0, 123994.0, 68771.0, 38246.0, 21841.0, 12457.0, 7042.0, 4159.0, 2425.0, 1409.0, 834.0, 530.0, 330.0, 184.0, 125.0, 76.0, 52.0, 32.0, 31.0, 26.0, 10.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.615570068359375, -2.51824951171875, -2.420928955078125, -2.3236083984375, -2.226287841796875, -2.12896728515625, -2.031646728515625, -1.934326171875, -1.837005615234375, -1.73968505859375, -1.642364501953125, -1.5450439453125, -1.447723388671875, -1.35040283203125, -1.253082275390625, -1.15576171875, -1.058441162109375, -0.96112060546875, -0.863800048828125, -0.7664794921875, -0.669158935546875, -0.57183837890625, -0.474517822265625, -0.377197265625, -0.279876708984375, -0.18255615234375, -0.085235595703125, 0.0120849609375, 0.109405517578125, 0.20672607421875, 0.304046630859375, 0.4013671875, 0.498687744140625, 0.59600830078125, 0.693328857421875, 0.7906494140625, 0.887969970703125, 0.98529052734375, 1.082611083984375, 1.179931640625, 1.277252197265625, 1.37457275390625, 1.471893310546875, 1.5692138671875, 1.666534423828125, 1.76385498046875, 1.861175537109375, 1.95849609375, 2.055816650390625, 2.15313720703125, 2.250457763671875, 2.3477783203125, 2.445098876953125, 2.54241943359375, 2.639739990234375, 2.737060546875, 2.834381103515625, 2.93170166015625, 3.029022216796875, 3.1263427734375, 3.223663330078125, 3.32098388671875, 3.418304443359375, 3.515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 4.0, 9.0, 8.0, 15.0, 15.0, 17.0, 23.0, 25.0, 24.0, 28.0, 44.0, 47.0, 34.0, 41.0, 38.0, 33.0, 45.0, 42.0, 50.0, 50.0, 47.0, 41.0, 34.0, 32.0, 36.0, 31.0, 24.0, 34.0, 28.0, 20.0, 19.0, 11.0, 11.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.1044921875, -20.365234375, -19.6259765625, -18.88671875, -18.1474609375, -17.408203125, -16.6689453125, -15.9296875, -15.1904296875, -14.451171875, -13.7119140625, -12.97265625, -12.2333984375, -11.494140625, -10.7548828125, -10.015625, -9.2763671875, -8.537109375, -7.7978515625, -7.05859375, -6.3193359375, -5.580078125, -4.8408203125, -4.1015625, -3.3623046875, -2.623046875, -1.8837890625, -1.14453125, -0.4052734375, 0.333984375, 1.0732421875, 1.8125, 2.5517578125, 3.291015625, 4.0302734375, 4.76953125, 5.5087890625, 6.248046875, 6.9873046875, 7.7265625, 8.4658203125, 9.205078125, 9.9443359375, 10.68359375, 11.4228515625, 12.162109375, 12.9013671875, 13.640625, 14.3798828125, 15.119140625, 15.8583984375, 16.59765625, 17.3369140625, 18.076171875, 18.8154296875, 19.5546875, 20.2939453125, 21.033203125, 21.7724609375, 22.51171875, 23.2509765625, 23.990234375, 24.7294921875, 25.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 13.0, 18.0, 17.0, 48.0, 37.0, 75.0, 118.0, 120.0, 191.0, 245.0, 388.0, 499.0, 753.0, 1143.0, 1648.0, 2448.0, 3641.0, 5381.0, 8062.0, 12696.0, 19959.0, 31642.0, 50034.0, 80258.0, 124326.0, 179364.0, 179013.0, 125348.0, 80830.0, 50552.0, 31732.0, 19977.0, 12697.0, 8439.0, 5599.0, 3400.0, 2467.0, 1637.0, 1073.0, 763.0, 572.0, 413.0, 254.0, 203.0, 141.0, 101.0, 71.0, 51.0, 25.0, 25.0, 21.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0], "bins": [-2.462890625, -2.388275146484375, -2.31365966796875, -2.239044189453125, -2.1644287109375, -2.089813232421875, -2.01519775390625, -1.940582275390625, -1.865966796875, -1.791351318359375, -1.71673583984375, -1.642120361328125, -1.5675048828125, -1.492889404296875, -1.41827392578125, -1.343658447265625, -1.26904296875, -1.194427490234375, -1.11981201171875, -1.045196533203125, -0.9705810546875, -0.895965576171875, -0.82135009765625, -0.746734619140625, -0.672119140625, -0.597503662109375, -0.52288818359375, -0.448272705078125, -0.3736572265625, -0.299041748046875, -0.22442626953125, -0.149810791015625, -0.0751953125, -0.000579833984375, 0.07403564453125, 0.148651123046875, 0.2232666015625, 0.297882080078125, 0.37249755859375, 0.447113037109375, 0.521728515625, 0.596343994140625, 0.67095947265625, 0.745574951171875, 0.8201904296875, 0.894805908203125, 0.96942138671875, 1.044036865234375, 1.11865234375, 1.193267822265625, 1.26788330078125, 1.342498779296875, 1.4171142578125, 1.491729736328125, 1.56634521484375, 1.640960693359375, 1.715576171875, 1.790191650390625, 1.86480712890625, 1.939422607421875, 2.0140380859375, 2.088653564453125, 2.16326904296875, 2.237884521484375, 2.3125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 14.0, 5.0, 8.0, 10.0, 3.0, 13.0, 16.0, 17.0, 14.0, 14.0, 29.0, 27.0, 22.0, 28.0, 31.0, 38.0, 34.0, 35.0, 41.0, 37.0, 43.0, 40.0, 36.0, 39.0, 34.0, 28.0, 40.0, 33.0, 20.0, 25.0, 25.0, 18.0, 29.0, 27.0, 26.0, 18.0, 12.0, 6.0, 13.0, 15.0, 9.0, 6.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8046875, -12.399169921875, -11.99365234375, -11.588134765625, -11.1826171875, -10.777099609375, -10.37158203125, -9.966064453125, -9.560546875, -9.155029296875, -8.74951171875, -8.343994140625, -7.9384765625, -7.532958984375, -7.12744140625, -6.721923828125, -6.31640625, -5.910888671875, -5.50537109375, -5.099853515625, -4.6943359375, -4.288818359375, -3.88330078125, -3.477783203125, -3.072265625, -2.666748046875, -2.26123046875, -1.855712890625, -1.4501953125, -1.044677734375, -0.63916015625, -0.233642578125, 0.171875, 0.577392578125, 0.98291015625, 1.388427734375, 1.7939453125, 2.199462890625, 2.60498046875, 3.010498046875, 3.416015625, 3.821533203125, 4.22705078125, 4.632568359375, 5.0380859375, 5.443603515625, 5.84912109375, 6.254638671875, 6.66015625, 7.065673828125, 7.47119140625, 7.876708984375, 8.2822265625, 8.687744140625, 9.09326171875, 9.498779296875, 9.904296875, 10.309814453125, 10.71533203125, 11.120849609375, 11.5263671875, 11.931884765625, 12.33740234375, 12.742919921875, 13.1484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 10.0, 16.0, 26.0, 44.0, 41.0, 68.0, 108.0, 154.0, 194.0, 353.0, 525.0, 832.0, 1281.0, 1918.0, 3005.0, 4495.0, 7311.0, 11884.0, 19460.0, 32622.0, 57662.0, 107758.0, 205654.0, 259210.0, 147442.0, 77649.0, 42955.0, 25075.0, 15132.0, 9218.0, 5860.0, 3661.0, 2409.0, 1537.0, 1009.0, 665.0, 420.0, 300.0, 199.0, 128.0, 75.0, 69.0, 35.0, 29.0, 12.0, 13.0, 9.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.1026611328125, -0.09957313537597656, -0.09648513793945312, -0.09339714050292969, -0.09030914306640625, -0.08722114562988281, -0.08413314819335938, -0.08104515075683594, -0.0779571533203125, -0.07486915588378906, -0.07178115844726562, -0.06869316101074219, -0.06560516357421875, -0.06251716613769531, -0.059429168701171875, -0.05634117126464844, -0.053253173828125, -0.05016517639160156, -0.047077178955078125, -0.04398918151855469, -0.04090118408203125, -0.03781318664550781, -0.034725189208984375, -0.03163719177246094, -0.0285491943359375, -0.025461196899414062, -0.022373199462890625, -0.019285202026367188, -0.01619720458984375, -0.013109207153320312, -0.010021209716796875, -0.0069332122802734375, -0.00384521484375, -0.0007572174072265625, 0.002330780029296875, 0.0054187774658203125, 0.00850677490234375, 0.011594772338867188, 0.014682769775390625, 0.017770767211914062, 0.0208587646484375, 0.023946762084960938, 0.027034759521484375, 0.030122756958007812, 0.03321075439453125, 0.03629875183105469, 0.039386749267578125, 0.04247474670410156, 0.045562744140625, 0.04865074157714844, 0.051738739013671875, 0.05482673645019531, 0.05791473388671875, 0.06100273132324219, 0.06409072875976562, 0.06717872619628906, 0.0702667236328125, 0.07335472106933594, 0.07644271850585938, 0.07953071594238281, 0.08261871337890625, 0.08570671081542969, 0.08879470825195312, 0.09188270568847656, 0.094970703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 5.0, 6.0, 2.0, 3.0, 7.0, 9.0, 12.0, 14.0, 10.0, 16.0, 14.0, 22.0, 41.0, 26.0, 28.0, 27.0, 39.0, 45.0, 51.0, 27.0, 54.0, 30.0, 44.0, 57.0, 42.0, 41.0, 41.0, 36.0, 42.0, 41.0, 21.0, 22.0, 27.0, 15.0, 18.0, 11.0, 12.0, 11.0, 8.0, 11.0, 7.0, 4.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6868114471435547e-05, -1.6322359442710876e-05, -1.5776604413986206e-05, -1.5230849385261536e-05, -1.4685094356536865e-05, -1.4139339327812195e-05, -1.3593584299087524e-05, -1.3047829270362854e-05, -1.2502074241638184e-05, -1.1956319212913513e-05, -1.1410564184188843e-05, -1.0864809155464172e-05, -1.0319054126739502e-05, -9.773299098014832e-06, -9.227544069290161e-06, -8.68178904056549e-06, -8.13603401184082e-06, -7.59027898311615e-06, -7.0445239543914795e-06, -6.498768925666809e-06, -5.953013896942139e-06, -5.407258868217468e-06, -4.861503839492798e-06, -4.3157488107681274e-06, -3.769993782043457e-06, -3.2242387533187866e-06, -2.678483724594116e-06, -2.132728695869446e-06, -1.5869736671447754e-06, -1.041218638420105e-06, -4.954636096954346e-07, 5.029141902923584e-08, 5.960464477539062e-07, 1.1418014764785767e-06, 1.687556505203247e-06, 2.2333115339279175e-06, 2.779066562652588e-06, 3.3248215913772583e-06, 3.870576620101929e-06, 4.416331648826599e-06, 4.9620866775512695e-06, 5.50784170627594e-06, 6.05359673500061e-06, 6.599351763725281e-06, 7.145106792449951e-06, 7.690861821174622e-06, 8.236616849899292e-06, 8.782371878623962e-06, 9.328126907348633e-06, 9.873881936073303e-06, 1.0419636964797974e-05, 1.0965391993522644e-05, 1.1511147022247314e-05, 1.2056902050971985e-05, 1.2602657079696655e-05, 1.3148412108421326e-05, 1.3694167137145996e-05, 1.4239922165870667e-05, 1.4785677194595337e-05, 1.5331432223320007e-05, 1.5877187252044678e-05, 1.6422942280769348e-05, 1.696869730949402e-05, 1.751445233821869e-05, 1.806020736694336e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 4.0, 12.0, 18.0, 30.0, 44.0, 55.0, 100.0, 169.0, 204.0, 343.0, 576.0, 905.0, 1396.0, 2199.0, 3355.0, 5346.0, 8636.0, 14107.0, 22719.0, 38066.0, 65611.0, 123191.0, 254673.0, 237787.0, 114118.0, 61825.0, 35854.0, 21498.0, 13333.0, 8244.0, 5190.0, 3314.0, 2078.0, 1298.0, 789.0, 536.0, 341.0, 186.0, 142.0, 97.0, 52.0, 27.0, 27.0, 17.0, 16.0, 12.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2152099609375, -0.20847320556640625, -0.2017364501953125, -0.19499969482421875, -0.188262939453125, -0.18152618408203125, -0.1747894287109375, -0.16805267333984375, -0.16131591796875, -0.15457916259765625, -0.1478424072265625, -0.14110565185546875, -0.134368896484375, -0.12763214111328125, -0.1208953857421875, -0.11415863037109375, -0.107421875, -0.10068511962890625, -0.0939483642578125, -0.08721160888671875, -0.080474853515625, -0.07373809814453125, -0.0670013427734375, -0.06026458740234375, -0.05352783203125, -0.04679107666015625, -0.0400543212890625, -0.03331756591796875, -0.026580810546875, -0.01984405517578125, -0.0131072998046875, -0.00637054443359375, 0.0003662109375, 0.00710296630859375, 0.0138397216796875, 0.02057647705078125, 0.027313232421875, 0.03404998779296875, 0.0407867431640625, 0.04752349853515625, 0.05426025390625, 0.06099700927734375, 0.0677337646484375, 0.07447052001953125, 0.081207275390625, 0.08794403076171875, 0.0946807861328125, 0.10141754150390625, 0.108154296875, 0.11489105224609375, 0.1216278076171875, 0.12836456298828125, 0.135101318359375, 0.14183807373046875, 0.1485748291015625, 0.15531158447265625, 0.16204833984375, 0.16878509521484375, 0.1755218505859375, 0.18225860595703125, 0.188995361328125, 0.19573211669921875, 0.2024688720703125, 0.20920562744140625, 0.2159423828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 10.0, 9.0, 8.0, 9.0, 16.0, 11.0, 13.0, 16.0, 27.0, 32.0, 36.0, 47.0, 41.0, 51.0, 60.0, 64.0, 81.0, 83.0, 58.0, 46.0, 43.0, 31.0, 30.0, 32.0, 20.0, 15.0, 13.0, 12.0, 14.0, 13.0, 6.0, 9.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.09429931640625, -0.09148025512695312, -0.08866119384765625, -0.08584213256835938, -0.0830230712890625, -0.08020401000976562, -0.07738494873046875, -0.07456588745117188, -0.071746826171875, -0.06892776489257812, -0.06610870361328125, -0.06328964233398438, -0.0604705810546875, -0.057651519775390625, -0.05483245849609375, -0.052013397216796875, -0.0491943359375, -0.046375274658203125, -0.04355621337890625, -0.040737152099609375, -0.0379180908203125, -0.035099029541015625, -0.03227996826171875, -0.029460906982421875, -0.026641845703125, -0.023822784423828125, -0.02100372314453125, -0.018184661865234375, -0.0153656005859375, -0.012546539306640625, -0.00972747802734375, -0.006908416748046875, -0.00408935546875, -0.001270294189453125, 0.00154876708984375, 0.004367828369140625, 0.0071868896484375, 0.010005950927734375, 0.01282501220703125, 0.015644073486328125, 0.018463134765625, 0.021282196044921875, 0.02410125732421875, 0.026920318603515625, 0.0297393798828125, 0.032558441162109375, 0.03537750244140625, 0.038196563720703125, 0.041015625, 0.043834686279296875, 0.04665374755859375, 0.049472808837890625, 0.0522918701171875, 0.055110931396484375, 0.05792999267578125, 0.060749053955078125, 0.063568115234375, 0.06638717651367188, 0.06920623779296875, 0.07202529907226562, 0.0748443603515625, 0.07766342163085938, 0.08048248291015625, 0.08330154418945312, 0.08612060546875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 14.0, 11.0, 18.0, 23.0, 29.0, 29.0, 40.0, 34.0, 43.0, 54.0, 47.0, 68.0, 76.0, 72.0, 62.0, 62.0, 60.0, 46.0, 35.0, 30.0, 43.0, 19.0, 19.0, 22.0, 9.0, 13.0, 4.0, 1.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.65962791442871, -18.907756805419922, -18.155885696411133, -17.404014587402344, -16.652141571044922, -15.900270462036133, -15.148399353027344, -14.396528244018555, -13.644657135009766, -12.892786026000977, -12.140913963317871, -11.389042854309082, -10.637171745300293, -9.885299682617188, -9.133428573608398, -8.38155746459961, -7.629685401916504, -6.877813816070557, -6.125942707061768, -5.37407112121582, -4.622200012207031, -3.870328426361084, -3.1184568405151367, -2.3665857315063477, -1.6147141456604004, -0.8628427386283875, -0.11097133159637451, 0.6409001350402832, 1.3927714824676514, 2.1446428298950195, 2.896514415740967, 3.648385524749756, 4.400257110595703, 5.15212869644165, 5.9039998054504395, 6.655871391296387, 7.407742500305176, 8.159614562988281, 8.91148567199707, 9.66335678100586, 10.415227890014648, 11.167098999023438, 11.918971061706543, 12.670842170715332, 13.422713279724121, 14.174585342407227, 14.926456451416016, 15.678327560424805, 16.430198669433594, 17.182069778442383, 17.933940887451172, 18.685813903808594, 19.437685012817383, 20.189556121826172, 20.94142723083496, 21.69329833984375, 22.445171356201172, 23.19704246520996, 23.94891357421875, 24.700786590576172, 25.45265769958496, 26.20452880859375, 26.95639991760254, 27.708271026611328, 28.460142135620117]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 5.0, 7.0, 6.0, 8.0, 17.0, 16.0, 10.0, 15.0, 15.0, 31.0, 33.0, 28.0, 28.0, 39.0, 29.0, 46.0, 34.0, 34.0, 21.0, 46.0, 42.0, 43.0, 49.0, 44.0, 38.0, 42.0, 36.0, 27.0, 30.0, 29.0, 25.0, 22.0, 21.0, 20.0, 8.0, 9.0, 12.0, 10.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.081941604614258, -19.4132022857666, -18.744461059570312, -18.075721740722656, -17.406982421875, -16.73824119567871, -16.069501876831055, -15.400761604309082, -14.73202133178711, -14.063281059265137, -13.394540786743164, -12.725801467895508, -12.057061195373535, -11.388320922851562, -10.719581604003906, -10.050841331481934, -9.382101058959961, -8.713360786437988, -8.044620513916016, -7.375881195068359, -6.707140922546387, -6.038400650024414, -5.3696608543396, -4.700921058654785, -4.0321807861328125, -3.363440752029419, -2.6947007179260254, -2.025960683822632, -1.3572206497192383, -0.6884806156158447, -0.019740581512451172, 0.6489992141723633, 1.317739486694336, 1.9864795207977295, 2.655219554901123, 3.3239595890045166, 3.99269962310791, 4.661439895629883, 5.330179691314697, 5.998919486999512, 6.667659759521484, 7.336400032043457, 8.00514030456543, 8.673879623413086, 9.342619895935059, 10.011360168457031, 10.680099487304688, 11.34883975982666, 12.017580032348633, 12.686320304870605, 13.355060577392578, 14.023799896240234, 14.692540168762207, 15.36128044128418, 16.030019760131836, 16.698760986328125, 17.36750030517578, 18.036239624023438, 18.704980850219727, 19.373720169067383, 20.042461395263672, 20.711200714111328, 21.379940032958984, 22.04867935180664, 22.71742057800293]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 10.0, 5.0, 14.0, 26.0, 52.0, 72.0, 112.0, 164.0, 239.0, 385.0, 624.0, 1042.0, 1634.0, 2551.0, 4125.0, 6326.0, 9856.0, 15161.0, 22358.0, 32411.0, 45711.0, 61284.0, 77021.0, 92013.0, 102647.0, 105962.0, 101564.0, 91158.0, 76440.0, 59062.0, 44128.0, 31854.0, 21817.0, 14377.0, 9353.0, 6263.0, 3883.0, 2583.0, 1581.0, 1015.0, 621.0, 384.0, 246.0, 154.0, 96.0, 70.0, 35.0, 33.0, 10.0, 11.0, 10.0, 5.0, 4.0, 2.0, 2.0], "bins": [-12.2109375, -11.8565673828125, -11.502197265625, -11.1478271484375, -10.79345703125, -10.4390869140625, -10.084716796875, -9.7303466796875, -9.3759765625, -9.0216064453125, -8.667236328125, -8.3128662109375, -7.95849609375, -7.6041259765625, -7.249755859375, -6.8953857421875, -6.541015625, -6.1866455078125, -5.832275390625, -5.4779052734375, -5.12353515625, -4.7691650390625, -4.414794921875, -4.0604248046875, -3.7060546875, -3.3516845703125, -2.997314453125, -2.6429443359375, -2.28857421875, -1.9342041015625, -1.579833984375, -1.2254638671875, -0.87109375, -0.5167236328125, -0.162353515625, 0.1920166015625, 0.54638671875, 0.9007568359375, 1.255126953125, 1.6094970703125, 1.9638671875, 2.3182373046875, 2.672607421875, 3.0269775390625, 3.38134765625, 3.7357177734375, 4.090087890625, 4.4444580078125, 4.798828125, 5.1531982421875, 5.507568359375, 5.8619384765625, 6.21630859375, 6.5706787109375, 6.925048828125, 7.2794189453125, 7.6337890625, 7.9881591796875, 8.342529296875, 8.6968994140625, 9.05126953125, 9.4056396484375, 9.760009765625, 10.1143798828125, 10.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 7.0, 10.0, 9.0, 16.0, 12.0, 21.0, 17.0, 23.0, 30.0, 28.0, 30.0, 24.0, 34.0, 31.0, 34.0, 34.0, 22.0, 33.0, 37.0, 42.0, 37.0, 34.0, 47.0, 33.0, 35.0, 35.0, 29.0, 32.0, 29.0, 26.0, 27.0, 25.0, 18.0, 13.0, 12.0, 10.0, 7.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.921875, -18.31201171875, -17.7021484375, -17.09228515625, -16.482421875, -15.87255859375, -15.2626953125, -14.65283203125, -14.04296875, -13.43310546875, -12.8232421875, -12.21337890625, -11.603515625, -10.99365234375, -10.3837890625, -9.77392578125, -9.1640625, -8.55419921875, -7.9443359375, -7.33447265625, -6.724609375, -6.11474609375, -5.5048828125, -4.89501953125, -4.28515625, -3.67529296875, -3.0654296875, -2.45556640625, -1.845703125, -1.23583984375, -0.6259765625, -0.01611328125, 0.59375, 1.20361328125, 1.8134765625, 2.42333984375, 3.033203125, 3.64306640625, 4.2529296875, 4.86279296875, 5.47265625, 6.08251953125, 6.6923828125, 7.30224609375, 7.912109375, 8.52197265625, 9.1318359375, 9.74169921875, 10.3515625, 10.96142578125, 11.5712890625, 12.18115234375, 12.791015625, 13.40087890625, 14.0107421875, 14.62060546875, 15.23046875, 15.84033203125, 16.4501953125, 17.06005859375, 17.669921875, 18.27978515625, 18.8896484375, 19.49951171875, 20.109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 13.0, 15.0, 13.0, 30.0, 55.0, 84.0, 152.0, 221.0, 345.0, 576.0, 852.0, 1399.0, 1998.0, 2976.0, 4357.0, 6392.0, 9311.0, 13384.0, 19010.0, 26119.0, 34928.0, 45251.0, 57660.0, 68988.0, 80086.0, 87806.0, 91247.0, 88958.0, 82907.0, 73889.0, 61708.0, 49909.0, 38856.0, 29007.0, 21341.0, 15239.0, 10877.0, 7434.0, 5071.0, 3472.0, 2231.0, 1586.0, 984.0, 646.0, 432.0, 275.0, 160.0, 131.0, 70.0, 48.0, 23.0, 21.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.40625, -9.0997314453125, -8.793212890625, -8.4866943359375, -8.18017578125, -7.8736572265625, -7.567138671875, -7.2606201171875, -6.9541015625, -6.6475830078125, -6.341064453125, -6.0345458984375, -5.72802734375, -5.4215087890625, -5.114990234375, -4.8084716796875, -4.501953125, -4.1954345703125, -3.888916015625, -3.5823974609375, -3.27587890625, -2.9693603515625, -2.662841796875, -2.3563232421875, -2.0498046875, -1.7432861328125, -1.436767578125, -1.1302490234375, -0.82373046875, -0.5172119140625, -0.210693359375, 0.0958251953125, 0.40234375, 0.7088623046875, 1.015380859375, 1.3218994140625, 1.62841796875, 1.9349365234375, 2.241455078125, 2.5479736328125, 2.8544921875, 3.1610107421875, 3.467529296875, 3.7740478515625, 4.08056640625, 4.3870849609375, 4.693603515625, 5.0001220703125, 5.306640625, 5.6131591796875, 5.919677734375, 6.2261962890625, 6.53271484375, 6.8392333984375, 7.145751953125, 7.4522705078125, 7.7587890625, 8.0653076171875, 8.371826171875, 8.6783447265625, 8.98486328125, 9.2913818359375, 9.597900390625, 9.9044189453125, 10.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 1.0, 6.0, 3.0, 3.0, 8.0, 7.0, 7.0, 11.0, 9.0, 17.0, 15.0, 16.0, 17.0, 17.0, 28.0, 23.0, 25.0, 31.0, 39.0, 45.0, 25.0, 32.0, 31.0, 47.0, 32.0, 30.0, 40.0, 30.0, 26.0, 26.0, 31.0, 37.0, 37.0, 42.0, 28.0, 26.0, 24.0, 15.0, 14.0, 11.0, 12.0, 12.0, 9.0, 9.0, 8.0, 11.0, 6.0, 11.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.7109375, -11.3514404296875, -10.991943359375, -10.6324462890625, -10.27294921875, -9.9134521484375, -9.553955078125, -9.1944580078125, -8.8349609375, -8.4754638671875, -8.115966796875, -7.7564697265625, -7.39697265625, -7.0374755859375, -6.677978515625, -6.3184814453125, -5.958984375, -5.5994873046875, -5.239990234375, -4.8804931640625, -4.52099609375, -4.1614990234375, -3.802001953125, -3.4425048828125, -3.0830078125, -2.7235107421875, -2.364013671875, -2.0045166015625, -1.64501953125, -1.2855224609375, -0.926025390625, -0.5665283203125, -0.20703125, 0.1524658203125, 0.511962890625, 0.8714599609375, 1.23095703125, 1.5904541015625, 1.949951171875, 2.3094482421875, 2.6689453125, 3.0284423828125, 3.387939453125, 3.7474365234375, 4.10693359375, 4.4664306640625, 4.825927734375, 5.1854248046875, 5.544921875, 5.9044189453125, 6.263916015625, 6.6234130859375, 6.98291015625, 7.3424072265625, 7.701904296875, 8.0614013671875, 8.4208984375, 8.7803955078125, 9.139892578125, 9.4993896484375, 9.85888671875, 10.2183837890625, 10.577880859375, 10.9373779296875, 11.296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 12.0, 14.0, 26.0, 56.0, 83.0, 123.0, 170.0, 272.0, 450.0, 647.0, 1101.0, 1706.0, 2828.0, 4483.0, 7127.0, 11416.0, 17764.0, 27445.0, 40505.0, 57826.0, 77526.0, 98103.0, 113190.0, 118899.0, 113526.0, 98617.0, 79066.0, 58638.0, 40964.0, 27557.0, 17751.0, 11372.0, 7265.0, 4502.0, 2834.0, 1666.0, 1115.0, 686.0, 426.0, 291.0, 189.0, 105.0, 73.0, 57.0, 36.0, 17.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.71875, -3.6043701171875, -3.489990234375, -3.3756103515625, -3.26123046875, -3.1468505859375, -3.032470703125, -2.9180908203125, -2.8037109375, -2.6893310546875, -2.574951171875, -2.4605712890625, -2.34619140625, -2.2318115234375, -2.117431640625, -2.0030517578125, -1.888671875, -1.7742919921875, -1.659912109375, -1.5455322265625, -1.43115234375, -1.3167724609375, -1.202392578125, -1.0880126953125, -0.9736328125, -0.8592529296875, -0.744873046875, -0.6304931640625, -0.51611328125, -0.4017333984375, -0.287353515625, -0.1729736328125, -0.05859375, 0.0557861328125, 0.170166015625, 0.2845458984375, 0.39892578125, 0.5133056640625, 0.627685546875, 0.7420654296875, 0.8564453125, 0.9708251953125, 1.085205078125, 1.1995849609375, 1.31396484375, 1.4283447265625, 1.542724609375, 1.6571044921875, 1.771484375, 1.8858642578125, 2.000244140625, 2.1146240234375, 2.22900390625, 2.3433837890625, 2.457763671875, 2.5721435546875, 2.6865234375, 2.8009033203125, 2.915283203125, 3.0296630859375, 3.14404296875, 3.2584228515625, 3.372802734375, 3.4871826171875, 3.6015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 8.0, 9.0, 12.0, 18.0, 16.0, 25.0, 26.0, 30.0, 27.0, 34.0, 36.0, 37.0, 53.0, 49.0, 39.0, 47.0, 50.0, 53.0, 53.0, 50.0, 47.0, 39.0, 34.0, 33.0, 20.0, 20.0, 19.0, 18.0, 13.0, 17.0, 14.0, 10.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039577484130859375, -0.00038237497210502625, -0.00036897510290145874, -0.00035557523369789124, -0.00034217536449432373, -0.0003287754952907562, -0.0003153756260871887, -0.0003019757568836212, -0.0002885758876800537, -0.0002751760184764862, -0.0002617761492729187, -0.0002483762800693512, -0.0002349764108657837, -0.0002215765416622162, -0.00020817667245864868, -0.00019477680325508118, -0.00018137693405151367, -0.00016797706484794617, -0.00015457719564437866, -0.00014117732644081116, -0.00012777745723724365, -0.00011437758803367615, -0.00010097771883010864, -8.757784962654114e-05, -7.417798042297363e-05, -6.077811121940613e-05, -4.737824201583862e-05, -3.397837281227112e-05, -2.0578503608703613e-05, -7.178634405136108e-06, 6.2212347984313965e-06, 1.96211040019989e-05, 3.3020973205566406e-05, 4.642084240913391e-05, 5.9820711612701416e-05, 7.322058081626892e-05, 8.662045001983643e-05, 0.00010002031922340393, 0.00011342018842697144, 0.00012682005763053894, 0.00014021992683410645, 0.00015361979603767395, 0.00016701966524124146, 0.00018041953444480896, 0.00019381940364837646, 0.00020721927285194397, 0.00022061914205551147, 0.00023401901125907898, 0.0002474188804626465, 0.000260818749666214, 0.0002742186188697815, 0.000287618488073349, 0.0003010183572769165, 0.000314418226480484, 0.0003278180956840515, 0.000341217964887619, 0.0003546178340911865, 0.00036801770329475403, 0.00038141757249832153, 0.00039481744170188904, 0.00040821731090545654, 0.00042161718010902405, 0.00043501704931259155, 0.00044841691851615906, 0.00046181678771972656]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 13.0, 16.0, 14.0, 23.0, 31.0, 59.0, 74.0, 115.0, 202.0, 329.0, 588.0, 949.0, 1695.0, 3065.0, 5647.0, 10759.0, 20018.0, 35850.0, 62986.0, 100219.0, 140109.0, 165250.0, 160370.0, 129607.0, 88769.0, 54080.0, 31034.0, 16730.0, 9039.0, 4789.0, 2613.0, 1426.0, 739.0, 487.0, 299.0, 185.0, 115.0, 75.0, 58.0, 31.0, 26.0, 22.0, 21.0, 7.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.15234375, -4.97979736328125, -4.8072509765625, -4.63470458984375, -4.462158203125, -4.28961181640625, -4.1170654296875, -3.94451904296875, -3.77197265625, -3.59942626953125, -3.4268798828125, -3.25433349609375, -3.081787109375, -2.90924072265625, -2.7366943359375, -2.56414794921875, -2.3916015625, -2.21905517578125, -2.0465087890625, -1.87396240234375, -1.701416015625, -1.52886962890625, -1.3563232421875, -1.18377685546875, -1.01123046875, -0.83868408203125, -0.6661376953125, -0.49359130859375, -0.321044921875, -0.14849853515625, 0.0240478515625, 0.19659423828125, 0.369140625, 0.54168701171875, 0.7142333984375, 0.88677978515625, 1.059326171875, 1.23187255859375, 1.4044189453125, 1.57696533203125, 1.74951171875, 1.92205810546875, 2.0946044921875, 2.26715087890625, 2.439697265625, 2.61224365234375, 2.7847900390625, 2.95733642578125, 3.1298828125, 3.30242919921875, 3.4749755859375, 3.64752197265625, 3.820068359375, 3.99261474609375, 4.1651611328125, 4.33770751953125, 4.51025390625, 4.68280029296875, 4.8553466796875, 5.02789306640625, 5.200439453125, 5.37298583984375, 5.5455322265625, 5.71807861328125, 5.890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 11.0, 16.0, 11.0, 10.0, 16.0, 24.0, 23.0, 34.0, 42.0, 47.0, 56.0, 70.0, 53.0, 44.0, 53.0, 42.0, 64.0, 51.0, 49.0, 28.0, 36.0, 36.0, 27.0, 27.0, 22.0, 19.0, 18.0, 10.0, 9.0, 11.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0703125, -2.007537841796875, -1.94476318359375, -1.881988525390625, -1.8192138671875, -1.756439208984375, -1.69366455078125, -1.630889892578125, -1.568115234375, -1.505340576171875, -1.44256591796875, -1.379791259765625, -1.3170166015625, -1.254241943359375, -1.19146728515625, -1.128692626953125, -1.06591796875, -1.003143310546875, -0.94036865234375, -0.877593994140625, -0.8148193359375, -0.752044677734375, -0.68927001953125, -0.626495361328125, -0.563720703125, -0.500946044921875, -0.43817138671875, -0.375396728515625, -0.3126220703125, -0.249847412109375, -0.18707275390625, -0.124298095703125, -0.0615234375, 0.001251220703125, 0.06402587890625, 0.126800537109375, 0.1895751953125, 0.252349853515625, 0.31512451171875, 0.377899169921875, 0.440673828125, 0.503448486328125, 0.56622314453125, 0.628997802734375, 0.6917724609375, 0.754547119140625, 0.81732177734375, 0.880096435546875, 0.94287109375, 1.005645751953125, 1.06842041015625, 1.131195068359375, 1.1939697265625, 1.256744384765625, 1.31951904296875, 1.382293701171875, 1.445068359375, 1.507843017578125, 1.57061767578125, 1.633392333984375, 1.6961669921875, 1.758941650390625, 1.82171630859375, 1.884490966796875, 1.947265625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 15.0, 17.0, 22.0, 17.0, 22.0, 28.0, 29.0, 37.0, 43.0, 42.0, 60.0, 74.0, 57.0, 51.0, 68.0, 56.0, 62.0, 58.0, 42.0, 40.0, 27.0, 32.0, 30.0, 12.0, 12.0, 9.0, 10.0, 5.0, 9.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96094512939453, -18.245296478271484, -17.529647827148438, -16.81399917602539, -16.098350524902344, -15.382701873779297, -14.667054176330566, -13.95140552520752, -13.235756874084473, -12.520108222961426, -11.804459571838379, -11.088811874389648, -10.373163223266602, -9.657514572143555, -8.941865921020508, -8.226217269897461, -7.510568618774414, -6.794919967651367, -6.07927131652832, -5.363623142242432, -4.647974491119385, -3.932325839996338, -3.216677665710449, -2.5010290145874023, -1.7853803634643555, -1.0697318315505981, -0.3540832996368408, 0.36156511306762695, 1.0772137641906738, 1.7928624153137207, 2.5085105895996094, 3.2241592407226562, 3.939809799194336, 4.655458450317383, 5.37110710144043, 6.086755275726318, 6.802403926849365, 7.518052577972412, 8.2337007522583, 8.949349403381348, 9.664998054504395, 10.380646705627441, 11.096295356750488, 11.811943054199219, 12.527591705322266, 13.243240356445312, 13.95888900756836, 14.674537658691406, 15.390186309814453, 16.1058349609375, 16.821483612060547, 17.537132263183594, 18.25278091430664, 18.968429565429688, 19.684078216552734, 20.39972686767578, 21.115375518798828, 21.831024169921875, 22.546672821044922, 23.26232147216797, 23.977970123291016, 24.693618774414062, 25.40926742553711, 26.124916076660156, 26.84056282043457]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 7.0, 5.0, 12.0, 8.0, 17.0, 16.0, 19.0, 12.0, 26.0, 22.0, 31.0, 20.0, 30.0, 33.0, 43.0, 36.0, 36.0, 54.0, 35.0, 47.0, 29.0, 40.0, 47.0, 34.0, 29.0, 47.0, 30.0, 26.0, 33.0, 30.0, 26.0, 12.0, 20.0, 12.0, 17.0, 11.0, 9.0, 12.0, 4.0, 8.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.36363983154297, -20.685218811035156, -20.006799697875977, -19.328378677368164, -18.649959564208984, -17.971538543701172, -17.29311752319336, -16.614696502685547, -15.936277389526367, -15.257857322692871, -14.579437255859375, -13.901016235351562, -13.222596168518066, -12.54417610168457, -11.865755081176758, -11.187335014343262, -10.508914947509766, -9.83049488067627, -9.152074813842773, -8.473653793334961, -7.795233726501465, -7.116813659667969, -6.4383931159973145, -5.75997257232666, -5.081552505493164, -4.403132438659668, -3.7247118949890137, -3.0462915897369385, -2.3678712844848633, -1.689450979232788, -1.011030673980713, -0.3326101303100586, 0.3458099365234375, 1.0242302417755127, 1.702650547027588, 2.381070852279663, 3.0594911575317383, 3.7379114627838135, 4.416331768035889, 5.094752311706543, 5.773172378540039, 6.451592445373535, 7.1300129890441895, 7.808433532714844, 8.48685359954834, 9.165273666381836, 9.843694686889648, 10.522114753723145, 11.20053482055664, 11.878954887390137, 12.557374954223633, 13.235795974731445, 13.914216041564941, 14.592636108398438, 15.27105712890625, 15.949477195739746, 16.627897262573242, 17.306318283081055, 17.984737396240234, 18.663158416748047, 19.34157943725586, 20.01999855041504, 20.69841957092285, 21.37683868408203, 22.055259704589844]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 15.0, 26.0, 52.0, 108.0, 154.0, 278.0, 425.0, 716.0, 1188.0, 2023.0, 3394.0, 5699.0, 9504.0, 15510.0, 25224.0, 40346.0, 63198.0, 97695.0, 144028.0, 207125.0, 278330.0, 354533.0, 419767.0, 456007.0, 452318.0, 411035.0, 346091.0, 268225.0, 197709.0, 137510.0, 93532.0, 60711.0, 38450.0, 24403.0, 15015.0, 9279.0, 5757.0, 3538.0, 2158.0, 1281.0, 771.0, 448.0, 297.0, 159.0, 87.0, 56.0, 42.0, 28.0, 15.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-13.8125, -13.3800048828125, -12.947509765625, -12.5150146484375, -12.08251953125, -11.6500244140625, -11.217529296875, -10.7850341796875, -10.3525390625, -9.9200439453125, -9.487548828125, -9.0550537109375, -8.62255859375, -8.1900634765625, -7.757568359375, -7.3250732421875, -6.892578125, -6.4600830078125, -6.027587890625, -5.5950927734375, -5.16259765625, -4.7301025390625, -4.297607421875, -3.8651123046875, -3.4326171875, -3.0001220703125, -2.567626953125, -2.1351318359375, -1.70263671875, -1.2701416015625, -0.837646484375, -0.4051513671875, 0.02734375, 0.4598388671875, 0.892333984375, 1.3248291015625, 1.75732421875, 2.1898193359375, 2.622314453125, 3.0548095703125, 3.4873046875, 3.9197998046875, 4.352294921875, 4.7847900390625, 5.21728515625, 5.6497802734375, 6.082275390625, 6.5147705078125, 6.947265625, 7.3797607421875, 7.812255859375, 8.2447509765625, 8.67724609375, 9.1097412109375, 9.542236328125, 9.9747314453125, 10.4072265625, 10.8397216796875, 11.272216796875, 11.7047119140625, 12.13720703125, 12.5697021484375, 13.002197265625, 13.4346923828125, 13.8671875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 8.0, 8.0, 7.0, 9.0, 16.0, 7.0, 19.0, 19.0, 17.0, 28.0, 28.0, 31.0, 34.0, 36.0, 32.0, 41.0, 47.0, 38.0, 30.0, 39.0, 36.0, 41.0, 29.0, 46.0, 40.0, 35.0, 25.0, 39.0, 32.0, 23.0, 16.0, 21.0, 15.0, 17.0, 8.0, 20.0, 10.0, 12.0, 6.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.109375, -16.585693359375, -16.06201171875, -15.538330078125, -15.0146484375, -14.490966796875, -13.96728515625, -13.443603515625, -12.919921875, -12.396240234375, -11.87255859375, -11.348876953125, -10.8251953125, -10.301513671875, -9.77783203125, -9.254150390625, -8.73046875, -8.206787109375, -7.68310546875, -7.159423828125, -6.6357421875, -6.112060546875, -5.58837890625, -5.064697265625, -4.541015625, -4.017333984375, -3.49365234375, -2.969970703125, -2.4462890625, -1.922607421875, -1.39892578125, -0.875244140625, -0.3515625, 0.172119140625, 0.69580078125, 1.219482421875, 1.7431640625, 2.266845703125, 2.79052734375, 3.314208984375, 3.837890625, 4.361572265625, 4.88525390625, 5.408935546875, 5.9326171875, 6.456298828125, 6.97998046875, 7.503662109375, 8.02734375, 8.551025390625, 9.07470703125, 9.598388671875, 10.1220703125, 10.645751953125, 11.16943359375, 11.693115234375, 12.216796875, 12.740478515625, 13.26416015625, 13.787841796875, 14.3115234375, 14.835205078125, 15.35888671875, 15.882568359375, 16.40625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 15.0, 13.0, 29.0, 42.0, 95.0, 165.0, 328.0, 573.0, 1027.0, 1897.0, 3506.0, 6094.0, 10951.0, 19280.0, 31882.0, 53592.0, 85637.0, 131601.0, 193207.0, 265260.0, 342417.0, 411167.0, 454394.0, 460554.0, 430210.0, 368847.0, 294363.0, 217866.0, 152551.0, 100705.0, 63536.0, 39107.0, 22955.0, 13387.0, 7646.0, 4245.0, 2323.0, 1296.0, 689.0, 362.0, 217.0, 112.0, 64.0, 42.0, 25.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.734375, -15.2740478515625, -14.813720703125, -14.3533935546875, -13.89306640625, -13.4327392578125, -12.972412109375, -12.5120849609375, -12.0517578125, -11.5914306640625, -11.131103515625, -10.6707763671875, -10.21044921875, -9.7501220703125, -9.289794921875, -8.8294677734375, -8.369140625, -7.9088134765625, -7.448486328125, -6.9881591796875, -6.52783203125, -6.0675048828125, -5.607177734375, -5.1468505859375, -4.6865234375, -4.2261962890625, -3.765869140625, -3.3055419921875, -2.84521484375, -2.3848876953125, -1.924560546875, -1.4642333984375, -1.00390625, -0.5435791015625, -0.083251953125, 0.3770751953125, 0.83740234375, 1.2977294921875, 1.758056640625, 2.2183837890625, 2.6787109375, 3.1390380859375, 3.599365234375, 4.0596923828125, 4.52001953125, 4.9803466796875, 5.440673828125, 5.9010009765625, 6.361328125, 6.8216552734375, 7.281982421875, 7.7423095703125, 8.20263671875, 8.6629638671875, 9.123291015625, 9.5836181640625, 10.0439453125, 10.5042724609375, 10.964599609375, 11.4249267578125, 11.88525390625, 12.3455810546875, 12.805908203125, 13.2662353515625, 13.7265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 6.0, 10.0, 7.0, 12.0, 15.0, 29.0, 38.0, 42.0, 53.0, 62.0, 99.0, 111.0, 127.0, 161.0, 170.0, 210.0, 209.0, 232.0, 248.0, 223.0, 249.0, 224.0, 199.0, 188.0, 198.0, 174.0, 140.0, 114.0, 102.0, 97.0, 74.0, 61.0, 46.0, 33.0, 32.0, 19.0, 12.0, 14.0, 6.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.4873046875, -8.193359375, -7.8994140625, -7.60546875, -7.3115234375, -7.017578125, -6.7236328125, -6.4296875, -6.1357421875, -5.841796875, -5.5478515625, -5.25390625, -4.9599609375, -4.666015625, -4.3720703125, -4.078125, -3.7841796875, -3.490234375, -3.1962890625, -2.90234375, -2.6083984375, -2.314453125, -2.0205078125, -1.7265625, -1.4326171875, -1.138671875, -0.8447265625, -0.55078125, -0.2568359375, 0.037109375, 0.3310546875, 0.625, 0.9189453125, 1.212890625, 1.5068359375, 1.80078125, 2.0947265625, 2.388671875, 2.6826171875, 2.9765625, 3.2705078125, 3.564453125, 3.8583984375, 4.15234375, 4.4462890625, 4.740234375, 5.0341796875, 5.328125, 5.6220703125, 5.916015625, 6.2099609375, 6.50390625, 6.7978515625, 7.091796875, 7.3857421875, 7.6796875, 7.9736328125, 8.267578125, 8.5615234375, 8.85546875, 9.1494140625, 9.443359375, 9.7373046875, 10.03125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 11.0, 10.0, 10.0, 18.0, 20.0, 24.0, 26.0, 17.0, 27.0, 33.0, 38.0, 45.0, 52.0, 46.0, 53.0, 58.0, 39.0, 43.0, 59.0, 49.0, 47.0, 34.0, 33.0, 35.0, 37.0, 29.0, 27.0, 11.0, 8.0, 13.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.399248123168945, -17.771133422851562, -17.143016815185547, -16.51490020751953, -15.886785507202148, -15.25866985321045, -14.63055419921875, -14.00243854522705, -13.374322891235352, -12.746207237243652, -12.118091583251953, -11.489975929260254, -10.861860275268555, -10.233744621276855, -9.605628967285156, -8.977513313293457, -8.349397659301758, -7.721282005310059, -7.093166351318359, -6.46505069732666, -5.836935043334961, -5.208819389343262, -4.5807037353515625, -3.9525880813598633, -3.324472427368164, -2.696356773376465, -2.0682411193847656, -1.4401254653930664, -0.8120098114013672, -0.18389415740966797, 0.44422149658203125, 1.0723371505737305, 1.7004528045654297, 2.328568458557129, 2.956684112548828, 3.5847997665405273, 4.212915420532227, 4.841031074523926, 5.469146728515625, 6.097262382507324, 6.725378036499023, 7.353493690490723, 7.981609344482422, 8.609724998474121, 9.23784065246582, 9.86595630645752, 10.494071960449219, 11.122187614440918, 11.750303268432617, 12.378418922424316, 13.006534576416016, 13.634650230407715, 14.262765884399414, 14.890881538391113, 15.518997192382812, 16.147113800048828, 16.77522850036621, 17.403343200683594, 18.03145980834961, 18.659576416015625, 19.287691116333008, 19.91580581665039, 20.543922424316406, 21.172039031982422, 21.800153732299805]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 11.0, 4.0, 4.0, 6.0, 10.0, 12.0, 20.0, 13.0, 14.0, 18.0, 12.0, 16.0, 26.0, 22.0, 31.0, 37.0, 27.0, 37.0, 35.0, 40.0, 38.0, 34.0, 60.0, 34.0, 36.0, 36.0, 43.0, 35.0, 34.0, 34.0, 29.0, 26.0, 26.0, 20.0, 11.0, 21.0, 8.0, 11.0, 17.0, 13.0, 10.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.7728214263916, -19.141103744506836, -18.509384155273438, -17.877666473388672, -17.245948791503906, -16.614229202270508, -15.982511520385742, -15.35079288482666, -14.719074249267578, -14.087355613708496, -13.455636978149414, -12.823919296264648, -12.192200660705566, -11.560482025146484, -10.928764343261719, -10.297045707702637, -9.665327072143555, -9.033608436584473, -8.40188980102539, -7.770172119140625, -7.138453483581543, -6.506734848022461, -5.875016689300537, -5.243298530578613, -4.611579895019531, -3.9798614978790283, -3.3481431007385254, -2.7164247035980225, -2.0847063064575195, -1.4529879093170166, -0.8212695121765137, -0.18955135345458984, 0.4421672821044922, 1.0738856792449951, 1.705604076385498, 2.337322473526001, 2.969040870666504, 3.600759267807007, 4.23247766494751, 4.864195823669434, 5.495914459228516, 6.127633094787598, 6.7593512535095215, 7.391069412231445, 8.022788047790527, 8.65450668334961, 9.286224365234375, 9.917943000793457, 10.549661636352539, 11.181380271911621, 11.813098907470703, 12.444816589355469, 13.07653522491455, 13.708253860473633, 14.339971542358398, 14.97169017791748, 15.603408813476562, 16.235126495361328, 16.866846084594727, 17.498563766479492, 18.13028335571289, 18.762001037597656, 19.393718719482422, 20.025436401367188, 20.657155990600586]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 8.0, 5.0, 12.0, 19.0, 21.0, 48.0, 56.0, 89.0, 175.0, 214.0, 304.0, 500.0, 722.0, 1214.0, 2108.0, 3596.0, 6025.0, 10308.0, 17840.0, 31673.0, 56146.0, 99675.0, 177618.0, 241908.0, 173177.0, 97139.0, 54638.0, 30763.0, 17581.0, 10148.0, 5915.0, 3476.0, 2036.0, 1204.0, 829.0, 496.0, 306.0, 198.0, 121.0, 82.0, 55.0, 38.0, 18.0, 17.0, 11.0, 14.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.921875, -2.8319091796875, -2.741943359375, -2.6519775390625, -2.56201171875, -2.4720458984375, -2.382080078125, -2.2921142578125, -2.2021484375, -2.1121826171875, -2.022216796875, -1.9322509765625, -1.84228515625, -1.7523193359375, -1.662353515625, -1.5723876953125, -1.482421875, -1.3924560546875, -1.302490234375, -1.2125244140625, -1.12255859375, -1.0325927734375, -0.942626953125, -0.8526611328125, -0.7626953125, -0.6727294921875, -0.582763671875, -0.4927978515625, -0.40283203125, -0.3128662109375, -0.222900390625, -0.1329345703125, -0.04296875, 0.0469970703125, 0.136962890625, 0.2269287109375, 0.31689453125, 0.4068603515625, 0.496826171875, 0.5867919921875, 0.6767578125, 0.7667236328125, 0.856689453125, 0.9466552734375, 1.03662109375, 1.1265869140625, 1.216552734375, 1.3065185546875, 1.396484375, 1.4864501953125, 1.576416015625, 1.6663818359375, 1.75634765625, 1.8463134765625, 1.936279296875, 2.0262451171875, 2.1162109375, 2.2061767578125, 2.296142578125, 2.3861083984375, 2.47607421875, 2.5660400390625, 2.656005859375, 2.7459716796875, 2.8359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 1.0, 12.0, 9.0, 6.0, 7.0, 11.0, 10.0, 15.0, 14.0, 16.0, 25.0, 22.0, 22.0, 24.0, 29.0, 40.0, 28.0, 41.0, 37.0, 42.0, 50.0, 47.0, 35.0, 34.0, 48.0, 47.0, 45.0, 36.0, 36.0, 22.0, 27.0, 25.0, 24.0, 21.0, 14.0, 15.0, 17.0, 12.0, 8.0, 6.0, 10.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-22.578125, -21.8779296875, -21.177734375, -20.4775390625, -19.77734375, -19.0771484375, -18.376953125, -17.6767578125, -16.9765625, -16.2763671875, -15.576171875, -14.8759765625, -14.17578125, -13.4755859375, -12.775390625, -12.0751953125, -11.375, -10.6748046875, -9.974609375, -9.2744140625, -8.57421875, -7.8740234375, -7.173828125, -6.4736328125, -5.7734375, -5.0732421875, -4.373046875, -3.6728515625, -2.97265625, -2.2724609375, -1.572265625, -0.8720703125, -0.171875, 0.5283203125, 1.228515625, 1.9287109375, 2.62890625, 3.3291015625, 4.029296875, 4.7294921875, 5.4296875, 6.1298828125, 6.830078125, 7.5302734375, 8.23046875, 8.9306640625, 9.630859375, 10.3310546875, 11.03125, 11.7314453125, 12.431640625, 13.1318359375, 13.83203125, 14.5322265625, 15.232421875, 15.9326171875, 16.6328125, 17.3330078125, 18.033203125, 18.7333984375, 19.43359375, 20.1337890625, 20.833984375, 21.5341796875, 22.234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 6.0, 2.0, 7.0, 14.0, 19.0, 42.0, 47.0, 81.0, 118.0, 140.0, 245.0, 292.0, 428.0, 610.0, 816.0, 1250.0, 1746.0, 2475.0, 3761.0, 5452.0, 8132.0, 12021.0, 18502.0, 28575.0, 44889.0, 69923.0, 108306.0, 159515.0, 184727.0, 137655.0, 91148.0, 58447.0, 37118.0, 23797.0, 15731.0, 10429.0, 6952.0, 4619.0, 3123.0, 2209.0, 1527.0, 1104.0, 734.0, 562.0, 390.0, 267.0, 198.0, 121.0, 74.0, 74.0, 42.0, 32.0, 23.0, 16.0, 11.0, 9.0, 4.0, 5.0, 1.0, 3.0], "bins": [-2.322265625, -2.2503662109375, -2.178466796875, -2.1065673828125, -2.03466796875, -1.9627685546875, -1.890869140625, -1.8189697265625, -1.7470703125, -1.6751708984375, -1.603271484375, -1.5313720703125, -1.45947265625, -1.3875732421875, -1.315673828125, -1.2437744140625, -1.171875, -1.0999755859375, -1.028076171875, -0.9561767578125, -0.88427734375, -0.8123779296875, -0.740478515625, -0.6685791015625, -0.5966796875, -0.5247802734375, -0.452880859375, -0.3809814453125, -0.30908203125, -0.2371826171875, -0.165283203125, -0.0933837890625, -0.021484375, 0.0504150390625, 0.122314453125, 0.1942138671875, 0.26611328125, 0.3380126953125, 0.409912109375, 0.4818115234375, 0.5537109375, 0.6256103515625, 0.697509765625, 0.7694091796875, 0.84130859375, 0.9132080078125, 0.985107421875, 1.0570068359375, 1.12890625, 1.2008056640625, 1.272705078125, 1.3446044921875, 1.41650390625, 1.4884033203125, 1.560302734375, 1.6322021484375, 1.7041015625, 1.7760009765625, 1.847900390625, 1.9197998046875, 1.99169921875, 2.0635986328125, 2.135498046875, 2.2073974609375, 2.279296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 10.0, 9.0, 12.0, 9.0, 15.0, 16.0, 13.0, 17.0, 20.0, 20.0, 25.0, 27.0, 27.0, 30.0, 43.0, 34.0, 33.0, 38.0, 27.0, 39.0, 42.0, 33.0, 32.0, 33.0, 44.0, 38.0, 31.0, 47.0, 27.0, 31.0, 16.0, 22.0, 23.0, 21.0, 19.0, 15.0, 17.0, 7.0, 5.0, 5.0, 4.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.03125, -12.62060546875, -12.2099609375, -11.79931640625, -11.388671875, -10.97802734375, -10.5673828125, -10.15673828125, -9.74609375, -9.33544921875, -8.9248046875, -8.51416015625, -8.103515625, -7.69287109375, -7.2822265625, -6.87158203125, -6.4609375, -6.05029296875, -5.6396484375, -5.22900390625, -4.818359375, -4.40771484375, -3.9970703125, -3.58642578125, -3.17578125, -2.76513671875, -2.3544921875, -1.94384765625, -1.533203125, -1.12255859375, -0.7119140625, -0.30126953125, 0.109375, 0.52001953125, 0.9306640625, 1.34130859375, 1.751953125, 2.16259765625, 2.5732421875, 2.98388671875, 3.39453125, 3.80517578125, 4.2158203125, 4.62646484375, 5.037109375, 5.44775390625, 5.8583984375, 6.26904296875, 6.6796875, 7.09033203125, 7.5009765625, 7.91162109375, 8.322265625, 8.73291015625, 9.1435546875, 9.55419921875, 9.96484375, 10.37548828125, 10.7861328125, 11.19677734375, 11.607421875, 12.01806640625, 12.4287109375, 12.83935546875, 13.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 14.0, 24.0, 28.0, 40.0, 68.0, 97.0, 168.0, 227.0, 338.0, 442.0, 588.0, 904.0, 1252.0, 1860.0, 2630.0, 3798.0, 5746.0, 8560.0, 12678.0, 19622.0, 31580.0, 51378.0, 87911.0, 159484.0, 239696.0, 172642.0, 95173.0, 55230.0, 33325.0, 21286.0, 13497.0, 8921.0, 5941.0, 4220.0, 2758.0, 1985.0, 1325.0, 947.0, 671.0, 448.0, 305.0, 218.0, 164.0, 122.0, 95.0, 49.0, 30.0, 33.0, 11.0, 8.0, 8.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.08154296875, -0.07911396026611328, -0.07668495178222656, -0.07425594329833984, -0.07182693481445312, -0.0693979263305664, -0.06696891784667969, -0.06453990936279297, -0.06211090087890625, -0.05968189239501953, -0.05725288391113281, -0.054823875427246094, -0.052394866943359375, -0.049965858459472656, -0.04753684997558594, -0.04510784149169922, -0.0426788330078125, -0.04024982452392578, -0.03782081604003906, -0.035391807556152344, -0.032962799072265625, -0.030533790588378906, -0.028104782104492188, -0.02567577362060547, -0.02324676513671875, -0.02081775665283203, -0.018388748168945312, -0.015959739685058594, -0.013530731201171875, -0.011101722717285156, -0.008672714233398438, -0.006243705749511719, -0.003814697265625, -0.0013856887817382812, 0.0010433197021484375, 0.0034723281860351562, 0.005901336669921875, 0.008330345153808594, 0.010759353637695312, 0.013188362121582031, 0.01561737060546875, 0.01804637908935547, 0.020475387573242188, 0.022904396057128906, 0.025333404541015625, 0.027762413024902344, 0.030191421508789062, 0.03262042999267578, 0.0350494384765625, 0.03747844696044922, 0.03990745544433594, 0.042336463928222656, 0.044765472412109375, 0.047194480895996094, 0.04962348937988281, 0.05205249786376953, 0.05448150634765625, 0.05691051483154297, 0.05933952331542969, 0.061768531799316406, 0.06419754028320312, 0.06662654876708984, 0.06905555725097656, 0.07148456573486328, 0.07391357421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 7.0, 8.0, 8.0, 14.0, 15.0, 15.0, 14.0, 25.0, 19.0, 24.0, 31.0, 41.0, 41.0, 36.0, 34.0, 40.0, 36.0, 32.0, 42.0, 35.0, 39.0, 61.0, 34.0, 33.0, 27.0, 32.0, 37.0, 30.0, 31.0, 18.0, 20.0, 25.0, 11.0, 18.0, 16.0, 11.0, 11.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.627206802368164e-05, -1.5798956155776978e-05, -1.5325844287872314e-05, -1.4852732419967651e-05, -1.4379620552062988e-05, -1.3906508684158325e-05, -1.3433396816253662e-05, -1.2960284948348999e-05, -1.2487173080444336e-05, -1.2014061212539673e-05, -1.154094934463501e-05, -1.1067837476730347e-05, -1.0594725608825684e-05, -1.012161374092102e-05, -9.648501873016357e-06, -9.175390005111694e-06, -8.702278137207031e-06, -8.229166269302368e-06, -7.756054401397705e-06, -7.282942533493042e-06, -6.809830665588379e-06, -6.336718797683716e-06, -5.863606929779053e-06, -5.39049506187439e-06, -4.9173831939697266e-06, -4.4442713260650635e-06, -3.9711594581604e-06, -3.4980475902557373e-06, -3.0249357223510742e-06, -2.551823854446411e-06, -2.078711986541748e-06, -1.605600118637085e-06, -1.1324882507324219e-06, -6.593763828277588e-07, -1.862645149230957e-07, 2.868473529815674e-07, 7.599592208862305e-07, 1.2330710887908936e-06, 1.7061829566955566e-06, 2.1792948246002197e-06, 2.652406692504883e-06, 3.125518560409546e-06, 3.598630428314209e-06, 4.071742296218872e-06, 4.544854164123535e-06, 5.017966032028198e-06, 5.491077899932861e-06, 5.964189767837524e-06, 6.4373016357421875e-06, 6.910413503646851e-06, 7.383525371551514e-06, 7.856637239456177e-06, 8.32974910736084e-06, 8.802860975265503e-06, 9.275972843170166e-06, 9.749084711074829e-06, 1.0222196578979492e-05, 1.0695308446884155e-05, 1.1168420314788818e-05, 1.1641532182693481e-05, 1.2114644050598145e-05, 1.2587755918502808e-05, 1.306086778640747e-05, 1.3533979654312134e-05, 1.4007091522216797e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 17.0, 17.0, 31.0, 51.0, 93.0, 125.0, 177.0, 252.0, 400.0, 633.0, 983.0, 1566.0, 2513.0, 3969.0, 6511.0, 10797.0, 17774.0, 29792.0, 51994.0, 93747.0, 185238.0, 293460.0, 155028.0, 80929.0, 45333.0, 26378.0, 15666.0, 9543.0, 5854.0, 3560.0, 2172.0, 1338.0, 923.0, 521.0, 383.0, 257.0, 155.0, 109.0, 75.0, 57.0, 38.0, 21.0, 14.0, 16.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1885986328125, -0.1825885772705078, -0.17657852172851562, -0.17056846618652344, -0.16455841064453125, -0.15854835510253906, -0.15253829956054688, -0.1465282440185547, -0.1405181884765625, -0.1345081329345703, -0.12849807739257812, -0.12248802185058594, -0.11647796630859375, -0.11046791076660156, -0.10445785522460938, -0.09844779968261719, -0.092437744140625, -0.08642768859863281, -0.08041763305664062, -0.07440757751464844, -0.06839752197265625, -0.06238746643066406, -0.056377410888671875, -0.05036735534667969, -0.0443572998046875, -0.03834724426269531, -0.032337188720703125, -0.026327133178710938, -0.02031707763671875, -0.014307022094726562, -0.008296966552734375, -0.0022869110107421875, 0.00372314453125, 0.009733200073242188, 0.015743255615234375, 0.021753311157226562, 0.02776336669921875, 0.03377342224121094, 0.039783477783203125, 0.04579353332519531, 0.0518035888671875, 0.05781364440917969, 0.06382369995117188, 0.06983375549316406, 0.07584381103515625, 0.08185386657714844, 0.08786392211914062, 0.09387397766113281, 0.099884033203125, 0.10589408874511719, 0.11190414428710938, 0.11791419982910156, 0.12392425537109375, 0.12993431091308594, 0.13594436645507812, 0.1419544219970703, 0.1479644775390625, 0.1539745330810547, 0.15998458862304688, 0.16599464416503906, 0.17200469970703125, 0.17801475524902344, 0.18402481079101562, 0.1900348663330078, 0.196044921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 5.0, 9.0, 8.0, 12.0, 14.0, 14.0, 16.0, 26.0, 30.0, 32.0, 51.0, 93.0, 136.0, 138.0, 117.0, 81.0, 36.0, 38.0, 32.0, 19.0, 20.0, 19.0, 8.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.1013174057006836, -0.09759330749511719, -0.09386920928955078, -0.09014511108398438, -0.08642101287841797, -0.08269691467285156, -0.07897281646728516, -0.07524871826171875, -0.07152462005615234, -0.06780052185058594, -0.06407642364501953, -0.060352325439453125, -0.05662822723388672, -0.05290412902832031, -0.049180030822753906, -0.0454559326171875, -0.041731834411621094, -0.03800773620605469, -0.03428363800048828, -0.030559539794921875, -0.02683544158935547, -0.023111343383789062, -0.019387245178222656, -0.01566314697265625, -0.011939048767089844, -0.008214950561523438, -0.004490852355957031, -0.000766754150390625, 0.0029573440551757812, 0.0066814422607421875, 0.010405540466308594, 0.014129638671875, 0.017853736877441406, 0.021577835083007812, 0.02530193328857422, 0.029026031494140625, 0.03275012969970703, 0.03647422790527344, 0.040198326110839844, 0.04392242431640625, 0.047646522521972656, 0.05137062072753906, 0.05509471893310547, 0.058818817138671875, 0.06254291534423828, 0.06626701354980469, 0.0699911117553711, 0.0737152099609375, 0.0774393081665039, 0.08116340637207031, 0.08488750457763672, 0.08861160278320312, 0.09233570098876953, 0.09605979919433594, 0.09978389739990234, 0.10350799560546875, 0.10723209381103516, 0.11095619201660156, 0.11468029022216797, 0.11840438842773438, 0.12212848663330078, 0.1258525848388672, 0.1295766830444336, 0.13330078125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 8.0, 18.0, 17.0, 28.0, 22.0, 20.0, 31.0, 29.0, 34.0, 45.0, 60.0, 41.0, 55.0, 54.0, 39.0, 44.0, 59.0, 48.0, 44.0, 34.0, 41.0, 31.0, 30.0, 35.0, 28.0, 13.0, 10.0, 12.0, 12.0, 5.0, 2.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.31485366821289, -17.69188690185547, -17.06892204284668, -16.44595718383789, -15.822990417480469, -15.200024604797363, -14.577058792114258, -13.954092979431152, -13.331127166748047, -12.708161354064941, -12.085195541381836, -11.46222972869873, -10.839263916015625, -10.21629810333252, -9.593332290649414, -8.970366477966309, -8.347400665283203, -7.724434852600098, -7.101469039916992, -6.478503227233887, -5.855537414550781, -5.232571601867676, -4.60960578918457, -3.986639976501465, -3.3636741638183594, -2.740708351135254, -2.1177425384521484, -1.494776725769043, -0.8718109130859375, -0.24884510040283203, 0.37412071228027344, 0.9970865249633789, 1.6200523376464844, 2.24301815032959, 2.8659839630126953, 3.488949775695801, 4.111915588378906, 4.734881401062012, 5.357847213745117, 5.980813026428223, 6.603778839111328, 7.226744651794434, 7.849710464477539, 8.472676277160645, 9.09564208984375, 9.718607902526855, 10.341573715209961, 10.964539527893066, 11.587505340576172, 12.210471153259277, 12.833436965942383, 13.456402778625488, 14.079368591308594, 14.7023344039917, 15.325300216674805, 15.94826602935791, 16.571231842041016, 17.194198608398438, 17.817163467407227, 18.440128326416016, 19.063095092773438, 19.68606185913086, 20.30902671813965, 20.931991577148438, 21.55495834350586]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 3.0, 6.0, 10.0, 14.0, 19.0, 12.0, 15.0, 17.0, 12.0, 16.0, 27.0, 21.0, 30.0, 38.0, 28.0, 35.0, 37.0, 39.0, 40.0, 34.0, 58.0, 35.0, 34.0, 41.0, 39.0, 36.0, 33.0, 36.0, 30.0, 23.0, 25.0, 22.0, 11.0, 19.0, 9.0, 12.0, 18.0, 11.0, 10.0, 10.0, 5.0, 7.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.883899688720703, -19.253053665161133, -18.622207641601562, -17.991361618041992, -17.360515594482422, -16.72966766357422, -16.09882164001465, -15.467975616455078, -14.837129592895508, -14.206283569335938, -13.575437545776367, -12.94459056854248, -12.31374454498291, -11.68289852142334, -11.052051544189453, -10.421205520629883, -9.790359497070312, -9.159513473510742, -8.528667449951172, -7.897820472717285, -7.266974449157715, -6.6361284255981445, -6.005281925201416, -5.3744354248046875, -4.743589401245117, -4.112743377685547, -3.4818968772888184, -2.851050615310669, -2.2202043533325195, -1.5893580913543701, -0.9585118293762207, -0.3276653289794922, 0.30318260192871094, 0.9340288639068604, 1.5648751258850098, 2.195721387863159, 2.8265676498413086, 3.457413911819458, 4.088260173797607, 4.719106674194336, 5.349952697753906, 5.980798721313477, 6.611645221710205, 7.242491722106934, 7.873337745666504, 8.504183769226074, 9.135030746459961, 9.765876770019531, 10.396722793579102, 11.027568817138672, 11.658414840698242, 12.289261817932129, 12.9201078414917, 13.55095386505127, 14.181800842285156, 14.812646865844727, 15.443492889404297, 16.074338912963867, 16.705184936523438, 17.336030960083008, 17.966876983642578, 18.59772491455078, 19.22857093811035, 19.859416961669922, 20.490262985229492]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 13.0, 22.0, 23.0, 33.0, 64.0, 101.0, 156.0, 235.0, 374.0, 598.0, 1001.0, 1456.0, 2331.0, 3530.0, 5484.0, 8300.0, 12255.0, 18240.0, 26383.0, 36489.0, 49250.0, 63282.0, 76745.0, 88672.0, 96671.0, 99122.0, 94425.0, 85322.0, 72040.0, 57836.0, 44300.0, 32570.0, 23518.0, 16132.0, 11041.0, 7289.0, 4684.0, 3065.0, 2031.0, 1223.0, 832.0, 527.0, 312.0, 195.0, 145.0, 88.0, 58.0, 34.0, 23.0, 12.0, 5.0, 6.0, 5.0, 3.0, 2.0, 4.0], "bins": [-10.5703125, -10.253173828125, -9.93603515625, -9.618896484375, -9.3017578125, -8.984619140625, -8.66748046875, -8.350341796875, -8.033203125, -7.716064453125, -7.39892578125, -7.081787109375, -6.7646484375, -6.447509765625, -6.13037109375, -5.813232421875, -5.49609375, -5.178955078125, -4.86181640625, -4.544677734375, -4.2275390625, -3.910400390625, -3.59326171875, -3.276123046875, -2.958984375, -2.641845703125, -2.32470703125, -2.007568359375, -1.6904296875, -1.373291015625, -1.05615234375, -0.739013671875, -0.421875, -0.104736328125, 0.21240234375, 0.529541015625, 0.8466796875, 1.163818359375, 1.48095703125, 1.798095703125, 2.115234375, 2.432373046875, 2.74951171875, 3.066650390625, 3.3837890625, 3.700927734375, 4.01806640625, 4.335205078125, 4.65234375, 4.969482421875, 5.28662109375, 5.603759765625, 5.9208984375, 6.238037109375, 6.55517578125, 6.872314453125, 7.189453125, 7.506591796875, 7.82373046875, 8.140869140625, 8.4580078125, 8.775146484375, 9.09228515625, 9.409423828125, 9.7265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 10.0, 3.0, 8.0, 9.0, 10.0, 15.0, 15.0, 17.0, 19.0, 18.0, 20.0, 17.0, 25.0, 23.0, 28.0, 26.0, 31.0, 35.0, 32.0, 39.0, 38.0, 40.0, 42.0, 37.0, 40.0, 42.0, 38.0, 31.0, 30.0, 21.0, 27.0, 27.0, 29.0, 12.0, 17.0, 15.0, 13.0, 24.0, 13.0, 13.0, 9.0, 8.0, 6.0, 10.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0], "bins": [-18.265625, -17.662841796875, -17.06005859375, -16.457275390625, -15.8544921875, -15.251708984375, -14.64892578125, -14.046142578125, -13.443359375, -12.840576171875, -12.23779296875, -11.635009765625, -11.0322265625, -10.429443359375, -9.82666015625, -9.223876953125, -8.62109375, -8.018310546875, -7.41552734375, -6.812744140625, -6.2099609375, -5.607177734375, -5.00439453125, -4.401611328125, -3.798828125, -3.196044921875, -2.59326171875, -1.990478515625, -1.3876953125, -0.784912109375, -0.18212890625, 0.420654296875, 1.0234375, 1.626220703125, 2.22900390625, 2.831787109375, 3.4345703125, 4.037353515625, 4.64013671875, 5.242919921875, 5.845703125, 6.448486328125, 7.05126953125, 7.654052734375, 8.2568359375, 8.859619140625, 9.46240234375, 10.065185546875, 10.66796875, 11.270751953125, 11.87353515625, 12.476318359375, 13.0791015625, 13.681884765625, 14.28466796875, 14.887451171875, 15.490234375, 16.093017578125, 16.69580078125, 17.298583984375, 17.9013671875, 18.504150390625, 19.10693359375, 19.709716796875, 20.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 17.0, 13.0, 11.0, 17.0, 36.0, 67.0, 66.0, 116.0, 170.0, 317.0, 479.0, 747.0, 1289.0, 2055.0, 3260.0, 5241.0, 8389.0, 13284.0, 20209.0, 30616.0, 42890.0, 58935.0, 76868.0, 93677.0, 105661.0, 109802.0, 106467.0, 94222.0, 78237.0, 60970.0, 44883.0, 31292.0, 21137.0, 13610.0, 8743.0, 5600.0, 3531.0, 2126.0, 1333.0, 847.0, 499.0, 282.0, 198.0, 125.0, 85.0, 48.0, 40.0, 18.0, 8.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.171875, -10.8177490234375, -10.463623046875, -10.1094970703125, -9.75537109375, -9.4012451171875, -9.047119140625, -8.6929931640625, -8.3388671875, -7.9847412109375, -7.630615234375, -7.2764892578125, -6.92236328125, -6.5682373046875, -6.214111328125, -5.8599853515625, -5.505859375, -5.1517333984375, -4.797607421875, -4.4434814453125, -4.08935546875, -3.7352294921875, -3.381103515625, -3.0269775390625, -2.6728515625, -2.3187255859375, -1.964599609375, -1.6104736328125, -1.25634765625, -0.9022216796875, -0.548095703125, -0.1939697265625, 0.16015625, 0.5142822265625, 0.868408203125, 1.2225341796875, 1.57666015625, 1.9307861328125, 2.284912109375, 2.6390380859375, 2.9931640625, 3.3472900390625, 3.701416015625, 4.0555419921875, 4.40966796875, 4.7637939453125, 5.117919921875, 5.4720458984375, 5.826171875, 6.1802978515625, 6.534423828125, 6.8885498046875, 7.24267578125, 7.5968017578125, 7.950927734375, 8.3050537109375, 8.6591796875, 9.0133056640625, 9.367431640625, 9.7215576171875, 10.07568359375, 10.4298095703125, 10.783935546875, 11.1380615234375, 11.4921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 9.0, 12.0, 6.0, 7.0, 17.0, 23.0, 20.0, 22.0, 32.0, 31.0, 25.0, 37.0, 39.0, 36.0, 40.0, 31.0, 45.0, 44.0, 37.0, 35.0, 41.0, 42.0, 30.0, 33.0, 35.0, 36.0, 33.0, 21.0, 32.0, 19.0, 12.0, 15.0, 14.0, 13.0, 17.0, 6.0, 7.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.1484375, -12.73486328125, -12.3212890625, -11.90771484375, -11.494140625, -11.08056640625, -10.6669921875, -10.25341796875, -9.83984375, -9.42626953125, -9.0126953125, -8.59912109375, -8.185546875, -7.77197265625, -7.3583984375, -6.94482421875, -6.53125, -6.11767578125, -5.7041015625, -5.29052734375, -4.876953125, -4.46337890625, -4.0498046875, -3.63623046875, -3.22265625, -2.80908203125, -2.3955078125, -1.98193359375, -1.568359375, -1.15478515625, -0.7412109375, -0.32763671875, 0.0859375, 0.49951171875, 0.9130859375, 1.32666015625, 1.740234375, 2.15380859375, 2.5673828125, 2.98095703125, 3.39453125, 3.80810546875, 4.2216796875, 4.63525390625, 5.048828125, 5.46240234375, 5.8759765625, 6.28955078125, 6.703125, 7.11669921875, 7.5302734375, 7.94384765625, 8.357421875, 8.77099609375, 9.1845703125, 9.59814453125, 10.01171875, 10.42529296875, 10.8388671875, 11.25244140625, 11.666015625, 12.07958984375, 12.4931640625, 12.90673828125, 13.3203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 11.0, 8.0, 11.0, 11.0, 31.0, 36.0, 60.0, 98.0, 169.0, 245.0, 331.0, 574.0, 884.0, 1286.0, 1978.0, 3123.0, 4745.0, 7142.0, 10565.0, 15509.0, 22149.0, 30728.0, 41333.0, 54231.0, 67386.0, 79845.0, 89514.0, 95441.0, 94959.0, 89130.0, 79092.0, 66790.0, 53046.0, 40852.0, 30142.0, 21716.0, 14851.0, 10364.0, 6972.0, 4571.0, 3005.0, 1963.0, 1267.0, 852.0, 532.0, 356.0, 242.0, 150.0, 107.0, 67.0, 39.0, 18.0, 16.0, 8.0, 7.0, 5.0, 0.0, 2.0, 3.0], "bins": [-3.12890625, -3.03399658203125, -2.9390869140625, -2.84417724609375, -2.749267578125, -2.65435791015625, -2.5594482421875, -2.46453857421875, -2.36962890625, -2.27471923828125, -2.1798095703125, -2.08489990234375, -1.989990234375, -1.89508056640625, -1.8001708984375, -1.70526123046875, -1.6103515625, -1.51544189453125, -1.4205322265625, -1.32562255859375, -1.230712890625, -1.13580322265625, -1.0408935546875, -0.94598388671875, -0.85107421875, -0.75616455078125, -0.6612548828125, -0.56634521484375, -0.471435546875, -0.37652587890625, -0.2816162109375, -0.18670654296875, -0.091796875, 0.00311279296875, 0.0980224609375, 0.19293212890625, 0.287841796875, 0.38275146484375, 0.4776611328125, 0.57257080078125, 0.66748046875, 0.76239013671875, 0.8572998046875, 0.95220947265625, 1.047119140625, 1.14202880859375, 1.2369384765625, 1.33184814453125, 1.4267578125, 1.52166748046875, 1.6165771484375, 1.71148681640625, 1.806396484375, 1.90130615234375, 1.9962158203125, 2.09112548828125, 2.18603515625, 2.28094482421875, 2.3758544921875, 2.47076416015625, 2.565673828125, 2.66058349609375, 2.7554931640625, 2.85040283203125, 2.9453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 0.0, 9.0, 13.0, 9.0, 12.0, 14.0, 17.0, 18.0, 19.0, 21.0, 24.0, 21.0, 33.0, 23.0, 26.0, 36.0, 41.0, 44.0, 51.0, 45.0, 44.0, 46.0, 34.0, 49.0, 46.0, 24.0, 42.0, 30.0, 29.0, 25.0, 22.0, 17.0, 19.0, 12.0, 15.0, 12.0, 10.0, 9.0, 11.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.0003902912139892578, -0.0003788881003856659, -0.000367484986782074, -0.00035608187317848206, -0.00034467875957489014, -0.0003332756459712982, -0.0003218725323677063, -0.0003104694187641144, -0.00029906630516052246, -0.00028766319155693054, -0.0002762600779533386, -0.0002648569643497467, -0.0002534538507461548, -0.00024205073714256287, -0.00023064762353897095, -0.00021924450993537903, -0.0002078413963317871, -0.0001964382827281952, -0.00018503516912460327, -0.00017363205552101135, -0.00016222894191741943, -0.00015082582831382751, -0.0001394227147102356, -0.00012801960110664368, -0.00011661648750305176, -0.00010521337389945984, -9.381026029586792e-05, -8.2407146692276e-05, -7.100403308868408e-05, -5.960091948509216e-05, -4.8197805881500244e-05, -3.6794692277908325e-05, -2.5391578674316406e-05, -1.3988465070724487e-05, -2.5853514671325684e-06, 8.81776213645935e-06, 2.022087574005127e-05, 3.162398934364319e-05, 4.302710294723511e-05, 5.4430216550827026e-05, 6.583333015441895e-05, 7.723644375801086e-05, 8.863955736160278e-05, 0.0001000426709651947, 0.00011144578456878662, 0.00012284889817237854, 0.00013425201177597046, 0.00014565512537956238, 0.0001570582389831543, 0.00016846135258674622, 0.00017986446619033813, 0.00019126757979393005, 0.00020267069339752197, 0.0002140738070011139, 0.0002254769206047058, 0.00023688003420829773, 0.00024828314781188965, 0.00025968626141548157, 0.0002710893750190735, 0.0002824924886226654, 0.0002938956022262573, 0.00030529871582984924, 0.00031670182943344116, 0.0003281049430370331, 0.000339508056640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 21.0, 31.0, 52.0, 84.0, 130.0, 187.0, 287.0, 504.0, 843.0, 1265.0, 2015.0, 3281.0, 5461.0, 8546.0, 13491.0, 20840.0, 31454.0, 45915.0, 63888.0, 82679.0, 100772.0, 111874.0, 115004.0, 107935.0, 92634.0, 73972.0, 54492.0, 38883.0, 25966.0, 16896.0, 10962.0, 6819.0, 4261.0, 2705.0, 1634.0, 1030.0, 663.0, 406.0, 251.0, 153.0, 98.0, 60.0, 36.0, 23.0, 14.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.486328125, -3.3671875, -3.248046875, -3.12890625, -3.009765625, -2.890625, -2.771484375, -2.65234375, -2.533203125, -2.4140625, -2.294921875, -2.17578125, -2.056640625, -1.9375, -1.818359375, -1.69921875, -1.580078125, -1.4609375, -1.341796875, -1.22265625, -1.103515625, -0.984375, -0.865234375, -0.74609375, -0.626953125, -0.5078125, -0.388671875, -0.26953125, -0.150390625, -0.03125, 0.087890625, 0.20703125, 0.326171875, 0.4453125, 0.564453125, 0.68359375, 0.802734375, 0.921875, 1.041015625, 1.16015625, 1.279296875, 1.3984375, 1.517578125, 1.63671875, 1.755859375, 1.875, 1.994140625, 2.11328125, 2.232421875, 2.3515625, 2.470703125, 2.58984375, 2.708984375, 2.828125, 2.947265625, 3.06640625, 3.185546875, 3.3046875, 3.423828125, 3.54296875, 3.662109375, 3.78125, 3.900390625, 4.01953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 10.0, 7.0, 8.0, 20.0, 21.0, 24.0, 25.0, 31.0, 47.0, 56.0, 54.0, 48.0, 44.0, 56.0, 57.0, 49.0, 66.0, 39.0, 57.0, 54.0, 42.0, 37.0, 30.0, 20.0, 26.0, 16.0, 14.0, 11.0, 12.0, 3.0, 6.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.830078125, -2.753265380859375, -2.67645263671875, -2.599639892578125, -2.5228271484375, -2.446014404296875, -2.36920166015625, -2.292388916015625, -2.215576171875, -2.138763427734375, -2.06195068359375, -1.985137939453125, -1.9083251953125, -1.831512451171875, -1.75469970703125, -1.677886962890625, -1.60107421875, -1.524261474609375, -1.44744873046875, -1.370635986328125, -1.2938232421875, -1.217010498046875, -1.14019775390625, -1.063385009765625, -0.986572265625, -0.909759521484375, -0.83294677734375, -0.756134033203125, -0.6793212890625, -0.602508544921875, -0.52569580078125, -0.448883056640625, -0.3720703125, -0.295257568359375, -0.21844482421875, -0.141632080078125, -0.0648193359375, 0.011993408203125, 0.08880615234375, 0.165618896484375, 0.242431640625, 0.319244384765625, 0.39605712890625, 0.472869873046875, 0.5496826171875, 0.626495361328125, 0.70330810546875, 0.780120849609375, 0.85693359375, 0.933746337890625, 1.01055908203125, 1.087371826171875, 1.1641845703125, 1.240997314453125, 1.31781005859375, 1.394622802734375, 1.471435546875, 1.548248291015625, 1.62506103515625, 1.701873779296875, 1.7786865234375, 1.855499267578125, 1.93231201171875, 2.009124755859375, 2.0859375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 5.0, 2.0, 11.0, 9.0, 16.0, 20.0, 28.0, 14.0, 18.0, 39.0, 30.0, 34.0, 52.0, 45.0, 52.0, 61.0, 48.0, 47.0, 53.0, 63.0, 40.0, 49.0, 39.0, 36.0, 42.0, 26.0, 29.0, 26.0, 16.0, 14.0, 9.0, 7.0, 1.0, 2.0, 8.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.092493057250977, -15.434326171875, -14.776158332824707, -14.11799144744873, -13.459823608398438, -12.801656723022461, -12.143489837646484, -11.485321998596191, -10.827154159545898, -10.168987274169922, -9.510819435119629, -8.852652549743652, -8.19448471069336, -7.536317825317383, -6.878150463104248, -6.219983100891113, -5.561816215515137, -4.903648853302002, -4.245481491088867, -3.5873143672943115, -2.9291470050811768, -2.270979642868042, -1.6128125190734863, -0.9546451568603516, -0.2964777946472168, 0.3616895079612732, 1.0198568105697632, 1.6780240535736084, 2.336191415786743, 2.994358777999878, 3.6525259017944336, 4.310693264007568, 4.968860626220703, 5.627027988433838, 6.285195350646973, 6.943362236022949, 7.601530075073242, 8.259696960449219, 8.917863845825195, 9.576031684875488, 10.234199523925781, 10.892366409301758, 11.55053424835205, 12.208701133728027, 12.86686897277832, 13.525035858154297, 14.183202743530273, 14.841370582580566, 15.499537467956543, 16.157705307006836, 16.815872192382812, 17.47403907775879, 18.132205963134766, 18.790374755859375, 19.44854164123535, 20.106708526611328, 20.764875411987305, 21.42304229736328, 22.081209182739258, 22.739377975463867, 23.397544860839844, 24.05571174621582, 24.713878631591797, 25.372047424316406, 26.030214309692383]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 3.0, 4.0, 9.0, 4.0, 11.0, 8.0, 9.0, 14.0, 18.0, 17.0, 17.0, 20.0, 23.0, 23.0, 15.0, 35.0, 31.0, 39.0, 30.0, 45.0, 39.0, 41.0, 48.0, 40.0, 39.0, 43.0, 25.0, 36.0, 30.0, 33.0, 43.0, 21.0, 25.0, 23.0, 14.0, 18.0, 14.0, 15.0, 8.0, 9.0, 11.0, 7.0, 7.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-20.20684242248535, -19.571300506591797, -18.935758590698242, -18.300216674804688, -17.664674758911133, -17.029132843017578, -16.393590927124023, -15.758048057556152, -15.122506141662598, -14.486964225769043, -13.851422309875488, -13.215880393981934, -12.580337524414062, -11.944795608520508, -11.309253692626953, -10.673711776733398, -10.038169860839844, -9.402627944946289, -8.767086029052734, -8.13154411315918, -7.496001720428467, -6.860459804534912, -6.224917411804199, -5.5893754959106445, -4.95383358001709, -4.318291664123535, -3.6827495098114014, -3.0472073554992676, -2.411665439605713, -1.7761235237121582, -1.1405813694000244, -0.5050392150878906, 0.13050079345703125, 0.7660428285598755, 1.4015848636627197, 2.0371270179748535, 2.672668933868408, 3.308210849761963, 3.9437530040740967, 4.5792951583862305, 5.214837074279785, 5.85037899017334, 6.4859209060668945, 7.121463298797607, 7.757005214691162, 8.392547607421875, 9.02808952331543, 9.663631439208984, 10.299173355102539, 10.934715270996094, 11.570257186889648, 12.205799102783203, 12.841341018676758, 13.476882934570312, 14.112425804138184, 14.747967720031738, 15.383509635925293, 16.019052505493164, 16.65459442138672, 17.290136337280273, 17.925678253173828, 18.561220169067383, 19.196762084960938, 19.832304000854492, 20.467845916748047]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 22.0, 25.0, 52.0, 95.0, 153.0, 228.0, 419.0, 706.0, 1123.0, 1815.0, 3134.0, 4998.0, 8445.0, 13603.0, 21781.0, 34397.0, 54142.0, 81541.0, 121214.0, 171528.0, 235083.0, 302159.0, 365451.0, 413921.0, 433064.0, 420231.0, 376944.0, 314370.0, 246913.0, 183809.0, 130368.0, 89640.0, 59312.0, 38188.0, 24482.0, 15777.0, 9749.0, 5942.0, 3654.0, 2279.0, 1374.0, 843.0, 511.0, 295.0, 185.0, 115.0, 81.0, 38.0, 32.0, 22.0, 14.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.28125, -12.8472900390625, -12.413330078125, -11.9793701171875, -11.54541015625, -11.1114501953125, -10.677490234375, -10.2435302734375, -9.8095703125, -9.3756103515625, -8.941650390625, -8.5076904296875, -8.07373046875, -7.6397705078125, -7.205810546875, -6.7718505859375, -6.337890625, -5.9039306640625, -5.469970703125, -5.0360107421875, -4.60205078125, -4.1680908203125, -3.734130859375, -3.3001708984375, -2.8662109375, -2.4322509765625, -1.998291015625, -1.5643310546875, -1.13037109375, -0.6964111328125, -0.262451171875, 0.1715087890625, 0.60546875, 1.0394287109375, 1.473388671875, 1.9073486328125, 2.34130859375, 2.7752685546875, 3.209228515625, 3.6431884765625, 4.0771484375, 4.5111083984375, 4.945068359375, 5.3790283203125, 5.81298828125, 6.2469482421875, 6.680908203125, 7.1148681640625, 7.548828125, 7.9827880859375, 8.416748046875, 8.8507080078125, 9.28466796875, 9.7186279296875, 10.152587890625, 10.5865478515625, 11.0205078125, 11.4544677734375, 11.888427734375, 12.3223876953125, 12.75634765625, 13.1903076171875, 13.624267578125, 14.0582275390625, 14.4921875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 4.0, 7.0, 7.0, 7.0, 6.0, 6.0, 15.0, 11.0, 17.0, 24.0, 17.0, 21.0, 21.0, 22.0, 27.0, 27.0, 33.0, 36.0, 44.0, 44.0, 50.0, 49.0, 36.0, 35.0, 47.0, 41.0, 39.0, 47.0, 23.0, 25.0, 26.0, 22.0, 23.0, 23.0, 19.0, 18.0, 10.0, 7.0, 9.0, 9.0, 10.0, 5.0, 5.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-17.546875, -17.0029296875, -16.458984375, -15.9150390625, -15.37109375, -14.8271484375, -14.283203125, -13.7392578125, -13.1953125, -12.6513671875, -12.107421875, -11.5634765625, -11.01953125, -10.4755859375, -9.931640625, -9.3876953125, -8.84375, -8.2998046875, -7.755859375, -7.2119140625, -6.66796875, -6.1240234375, -5.580078125, -5.0361328125, -4.4921875, -3.9482421875, -3.404296875, -2.8603515625, -2.31640625, -1.7724609375, -1.228515625, -0.6845703125, -0.140625, 0.4033203125, 0.947265625, 1.4912109375, 2.03515625, 2.5791015625, 3.123046875, 3.6669921875, 4.2109375, 4.7548828125, 5.298828125, 5.8427734375, 6.38671875, 6.9306640625, 7.474609375, 8.0185546875, 8.5625, 9.1064453125, 9.650390625, 10.1943359375, 10.73828125, 11.2822265625, 11.826171875, 12.3701171875, 12.9140625, 13.4580078125, 14.001953125, 14.5458984375, 15.08984375, 15.6337890625, 16.177734375, 16.7216796875, 17.265625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 12.0, 6.0, 10.0, 12.0, 30.0, 44.0, 75.0, 145.0, 253.0, 461.0, 711.0, 1240.0, 2006.0, 3374.0, 5666.0, 8992.0, 14350.0, 22364.0, 34651.0, 51911.0, 76191.0, 108684.0, 147979.0, 196053.0, 246734.0, 296992.0, 340954.0, 368607.0, 379691.0, 366623.0, 335312.0, 292259.0, 242078.0, 189852.0, 143470.0, 103404.0, 73172.0, 50098.0, 33017.0, 21632.0, 13600.0, 8372.0, 5248.0, 3146.0, 1967.0, 1153.0, 686.0, 428.0, 244.0, 136.0, 81.0, 55.0, 44.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-13.15625, -12.750732421875, -12.34521484375, -11.939697265625, -11.5341796875, -11.128662109375, -10.72314453125, -10.317626953125, -9.912109375, -9.506591796875, -9.10107421875, -8.695556640625, -8.2900390625, -7.884521484375, -7.47900390625, -7.073486328125, -6.66796875, -6.262451171875, -5.85693359375, -5.451416015625, -5.0458984375, -4.640380859375, -4.23486328125, -3.829345703125, -3.423828125, -3.018310546875, -2.61279296875, -2.207275390625, -1.8017578125, -1.396240234375, -0.99072265625, -0.585205078125, -0.1796875, 0.225830078125, 0.63134765625, 1.036865234375, 1.4423828125, 1.847900390625, 2.25341796875, 2.658935546875, 3.064453125, 3.469970703125, 3.87548828125, 4.281005859375, 4.6865234375, 5.092041015625, 5.49755859375, 5.903076171875, 6.30859375, 6.714111328125, 7.11962890625, 7.525146484375, 7.9306640625, 8.336181640625, 8.74169921875, 9.147216796875, 9.552734375, 9.958251953125, 10.36376953125, 10.769287109375, 11.1748046875, 11.580322265625, 11.98583984375, 12.391357421875, 12.796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 4.0, 8.0, 9.0, 4.0, 12.0, 17.0, 25.0, 38.0, 38.0, 50.0, 65.0, 68.0, 77.0, 97.0, 127.0, 131.0, 158.0, 183.0, 169.0, 179.0, 201.0, 227.0, 219.0, 207.0, 183.0, 195.0, 210.0, 168.0, 143.0, 129.0, 120.0, 103.0, 88.0, 76.0, 65.0, 66.0, 45.0, 39.0, 24.0, 27.0, 16.0, 13.0, 13.0, 11.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.421875, -8.1485595703125, -7.875244140625, -7.6019287109375, -7.32861328125, -7.0552978515625, -6.781982421875, -6.5086669921875, -6.2353515625, -5.9620361328125, -5.688720703125, -5.4154052734375, -5.14208984375, -4.8687744140625, -4.595458984375, -4.3221435546875, -4.048828125, -3.7755126953125, -3.502197265625, -3.2288818359375, -2.95556640625, -2.6822509765625, -2.408935546875, -2.1356201171875, -1.8623046875, -1.5889892578125, -1.315673828125, -1.0423583984375, -0.76904296875, -0.4957275390625, -0.222412109375, 0.0509033203125, 0.32421875, 0.5975341796875, 0.870849609375, 1.1441650390625, 1.41748046875, 1.6907958984375, 1.964111328125, 2.2374267578125, 2.5107421875, 2.7840576171875, 3.057373046875, 3.3306884765625, 3.60400390625, 3.8773193359375, 4.150634765625, 4.4239501953125, 4.697265625, 4.9705810546875, 5.243896484375, 5.5172119140625, 5.79052734375, 6.0638427734375, 6.337158203125, 6.6104736328125, 6.8837890625, 7.1571044921875, 7.430419921875, 7.7037353515625, 7.97705078125, 8.2503662109375, 8.523681640625, 8.7969970703125, 9.0703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 1.0, 6.0, 7.0, 12.0, 14.0, 9.0, 16.0, 30.0, 28.0, 27.0, 31.0, 27.0, 40.0, 39.0, 52.0, 54.0, 53.0, 60.0, 50.0, 56.0, 58.0, 44.0, 32.0, 45.0, 33.0, 37.0, 21.0, 22.0, 24.0, 20.0, 14.0, 8.0, 6.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.79474449157715, -19.080846786499023, -18.3669490814209, -17.653051376342773, -16.93915367126465, -16.225257873535156, -15.511359214782715, -14.797462463378906, -14.083564758300781, -13.369667053222656, -12.655769348144531, -11.941871643066406, -11.227974891662598, -10.514077186584473, -9.800179481506348, -9.086282730102539, -8.372384071350098, -7.658486366271973, -6.944589138031006, -6.230691432952881, -5.516794204711914, -4.802896499633789, -4.088998794555664, -3.3751015663146973, -2.6612038612365723, -1.9473063945770264, -1.233408808708191, -0.5195112228393555, 0.19438624382019043, 0.9082837104797363, 1.6221814155578613, 2.336078643798828, 3.049976348876953, 3.763873815536499, 4.477771282196045, 5.19166898727417, 5.905566215515137, 6.619463920593262, 7.333361625671387, 8.047258377075195, 8.76115608215332, 9.475053787231445, 10.18895149230957, 10.902849197387695, 11.616745948791504, 12.330643653869629, 13.044541358947754, 13.758438110351562, 14.472336769104004, 15.186234474182129, 15.900132179260254, 16.614028930664062, 17.327926635742188, 18.041824340820312, 18.755722045898438, 19.469619750976562, 20.183517456054688, 20.897415161132812, 21.611312866210938, 22.325210571289062, 23.039108276367188, 23.753005981445312, 24.466903686523438, 25.18079948425293, 25.894697189331055]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 2.0, 13.0, 8.0, 10.0, 5.0, 15.0, 12.0, 17.0, 18.0, 20.0, 21.0, 26.0, 26.0, 43.0, 22.0, 23.0, 25.0, 34.0, 23.0, 32.0, 48.0, 35.0, 33.0, 39.0, 37.0, 40.0, 35.0, 29.0, 29.0, 25.0, 26.0, 27.0, 16.0, 22.0, 21.0, 13.0, 11.0, 13.0, 14.0, 12.0, 15.0, 12.0, 14.0, 11.0, 6.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.253223419189453, -18.640270233154297, -18.027318954467773, -17.414365768432617, -16.801414489746094, -16.188461303710938, -15.575508117675781, -14.962555885314941, -14.349603652954102, -13.736651420593262, -13.123699188232422, -12.510746002197266, -11.897793769836426, -11.284841537475586, -10.67188835144043, -10.05893611907959, -9.44598388671875, -8.83303165435791, -8.22007942199707, -7.607126235961914, -6.994174003601074, -6.381221771240234, -5.768269062042236, -5.155316352844238, -4.542364120483398, -3.9294116497039795, -3.3164591789245605, -2.7035067081451416, -2.0905542373657227, -1.4776017665863037, -0.8646492958068848, -0.2516965866088867, 0.36125755310058594, 0.9742100238800049, 1.5871624946594238, 2.2001149654388428, 2.8130674362182617, 3.4260199069976807, 4.0389723777771, 4.651925086975098, 5.2648773193359375, 5.877829551696777, 6.490782260894775, 7.103734970092773, 7.716687202453613, 8.329639434814453, 8.94259262084961, 9.55554485321045, 10.168497085571289, 10.781449317932129, 11.394401550292969, 12.007354736328125, 12.620306968688965, 13.233259201049805, 13.846212387084961, 14.4591646194458, 15.07211685180664, 15.68506908416748, 16.29802131652832, 16.910974502563477, 17.52392578125, 18.136878967285156, 18.749832153320312, 19.36278533935547, 19.975736618041992]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 8.0, 3.0, 12.0, 21.0, 30.0, 35.0, 82.0, 87.0, 135.0, 214.0, 333.0, 511.0, 811.0, 1281.0, 2099.0, 3327.0, 5876.0, 9966.0, 17357.0, 30294.0, 53639.0, 94926.0, 168662.0, 241876.0, 180668.0, 101827.0, 57253.0, 32306.0, 18505.0, 10569.0, 6095.0, 3782.0, 2210.0, 1355.0, 824.0, 551.0, 342.0, 241.0, 166.0, 95.0, 60.0, 40.0, 29.0, 18.0, 12.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.662628173828125, -2.56939697265625, -2.476165771484375, -2.3829345703125, -2.289703369140625, -2.19647216796875, -2.103240966796875, -2.010009765625, -1.916778564453125, -1.82354736328125, -1.730316162109375, -1.6370849609375, -1.543853759765625, -1.45062255859375, -1.357391357421875, -1.26416015625, -1.170928955078125, -1.07769775390625, -0.984466552734375, -0.8912353515625, -0.798004150390625, -0.70477294921875, -0.611541748046875, -0.518310546875, -0.425079345703125, -0.33184814453125, -0.238616943359375, -0.1453857421875, -0.052154541015625, 0.04107666015625, 0.134307861328125, 0.2275390625, 0.320770263671875, 0.41400146484375, 0.507232666015625, 0.6004638671875, 0.693695068359375, 0.78692626953125, 0.880157470703125, 0.973388671875, 1.066619873046875, 1.15985107421875, 1.253082275390625, 1.3463134765625, 1.439544677734375, 1.53277587890625, 1.626007080078125, 1.71923828125, 1.812469482421875, 1.90570068359375, 1.998931884765625, 2.0921630859375, 2.185394287109375, 2.27862548828125, 2.371856689453125, 2.465087890625, 2.558319091796875, 2.65155029296875, 2.744781494140625, 2.8380126953125, 2.931243896484375, 3.02447509765625, 3.117706298828125, 3.2109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 3.0, 5.0, 8.0, 9.0, 6.0, 15.0, 12.0, 17.0, 25.0, 25.0, 24.0, 24.0, 21.0, 28.0, 31.0, 30.0, 34.0, 31.0, 33.0, 40.0, 46.0, 31.0, 32.0, 40.0, 36.0, 29.0, 37.0, 29.0, 27.0, 33.0, 26.0, 27.0, 22.0, 19.0, 17.0, 13.0, 15.0, 13.0, 16.0, 17.0, 8.0, 8.0, 8.0, 5.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-21.0, -20.345703125, -19.69140625, -19.037109375, -18.3828125, -17.728515625, -17.07421875, -16.419921875, -15.765625, -15.111328125, -14.45703125, -13.802734375, -13.1484375, -12.494140625, -11.83984375, -11.185546875, -10.53125, -9.876953125, -9.22265625, -8.568359375, -7.9140625, -7.259765625, -6.60546875, -5.951171875, -5.296875, -4.642578125, -3.98828125, -3.333984375, -2.6796875, -2.025390625, -1.37109375, -0.716796875, -0.0625, 0.591796875, 1.24609375, 1.900390625, 2.5546875, 3.208984375, 3.86328125, 4.517578125, 5.171875, 5.826171875, 6.48046875, 7.134765625, 7.7890625, 8.443359375, 9.09765625, 9.751953125, 10.40625, 11.060546875, 11.71484375, 12.369140625, 13.0234375, 13.677734375, 14.33203125, 14.986328125, 15.640625, 16.294921875, 16.94921875, 17.603515625, 18.2578125, 18.912109375, 19.56640625, 20.220703125, 20.875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 9.0, 6.0, 15.0, 10.0, 32.0, 38.0, 62.0, 78.0, 138.0, 177.0, 301.0, 425.0, 593.0, 941.0, 1374.0, 1993.0, 3035.0, 4517.0, 6800.0, 10697.0, 17230.0, 27475.0, 44968.0, 73212.0, 117045.0, 174351.0, 194071.0, 137562.0, 88249.0, 53340.0, 32592.0, 20358.0, 12876.0, 8211.0, 5343.0, 3393.0, 2261.0, 1549.0, 1024.0, 682.0, 486.0, 299.0, 263.0, 157.0, 111.0, 67.0, 51.0, 28.0, 27.0, 16.0, 9.0, 2.0, 8.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.728515625, -2.64373779296875, -2.5589599609375, -2.47418212890625, -2.389404296875, -2.30462646484375, -2.2198486328125, -2.13507080078125, -2.05029296875, -1.96551513671875, -1.8807373046875, -1.79595947265625, -1.711181640625, -1.62640380859375, -1.5416259765625, -1.45684814453125, -1.3720703125, -1.28729248046875, -1.2025146484375, -1.11773681640625, -1.032958984375, -0.94818115234375, -0.8634033203125, -0.77862548828125, -0.69384765625, -0.60906982421875, -0.5242919921875, -0.43951416015625, -0.354736328125, -0.26995849609375, -0.1851806640625, -0.10040283203125, -0.015625, 0.06915283203125, 0.1539306640625, 0.23870849609375, 0.323486328125, 0.40826416015625, 0.4930419921875, 0.57781982421875, 0.66259765625, 0.74737548828125, 0.8321533203125, 0.91693115234375, 1.001708984375, 1.08648681640625, 1.1712646484375, 1.25604248046875, 1.3408203125, 1.42559814453125, 1.5103759765625, 1.59515380859375, 1.679931640625, 1.76470947265625, 1.8494873046875, 1.93426513671875, 2.01904296875, 2.10382080078125, 2.1885986328125, 2.27337646484375, 2.358154296875, 2.44293212890625, 2.5277099609375, 2.61248779296875, 2.697265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 10.0, 9.0, 16.0, 15.0, 13.0, 28.0, 26.0, 14.0, 24.0, 30.0, 24.0, 38.0, 30.0, 30.0, 43.0, 46.0, 40.0, 54.0, 37.0, 44.0, 43.0, 40.0, 24.0, 37.0, 38.0, 35.0, 28.0, 25.0, 20.0, 17.0, 13.0, 17.0, 15.0, 12.0, 7.0, 12.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.3515625, -12.8795166015625, -12.407470703125, -11.9354248046875, -11.46337890625, -10.9913330078125, -10.519287109375, -10.0472412109375, -9.5751953125, -9.1031494140625, -8.631103515625, -8.1590576171875, -7.68701171875, -7.2149658203125, -6.742919921875, -6.2708740234375, -5.798828125, -5.3267822265625, -4.854736328125, -4.3826904296875, -3.91064453125, -3.4385986328125, -2.966552734375, -2.4945068359375, -2.0224609375, -1.5504150390625, -1.078369140625, -0.6063232421875, -0.13427734375, 0.3377685546875, 0.809814453125, 1.2818603515625, 1.75390625, 2.2259521484375, 2.697998046875, 3.1700439453125, 3.64208984375, 4.1141357421875, 4.586181640625, 5.0582275390625, 5.5302734375, 6.0023193359375, 6.474365234375, 6.9464111328125, 7.41845703125, 7.8905029296875, 8.362548828125, 8.8345947265625, 9.306640625, 9.7786865234375, 10.250732421875, 10.7227783203125, 11.19482421875, 11.6668701171875, 12.138916015625, 12.6109619140625, 13.0830078125, 13.5550537109375, 14.027099609375, 14.4991455078125, 14.97119140625, 15.4432373046875, 15.915283203125, 16.3873291015625, 16.859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 17.0, 16.0, 20.0, 38.0, 59.0, 81.0, 125.0, 177.0, 266.0, 392.0, 626.0, 940.0, 1305.0, 1870.0, 2811.0, 4377.0, 6488.0, 10176.0, 15861.0, 25042.0, 42447.0, 74419.0, 141607.0, 249225.0, 208624.0, 108956.0, 59184.0, 34275.0, 20934.0, 13076.0, 8446.0, 5400.0, 3703.0, 2447.0, 1656.0, 1161.0, 756.0, 493.0, 382.0, 225.0, 135.0, 108.0, 76.0, 50.0, 31.0, 23.0, 10.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.08306884765625, -0.0806112289428711, -0.07815361022949219, -0.07569599151611328, -0.07323837280273438, -0.07078075408935547, -0.06832313537597656, -0.06586551666259766, -0.06340789794921875, -0.060950279235839844, -0.05849266052246094, -0.05603504180908203, -0.053577423095703125, -0.05111980438232422, -0.04866218566894531, -0.046204566955566406, -0.0437469482421875, -0.041289329528808594, -0.03883171081542969, -0.03637409210205078, -0.033916473388671875, -0.03145885467529297, -0.029001235961914062, -0.026543617248535156, -0.02408599853515625, -0.021628379821777344, -0.019170761108398438, -0.01671314239501953, -0.014255523681640625, -0.011797904968261719, -0.009340286254882812, -0.006882667541503906, -0.004425048828125, -0.0019674301147460938, 0.0004901885986328125, 0.0029478073120117188, 0.005405426025390625, 0.007863044738769531, 0.010320663452148438, 0.012778282165527344, 0.01523590087890625, 0.017693519592285156, 0.020151138305664062, 0.02260875701904297, 0.025066375732421875, 0.02752399444580078, 0.029981613159179688, 0.032439231872558594, 0.0348968505859375, 0.037354469299316406, 0.03981208801269531, 0.04226970672607422, 0.044727325439453125, 0.04718494415283203, 0.04964256286621094, 0.052100181579589844, 0.05455780029296875, 0.057015419006347656, 0.05947303771972656, 0.06193065643310547, 0.06438827514648438, 0.06684589385986328, 0.06930351257324219, 0.0717611312866211, 0.07421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 8.0, 9.0, 7.0, 10.0, 8.0, 13.0, 20.0, 14.0, 28.0, 23.0, 36.0, 26.0, 25.0, 27.0, 39.0, 50.0, 38.0, 50.0, 55.0, 56.0, 48.0, 49.0, 35.0, 39.0, 34.0, 40.0, 34.0, 32.0, 18.0, 28.0, 18.0, 10.0, 9.0, 11.0, 8.0, 7.0, 11.0, 3.0, 4.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.519918441772461e-05, -1.4706514775753021e-05, -1.4213845133781433e-05, -1.3721175491809845e-05, -1.3228505849838257e-05, -1.2735836207866669e-05, -1.224316656589508e-05, -1.1750496923923492e-05, -1.1257827281951904e-05, -1.0765157639980316e-05, -1.0272487998008728e-05, -9.77981835603714e-06, -9.287148714065552e-06, -8.794479072093964e-06, -8.301809430122375e-06, -7.809139788150787e-06, -7.316470146179199e-06, -6.823800504207611e-06, -6.331130862236023e-06, -5.838461220264435e-06, -5.345791578292847e-06, -4.8531219363212585e-06, -4.36045229434967e-06, -3.867782652378082e-06, -3.375113010406494e-06, -2.882443368434906e-06, -2.389773726463318e-06, -1.8971040844917297e-06, -1.4044344425201416e-06, -9.117648005485535e-07, -4.1909515857696533e-07, 7.35744833946228e-08, 5.662441253662109e-07, 1.058913767337799e-06, 1.5515834093093872e-06, 2.0442530512809753e-06, 2.5369226932525635e-06, 3.0295923352241516e-06, 3.5222619771957397e-06, 4.014931619167328e-06, 4.507601261138916e-06, 5.000270903110504e-06, 5.492940545082092e-06, 5.98561018705368e-06, 6.4782798290252686e-06, 6.970949470996857e-06, 7.463619112968445e-06, 7.956288754940033e-06, 8.448958396911621e-06, 8.94162803888321e-06, 9.434297680854797e-06, 9.926967322826385e-06, 1.0419636964797974e-05, 1.0912306606769562e-05, 1.140497624874115e-05, 1.1897645890712738e-05, 1.2390315532684326e-05, 1.2882985174655914e-05, 1.3375654816627502e-05, 1.386832445859909e-05, 1.4360994100570679e-05, 1.4853663742542267e-05, 1.5346333384513855e-05, 1.5839003026485443e-05, 1.633167266845703e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 13.0, 15.0, 19.0, 33.0, 55.0, 59.0, 97.0, 136.0, 206.0, 319.0, 461.0, 681.0, 1040.0, 1506.0, 2295.0, 3293.0, 4904.0, 7147.0, 11057.0, 16984.0, 26695.0, 42239.0, 69684.0, 124641.0, 238208.0, 213791.0, 110708.0, 63005.0, 38477.0, 24059.0, 15712.0, 10134.0, 6750.0, 4482.0, 3181.0, 2066.0, 1446.0, 936.0, 652.0, 472.0, 321.0, 187.0, 141.0, 81.0, 54.0, 37.0, 29.0, 21.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1513671875, -0.1464691162109375, -0.141571044921875, -0.1366729736328125, -0.13177490234375, -0.1268768310546875, -0.121978759765625, -0.1170806884765625, -0.1121826171875, -0.1072845458984375, -0.102386474609375, -0.0974884033203125, -0.09259033203125, -0.0876922607421875, -0.082794189453125, -0.0778961181640625, -0.072998046875, -0.0680999755859375, -0.063201904296875, -0.0583038330078125, -0.05340576171875, -0.0485076904296875, -0.043609619140625, -0.0387115478515625, -0.0338134765625, -0.0289154052734375, -0.024017333984375, -0.0191192626953125, -0.01422119140625, -0.0093231201171875, -0.004425048828125, 0.0004730224609375, 0.00537109375, 0.0102691650390625, 0.015167236328125, 0.0200653076171875, 0.02496337890625, 0.0298614501953125, 0.034759521484375, 0.0396575927734375, 0.0445556640625, 0.0494537353515625, 0.054351806640625, 0.0592498779296875, 0.06414794921875, 0.0690460205078125, 0.073944091796875, 0.0788421630859375, 0.083740234375, 0.0886383056640625, 0.093536376953125, 0.0984344482421875, 0.10333251953125, 0.1082305908203125, 0.113128662109375, 0.1180267333984375, 0.1229248046875, 0.1278228759765625, 0.132720947265625, 0.1376190185546875, 0.14251708984375, 0.1474151611328125, 0.152313232421875, 0.1572113037109375, 0.162109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 12.0, 11.0, 12.0, 17.0, 18.0, 26.0, 22.0, 30.0, 51.0, 65.0, 85.0, 91.0, 89.0, 93.0, 73.0, 54.0, 45.0, 29.0, 32.0, 19.0, 14.0, 18.0, 9.0, 11.0, 6.0, 5.0, 5.0, 8.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08746337890625, -0.08448028564453125, -0.0814971923828125, -0.07851409912109375, -0.075531005859375, -0.07254791259765625, -0.0695648193359375, -0.06658172607421875, -0.0635986328125, -0.06061553955078125, -0.0576324462890625, -0.05464935302734375, -0.051666259765625, -0.04868316650390625, -0.0457000732421875, -0.04271697998046875, -0.03973388671875, -0.03675079345703125, -0.0337677001953125, -0.03078460693359375, -0.027801513671875, -0.02481842041015625, -0.0218353271484375, -0.01885223388671875, -0.015869140625, -0.01288604736328125, -0.0099029541015625, -0.00691986083984375, -0.003936767578125, -0.00095367431640625, 0.0020294189453125, 0.00501251220703125, 0.00799560546875, 0.01097869873046875, 0.0139617919921875, 0.01694488525390625, 0.019927978515625, 0.02291107177734375, 0.0258941650390625, 0.02887725830078125, 0.0318603515625, 0.03484344482421875, 0.0378265380859375, 0.04080963134765625, 0.043792724609375, 0.04677581787109375, 0.0497589111328125, 0.05274200439453125, 0.05572509765625, 0.05870819091796875, 0.0616912841796875, 0.06467437744140625, 0.067657470703125, 0.07064056396484375, 0.0736236572265625, 0.07660675048828125, 0.07958984375, 0.08257293701171875, 0.0855560302734375, 0.08853912353515625, 0.091522216796875, 0.09450531005859375, 0.0974884033203125, 0.10047149658203125, 0.10345458984375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 15.0, 11.0, 13.0, 13.0, 25.0, 24.0, 27.0, 31.0, 28.0, 34.0, 32.0, 58.0, 57.0, 50.0, 59.0, 43.0, 65.0, 46.0, 56.0, 36.0, 34.0, 38.0, 39.0, 21.0, 26.0, 25.0, 22.0, 11.0, 14.0, 9.0, 10.0, 2.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.748821258544922, -19.04790687561035, -18.34699249267578, -17.646080017089844, -16.945165634155273, -16.244251251220703, -15.54333782196045, -14.842424392700195, -14.141510009765625, -13.440595626831055, -12.7396821975708, -12.038768768310547, -11.337854385375977, -10.636940002441406, -9.936026573181152, -9.235113143920898, -8.534198760986328, -7.833284854888916, -7.132370948791504, -6.431457042694092, -5.73054313659668, -5.029629230499268, -4.3287153244018555, -3.6278014183044434, -2.9268875122070312, -2.225973606109619, -1.525059700012207, -0.8241457939147949, -0.12323188781738281, 0.5776820182800293, 1.2785959243774414, 1.9795098304748535, 2.6804256439208984, 3.3813395500183105, 4.082253456115723, 4.783167362213135, 5.484081268310547, 6.184995174407959, 6.885909080505371, 7.586822986602783, 8.287736892700195, 8.988651275634766, 9.68956470489502, 10.390478134155273, 11.091392517089844, 11.792306900024414, 12.493220329284668, 13.194133758544922, 13.895048141479492, 14.595962524414062, 15.296875953674316, 15.99778938293457, 16.69870376586914, 17.39961814880371, 18.10053253173828, 18.80144500732422, 19.50235939025879, 20.20327377319336, 20.904186248779297, 21.605100631713867, 22.306015014648438, 23.006929397583008, 23.707843780517578, 24.408756256103516, 25.109670639038086]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 11.0, 9.0, 10.0, 5.0, 13.0, 14.0, 17.0, 16.0, 22.0, 20.0, 27.0, 25.0, 44.0, 22.0, 23.0, 25.0, 34.0, 23.0, 33.0, 43.0, 39.0, 32.0, 40.0, 38.0, 39.0, 38.0, 27.0, 28.0, 24.0, 28.0, 27.0, 15.0, 22.0, 21.0, 13.0, 11.0, 13.0, 15.0, 12.0, 14.0, 13.0, 13.0, 12.0, 5.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.268037796020508, -18.65593147277832, -18.043825149536133, -17.431718826293945, -16.819612503051758, -16.20750617980957, -15.595398902893066, -14.983292579650879, -14.371186256408691, -13.759079933166504, -13.146973609924316, -12.534867286682129, -11.922760009765625, -11.310653686523438, -10.69854736328125, -10.086441040039062, -9.474334716796875, -8.862228393554688, -8.2501220703125, -7.638015270233154, -7.025908946990967, -6.413802623748779, -5.801695823669434, -5.189589500427246, -4.577483177185059, -3.965376853942871, -3.3532702922821045, -2.741163730621338, -2.1290574073791504, -1.516951084136963, -0.9048445224761963, -0.2927379608154297, 0.319366455078125, 0.931472897529602, 1.543579339981079, 2.1556859016418457, 2.767792224884033, 3.3798985481262207, 3.9920051097869873, 4.604111671447754, 5.216217994689941, 5.828324317932129, 6.440430641174316, 7.052537441253662, 7.66464376449585, 8.276750564575195, 8.888856887817383, 9.50096321105957, 10.113069534301758, 10.725175857543945, 11.337282180786133, 11.94938850402832, 12.561494827270508, 13.173601150512695, 13.7857084274292, 14.397814750671387, 15.009921073913574, 15.622027397155762, 16.234134674072266, 16.846240997314453, 17.45834732055664, 18.070453643798828, 18.682559967041016, 19.294666290283203, 19.90677261352539]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 13.0, 19.0, 22.0, 51.0, 66.0, 109.0, 160.0, 262.0, 427.0, 602.0, 892.0, 1417.0, 2233.0, 3239.0, 4677.0, 6986.0, 10022.0, 14291.0, 19613.0, 26673.0, 35170.0, 45663.0, 56399.0, 67174.0, 76441.0, 83972.0, 86899.0, 85993.0, 81377.0, 72848.0, 61925.0, 51201.0, 40828.0, 31634.0, 23428.0, 17181.0, 12422.0, 8545.0, 5747.0, 3993.0, 2670.0, 1839.0, 1185.0, 790.0, 521.0, 305.0, 214.0, 138.0, 98.0, 60.0, 43.0, 28.0, 15.0, 16.0, 6.0, 6.0, 4.0, 4.0], "bins": [-9.3515625, -9.0662841796875, -8.781005859375, -8.4957275390625, -8.21044921875, -7.9251708984375, -7.639892578125, -7.3546142578125, -7.0693359375, -6.7840576171875, -6.498779296875, -6.2135009765625, -5.92822265625, -5.6429443359375, -5.357666015625, -5.0723876953125, -4.787109375, -4.5018310546875, -4.216552734375, -3.9312744140625, -3.64599609375, -3.3607177734375, -3.075439453125, -2.7901611328125, -2.5048828125, -2.2196044921875, -1.934326171875, -1.6490478515625, -1.36376953125, -1.0784912109375, -0.793212890625, -0.5079345703125, -0.22265625, 0.0626220703125, 0.347900390625, 0.6331787109375, 0.91845703125, 1.2037353515625, 1.489013671875, 1.7742919921875, 2.0595703125, 2.3448486328125, 2.630126953125, 2.9154052734375, 3.20068359375, 3.4859619140625, 3.771240234375, 4.0565185546875, 4.341796875, 4.6270751953125, 4.912353515625, 5.1976318359375, 5.48291015625, 5.7681884765625, 6.053466796875, 6.3387451171875, 6.6240234375, 6.9093017578125, 7.194580078125, 7.4798583984375, 7.76513671875, 8.0504150390625, 8.335693359375, 8.6209716796875, 8.90625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0, 7.0, 2.0, 9.0, 5.0, 4.0, 12.0, 13.0, 10.0, 13.0, 9.0, 16.0, 28.0, 29.0, 26.0, 34.0, 28.0, 36.0, 24.0, 34.0, 37.0, 36.0, 40.0, 45.0, 32.0, 44.0, 44.0, 34.0, 26.0, 33.0, 30.0, 35.0, 20.0, 22.0, 20.0, 19.0, 23.0, 13.0, 17.0, 23.0, 11.0, 9.0, 6.0, 9.0, 10.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-20.578125, -19.921142578125, -19.26416015625, -18.607177734375, -17.9501953125, -17.293212890625, -16.63623046875, -15.979248046875, -15.322265625, -14.665283203125, -14.00830078125, -13.351318359375, -12.6943359375, -12.037353515625, -11.38037109375, -10.723388671875, -10.06640625, -9.409423828125, -8.75244140625, -8.095458984375, -7.4384765625, -6.781494140625, -6.12451171875, -5.467529296875, -4.810546875, -4.153564453125, -3.49658203125, -2.839599609375, -2.1826171875, -1.525634765625, -0.86865234375, -0.211669921875, 0.4453125, 1.102294921875, 1.75927734375, 2.416259765625, 3.0732421875, 3.730224609375, 4.38720703125, 5.044189453125, 5.701171875, 6.358154296875, 7.01513671875, 7.672119140625, 8.3291015625, 8.986083984375, 9.64306640625, 10.300048828125, 10.95703125, 11.614013671875, 12.27099609375, 12.927978515625, 13.5849609375, 14.241943359375, 14.89892578125, 15.555908203125, 16.212890625, 16.869873046875, 17.52685546875, 18.183837890625, 18.8408203125, 19.497802734375, 20.15478515625, 20.811767578125, 21.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 20.0, 23.0, 28.0, 56.0, 97.0, 138.0, 222.0, 398.0, 638.0, 1031.0, 1637.0, 2465.0, 3905.0, 6024.0, 9010.0, 13195.0, 19352.0, 27121.0, 37533.0, 49538.0, 62508.0, 75973.0, 87246.0, 93800.0, 96200.0, 92685.0, 84133.0, 71661.0, 58162.0, 45509.0, 33676.0, 24253.0, 16944.0, 11508.0, 7896.0, 5045.0, 3320.0, 2112.0, 1345.0, 794.0, 531.0, 310.0, 202.0, 141.0, 69.0, 37.0, 20.0, 15.0, 10.0, 4.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.2396240234375, -8.924560546875, -8.6094970703125, -8.29443359375, -7.9793701171875, -7.664306640625, -7.3492431640625, -7.0341796875, -6.7191162109375, -6.404052734375, -6.0889892578125, -5.77392578125, -5.4588623046875, -5.143798828125, -4.8287353515625, -4.513671875, -4.1986083984375, -3.883544921875, -3.5684814453125, -3.25341796875, -2.9383544921875, -2.623291015625, -2.3082275390625, -1.9931640625, -1.6781005859375, -1.363037109375, -1.0479736328125, -0.73291015625, -0.4178466796875, -0.102783203125, 0.2122802734375, 0.52734375, 0.8424072265625, 1.157470703125, 1.4725341796875, 1.78759765625, 2.1026611328125, 2.417724609375, 2.7327880859375, 3.0478515625, 3.3629150390625, 3.677978515625, 3.9930419921875, 4.30810546875, 4.6231689453125, 4.938232421875, 5.2532958984375, 5.568359375, 5.8834228515625, 6.198486328125, 6.5135498046875, 6.82861328125, 7.1436767578125, 7.458740234375, 7.7738037109375, 8.0888671875, 8.4039306640625, 8.718994140625, 9.0340576171875, 9.34912109375, 9.6641845703125, 9.979248046875, 10.2943115234375, 10.609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 3.0, 3.0, 2.0, 7.0, 1.0, 6.0, 4.0, 8.0, 3.0, 11.0, 8.0, 13.0, 19.0, 16.0, 13.0, 25.0, 27.0, 24.0, 33.0, 27.0, 38.0, 35.0, 34.0, 36.0, 43.0, 44.0, 43.0, 36.0, 54.0, 33.0, 37.0, 38.0, 34.0, 27.0, 27.0, 24.0, 28.0, 14.0, 19.0, 19.0, 12.0, 18.0, 9.0, 14.0, 13.0, 9.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.0703125, -12.64208984375, -12.2138671875, -11.78564453125, -11.357421875, -10.92919921875, -10.5009765625, -10.07275390625, -9.64453125, -9.21630859375, -8.7880859375, -8.35986328125, -7.931640625, -7.50341796875, -7.0751953125, -6.64697265625, -6.21875, -5.79052734375, -5.3623046875, -4.93408203125, -4.505859375, -4.07763671875, -3.6494140625, -3.22119140625, -2.79296875, -2.36474609375, -1.9365234375, -1.50830078125, -1.080078125, -0.65185546875, -0.2236328125, 0.20458984375, 0.6328125, 1.06103515625, 1.4892578125, 1.91748046875, 2.345703125, 2.77392578125, 3.2021484375, 3.63037109375, 4.05859375, 4.48681640625, 4.9150390625, 5.34326171875, 5.771484375, 6.19970703125, 6.6279296875, 7.05615234375, 7.484375, 7.91259765625, 8.3408203125, 8.76904296875, 9.197265625, 9.62548828125, 10.0537109375, 10.48193359375, 10.91015625, 11.33837890625, 11.7666015625, 12.19482421875, 12.623046875, 13.05126953125, 13.4794921875, 13.90771484375, 14.3359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 5.0, 11.0, 23.0, 48.0, 76.0, 108.0, 145.0, 265.0, 378.0, 622.0, 972.0, 1533.0, 2272.0, 3432.0, 5319.0, 7737.0, 11631.0, 16619.0, 23319.0, 31341.0, 42131.0, 53763.0, 65628.0, 76487.0, 85112.0, 90261.0, 90757.0, 86289.0, 77635.0, 67080.0, 54400.0, 43201.0, 32907.0, 24102.0, 16845.0, 12056.0, 8169.0, 5531.0, 3612.0, 2357.0, 1603.0, 1087.0, 593.0, 375.0, 283.0, 147.0, 113.0, 69.0, 50.0, 18.0, 20.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.732421875, -2.63836669921875, -2.5443115234375, -2.45025634765625, -2.356201171875, -2.26214599609375, -2.1680908203125, -2.07403564453125, -1.97998046875, -1.88592529296875, -1.7918701171875, -1.69781494140625, -1.603759765625, -1.50970458984375, -1.4156494140625, -1.32159423828125, -1.2275390625, -1.13348388671875, -1.0394287109375, -0.94537353515625, -0.851318359375, -0.75726318359375, -0.6632080078125, -0.56915283203125, -0.47509765625, -0.38104248046875, -0.2869873046875, -0.19293212890625, -0.098876953125, -0.00482177734375, 0.0892333984375, 0.18328857421875, 0.27734375, 0.37139892578125, 0.4654541015625, 0.55950927734375, 0.653564453125, 0.74761962890625, 0.8416748046875, 0.93572998046875, 1.02978515625, 1.12384033203125, 1.2178955078125, 1.31195068359375, 1.406005859375, 1.50006103515625, 1.5941162109375, 1.68817138671875, 1.7822265625, 1.87628173828125, 1.9703369140625, 2.06439208984375, 2.158447265625, 2.25250244140625, 2.3465576171875, 2.44061279296875, 2.53466796875, 2.62872314453125, 2.7227783203125, 2.81683349609375, 2.910888671875, 3.00494384765625, 3.0989990234375, 3.19305419921875, 3.287109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 9.0, 11.0, 12.0, 16.0, 16.0, 17.0, 29.0, 30.0, 36.0, 28.0, 34.0, 47.0, 40.0, 42.0, 40.0, 38.0, 52.0, 47.0, 49.0, 44.0, 36.0, 35.0, 38.0, 31.0, 26.0, 38.0, 22.0, 23.0, 20.0, 10.0, 7.0, 17.0, 4.0, 8.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00045299530029296875, -0.00043886899948120117, -0.0004247426986694336, -0.000410616397857666, -0.00039649009704589844, -0.00038236379623413086, -0.0003682374954223633, -0.0003541111946105957, -0.0003399848937988281, -0.00032585859298706055, -0.00031173229217529297, -0.0002976059913635254, -0.0002834796905517578, -0.00026935338973999023, -0.00025522708892822266, -0.00024110078811645508, -0.0002269744873046875, -0.00021284818649291992, -0.00019872188568115234, -0.00018459558486938477, -0.0001704692840576172, -0.0001563429832458496, -0.00014221668243408203, -0.00012809038162231445, -0.00011396408081054688, -9.98377799987793e-05, -8.571147918701172e-05, -7.158517837524414e-05, -5.745887756347656e-05, -4.3332576751708984e-05, -2.9206275939941406e-05, -1.5079975128173828e-05, -9.5367431640625e-07, 1.3172626495361328e-05, 2.7298927307128906e-05, 4.1425228118896484e-05, 5.555152893066406e-05, 6.967782974243164e-05, 8.380413055419922e-05, 9.79304313659668e-05, 0.00011205673217773438, 0.00012618303298950195, 0.00014030933380126953, 0.0001544356346130371, 0.0001685619354248047, 0.00018268823623657227, 0.00019681453704833984, 0.00021094083786010742, 0.000225067138671875, 0.00023919343948364258, 0.00025331974029541016, 0.00026744604110717773, 0.0002815723419189453, 0.0002956986427307129, 0.00030982494354248047, 0.00032395124435424805, 0.0003380775451660156, 0.0003522038459777832, 0.0003663301467895508, 0.00038045644760131836, 0.00039458274841308594, 0.0004087090492248535, 0.0004228353500366211, 0.00043696165084838867, 0.00045108795166015625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 24.0, 31.0, 47.0, 63.0, 102.0, 163.0, 270.0, 391.0, 572.0, 888.0, 1402.0, 2272.0, 3365.0, 5470.0, 8483.0, 13083.0, 20077.0, 29604.0, 42121.0, 57924.0, 75349.0, 91402.0, 102988.0, 108582.0, 105483.0, 94744.0, 79732.0, 62362.0, 46253.0, 32631.0, 21896.0, 14455.0, 9389.0, 6077.0, 3885.0, 2480.0, 1570.0, 1062.0, 653.0, 435.0, 255.0, 180.0, 124.0, 87.0, 44.0, 25.0, 22.0, 11.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.611328125, -3.493408203125, -3.37548828125, -3.257568359375, -3.1396484375, -3.021728515625, -2.90380859375, -2.785888671875, -2.66796875, -2.550048828125, -2.43212890625, -2.314208984375, -2.1962890625, -2.078369140625, -1.96044921875, -1.842529296875, -1.724609375, -1.606689453125, -1.48876953125, -1.370849609375, -1.2529296875, -1.135009765625, -1.01708984375, -0.899169921875, -0.78125, -0.663330078125, -0.54541015625, -0.427490234375, -0.3095703125, -0.191650390625, -0.07373046875, 0.044189453125, 0.162109375, 0.280029296875, 0.39794921875, 0.515869140625, 0.6337890625, 0.751708984375, 0.86962890625, 0.987548828125, 1.10546875, 1.223388671875, 1.34130859375, 1.459228515625, 1.5771484375, 1.695068359375, 1.81298828125, 1.930908203125, 2.048828125, 2.166748046875, 2.28466796875, 2.402587890625, 2.5205078125, 2.638427734375, 2.75634765625, 2.874267578125, 2.9921875, 3.110107421875, 3.22802734375, 3.345947265625, 3.4638671875, 3.581787109375, 3.69970703125, 3.817626953125, 3.935546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 13.0, 4.0, 4.0, 8.0, 7.0, 18.0, 15.0, 25.0, 19.0, 23.0, 30.0, 35.0, 41.0, 33.0, 41.0, 40.0, 30.0, 46.0, 48.0, 53.0, 58.0, 41.0, 31.0, 35.0, 38.0, 31.0, 33.0, 32.0, 33.0, 30.0, 19.0, 13.0, 16.0, 12.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.765625, -1.7064208984375, -1.647216796875, -1.5880126953125, -1.52880859375, -1.4696044921875, -1.410400390625, -1.3511962890625, -1.2919921875, -1.2327880859375, -1.173583984375, -1.1143798828125, -1.05517578125, -0.9959716796875, -0.936767578125, -0.8775634765625, -0.818359375, -0.7591552734375, -0.699951171875, -0.6407470703125, -0.58154296875, -0.5223388671875, -0.463134765625, -0.4039306640625, -0.3447265625, -0.2855224609375, -0.226318359375, -0.1671142578125, -0.10791015625, -0.0487060546875, 0.010498046875, 0.0697021484375, 0.12890625, 0.1881103515625, 0.247314453125, 0.3065185546875, 0.36572265625, 0.4249267578125, 0.484130859375, 0.5433349609375, 0.6025390625, 0.6617431640625, 0.720947265625, 0.7801513671875, 0.83935546875, 0.8985595703125, 0.957763671875, 1.0169677734375, 1.076171875, 1.1353759765625, 1.194580078125, 1.2537841796875, 1.31298828125, 1.3721923828125, 1.431396484375, 1.4906005859375, 1.5498046875, 1.6090087890625, 1.668212890625, 1.7274169921875, 1.78662109375, 1.8458251953125, 1.905029296875, 1.9642333984375, 2.0234375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 5.0, 13.0, 14.0, 17.0, 23.0, 21.0, 27.0, 24.0, 22.0, 24.0, 31.0, 36.0, 42.0, 38.0, 47.0, 44.0, 59.0, 61.0, 51.0, 39.0, 39.0, 38.0, 46.0, 22.0, 33.0, 23.0, 22.0, 21.0, 19.0, 21.0, 20.0, 5.0, 6.0, 6.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.6627140045166, -18.03164291381836, -17.400571823120117, -16.769500732421875, -16.138431549072266, -15.507359504699707, -14.876289367675781, -14.245218276977539, -13.614147186279297, -12.983076095581055, -12.352005004882812, -11.720934867858887, -11.089863777160645, -10.458792686462402, -9.827722549438477, -9.196651458740234, -8.565580368041992, -7.93450927734375, -7.303438663482666, -6.672368049621582, -6.04129695892334, -5.410225868225098, -4.779155254364014, -4.14808464050293, -3.5170135498046875, -2.8859426975250244, -2.2548718452453613, -1.6238009929656982, -0.9927301406860352, -0.36165928840637207, 0.269411563873291, 0.900482177734375, 1.53155517578125, 2.162626028060913, 2.793696880340576, 3.4247677326202393, 4.055838584899902, 4.6869096755981445, 5.3179802894592285, 5.9490509033203125, 6.580121994018555, 7.211193084716797, 7.842263698577881, 8.473334312438965, 9.104405403137207, 9.73547649383545, 10.366546630859375, 10.997617721557617, 11.62868881225586, 12.259759902954102, 12.890830993652344, 13.52190113067627, 14.152972221374512, 14.784043312072754, 15.41511344909668, 16.046184539794922, 16.677255630493164, 17.308326721191406, 17.93939781188965, 18.57046890258789, 19.2015380859375, 19.832609176635742, 20.463680267333984, 21.094751358032227, 21.72582244873047]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 13.0, 22.0, 25.0, 23.0, 28.0, 39.0, 31.0, 33.0, 38.0, 29.0, 34.0, 30.0, 42.0, 36.0, 35.0, 54.0, 51.0, 39.0, 27.0, 42.0, 29.0, 34.0, 25.0, 22.0, 33.0, 22.0, 19.0, 16.0, 10.0, 11.0, 10.0, 22.0, 9.0, 7.0, 7.0, 6.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.167316436767578, -23.409618377685547, -22.651920318603516, -21.894222259521484, -21.136524200439453, -20.378826141357422, -19.62112808227539, -18.86343002319336, -18.105731964111328, -17.348033905029297, -16.590335845947266, -15.832637786865234, -15.074939727783203, -14.317241668701172, -13.559542655944824, -12.801844596862793, -12.044145584106445, -11.286447525024414, -10.528749465942383, -9.771051406860352, -9.01335334777832, -8.255655288696289, -7.497956275939941, -6.74025821685791, -5.982560157775879, -5.224862098693848, -4.467164039611816, -3.709465503692627, -2.9517674446105957, -2.1940693855285645, -1.436370849609375, -0.6786727905273438, 0.07902336120605469, 0.8367215394973755, 1.5944197177886963, 2.3521180152893066, 3.109816074371338, 3.867514133453369, 4.625212669372559, 5.38291072845459, 6.140608787536621, 6.898306846618652, 7.656004905700684, 8.413703918457031, 9.171401977539062, 9.929100036621094, 10.686798095703125, 11.444496154785156, 12.202194213867188, 12.959892272949219, 13.71759033203125, 14.475288391113281, 15.232986450195312, 15.990684509277344, 16.748382568359375, 17.506080627441406, 18.263778686523438, 19.02147674560547, 19.7791748046875, 20.53687286376953, 21.294570922851562, 22.052268981933594, 22.809967041015625, 23.567665100097656, 24.32536506652832]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 25.0, 35.0, 58.0, 76.0, 123.0, 220.0, 353.0, 582.0, 950.0, 1544.0, 2632.0, 3996.0, 6860.0, 10734.0, 16630.0, 26367.0, 40185.0, 60060.0, 88233.0, 125649.0, 172424.0, 225683.0, 284417.0, 336911.0, 377955.0, 397213.0, 392290.0, 361244.0, 314139.0, 258213.0, 201367.0, 151175.0, 109125.0, 76292.0, 52514.0, 34787.0, 22998.0, 14741.0, 9525.0, 6138.0, 3689.0, 2363.0, 1439.0, 921.0, 540.0, 327.0, 194.0, 151.0, 65.0, 55.0, 29.0, 12.0, 12.0, 4.0, 6.0, 2.0, 3.0, 1.0], "bins": [-14.328125, -13.87744140625, -13.4267578125, -12.97607421875, -12.525390625, -12.07470703125, -11.6240234375, -11.17333984375, -10.72265625, -10.27197265625, -9.8212890625, -9.37060546875, -8.919921875, -8.46923828125, -8.0185546875, -7.56787109375, -7.1171875, -6.66650390625, -6.2158203125, -5.76513671875, -5.314453125, -4.86376953125, -4.4130859375, -3.96240234375, -3.51171875, -3.06103515625, -2.6103515625, -2.15966796875, -1.708984375, -1.25830078125, -0.8076171875, -0.35693359375, 0.09375, 0.54443359375, 0.9951171875, 1.44580078125, 1.896484375, 2.34716796875, 2.7978515625, 3.24853515625, 3.69921875, 4.14990234375, 4.6005859375, 5.05126953125, 5.501953125, 5.95263671875, 6.4033203125, 6.85400390625, 7.3046875, 7.75537109375, 8.2060546875, 8.65673828125, 9.107421875, 9.55810546875, 10.0087890625, 10.45947265625, 10.91015625, 11.36083984375, 11.8115234375, 12.26220703125, 12.712890625, 13.16357421875, 13.6142578125, 14.06494140625, 14.515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 10.0, 10.0, 11.0, 12.0, 16.0, 16.0, 26.0, 26.0, 27.0, 29.0, 29.0, 43.0, 30.0, 38.0, 45.0, 39.0, 40.0, 36.0, 52.0, 35.0, 46.0, 38.0, 36.0, 38.0, 34.0, 23.0, 22.0, 31.0, 25.0, 18.0, 14.0, 25.0, 11.0, 16.0, 11.0, 6.0, 7.0, 4.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.953125, -20.30029296875, -19.6474609375, -18.99462890625, -18.341796875, -17.68896484375, -17.0361328125, -16.38330078125, -15.73046875, -15.07763671875, -14.4248046875, -13.77197265625, -13.119140625, -12.46630859375, -11.8134765625, -11.16064453125, -10.5078125, -9.85498046875, -9.2021484375, -8.54931640625, -7.896484375, -7.24365234375, -6.5908203125, -5.93798828125, -5.28515625, -4.63232421875, -3.9794921875, -3.32666015625, -2.673828125, -2.02099609375, -1.3681640625, -0.71533203125, -0.0625, 0.59033203125, 1.2431640625, 1.89599609375, 2.548828125, 3.20166015625, 3.8544921875, 4.50732421875, 5.16015625, 5.81298828125, 6.4658203125, 7.11865234375, 7.771484375, 8.42431640625, 9.0771484375, 9.72998046875, 10.3828125, 11.03564453125, 11.6884765625, 12.34130859375, 12.994140625, 13.64697265625, 14.2998046875, 14.95263671875, 15.60546875, 16.25830078125, 16.9111328125, 17.56396484375, 18.216796875, 18.86962890625, 19.5224609375, 20.17529296875, 20.828125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 16.0, 21.0, 49.0, 62.0, 143.0, 213.0, 390.0, 678.0, 1245.0, 2126.0, 3567.0, 6167.0, 10526.0, 17259.0, 28611.0, 44955.0, 69613.0, 102398.0, 147043.0, 200973.0, 262494.0, 321046.0, 372496.0, 403169.0, 409187.0, 391368.0, 347984.0, 291735.0, 230534.0, 173377.0, 123918.0, 84598.0, 55825.0, 35360.0, 22051.0, 13562.0, 8132.0, 4759.0, 2727.0, 1685.0, 913.0, 544.0, 346.0, 171.0, 107.0, 60.0, 34.0, 17.0, 13.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.3125, -15.806640625, -15.30078125, -14.794921875, -14.2890625, -13.783203125, -13.27734375, -12.771484375, -12.265625, -11.759765625, -11.25390625, -10.748046875, -10.2421875, -9.736328125, -9.23046875, -8.724609375, -8.21875, -7.712890625, -7.20703125, -6.701171875, -6.1953125, -5.689453125, -5.18359375, -4.677734375, -4.171875, -3.666015625, -3.16015625, -2.654296875, -2.1484375, -1.642578125, -1.13671875, -0.630859375, -0.125, 0.380859375, 0.88671875, 1.392578125, 1.8984375, 2.404296875, 2.91015625, 3.416015625, 3.921875, 4.427734375, 4.93359375, 5.439453125, 5.9453125, 6.451171875, 6.95703125, 7.462890625, 7.96875, 8.474609375, 8.98046875, 9.486328125, 9.9921875, 10.498046875, 11.00390625, 11.509765625, 12.015625, 12.521484375, 13.02734375, 13.533203125, 14.0390625, 14.544921875, 15.05078125, 15.556640625, 16.0625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 3.0, 13.0, 13.0, 17.0, 17.0, 32.0, 53.0, 58.0, 63.0, 70.0, 87.0, 99.0, 118.0, 132.0, 147.0, 159.0, 196.0, 168.0, 211.0, 221.0, 226.0, 226.0, 179.0, 187.0, 184.0, 154.0, 167.0, 149.0, 108.0, 127.0, 106.0, 84.0, 62.0, 46.0, 42.0, 40.0, 25.0, 18.0, 13.0, 18.0, 12.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.7578125, -8.4412841796875, -8.124755859375, -7.8082275390625, -7.49169921875, -7.1751708984375, -6.858642578125, -6.5421142578125, -6.2255859375, -5.9090576171875, -5.592529296875, -5.2760009765625, -4.95947265625, -4.6429443359375, -4.326416015625, -4.0098876953125, -3.693359375, -3.3768310546875, -3.060302734375, -2.7437744140625, -2.42724609375, -2.1107177734375, -1.794189453125, -1.4776611328125, -1.1611328125, -0.8446044921875, -0.528076171875, -0.2115478515625, 0.10498046875, 0.4215087890625, 0.738037109375, 1.0545654296875, 1.37109375, 1.6876220703125, 2.004150390625, 2.3206787109375, 2.63720703125, 2.9537353515625, 3.270263671875, 3.5867919921875, 3.9033203125, 4.2198486328125, 4.536376953125, 4.8529052734375, 5.16943359375, 5.4859619140625, 5.802490234375, 6.1190185546875, 6.435546875, 6.7520751953125, 7.068603515625, 7.3851318359375, 7.70166015625, 8.0181884765625, 8.334716796875, 8.6512451171875, 8.9677734375, 9.2843017578125, 9.600830078125, 9.9173583984375, 10.23388671875, 10.5504150390625, 10.866943359375, 11.1834716796875, 11.5]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 7.0, 10.0, 15.0, 7.0, 9.0, 18.0, 12.0, 20.0, 20.0, 29.0, 26.0, 37.0, 38.0, 49.0, 51.0, 54.0, 42.0, 43.0, 49.0, 47.0, 54.0, 42.0, 39.0, 39.0, 44.0, 35.0, 20.0, 33.0, 26.0, 11.0, 10.0, 8.0, 10.0, 3.0, 5.0, 10.0, 6.0, 5.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.613582611083984, -23.887020111083984, -23.160457611083984, -22.43389320373535, -21.70733070373535, -20.98076820373535, -20.25420379638672, -19.52764129638672, -18.80107879638672, -18.07451629638672, -17.34795379638672, -16.621389389038086, -15.894826889038086, -15.168264389038086, -14.44170093536377, -13.715137481689453, -12.988574981689453, -12.262012481689453, -11.535449028015137, -10.80888557434082, -10.08232307434082, -9.35576057434082, -8.629197120666504, -7.902634143829346, -7.1760711669921875, -6.449508190155029, -5.722945213317871, -4.996382236480713, -4.269819259643555, -3.5432562828063965, -2.8166933059692383, -2.09013032913208, -1.3635692596435547, -0.6370062828063965, 0.08955669403076172, 0.8161196708679199, 1.5426826477050781, 2.2692456245422363, 2.9958086013793945, 3.7223715782165527, 4.448934555053711, 5.175497531890869, 5.902060508728027, 6.6286234855651855, 7.355186462402344, 8.081748962402344, 8.80831241607666, 9.534875869750977, 10.261438369750977, 10.988000869750977, 11.714564323425293, 12.44112777709961, 13.16769027709961, 13.89425277709961, 14.620816230773926, 15.347379684448242, 16.073942184448242, 16.800504684448242, 17.527069091796875, 18.253631591796875, 18.980194091796875, 19.706756591796875, 20.433319091796875, 21.159883499145508, 21.886445999145508]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 10.0, 10.0, 16.0, 17.0, 29.0, 22.0, 29.0, 28.0, 17.0, 34.0, 26.0, 26.0, 36.0, 36.0, 37.0, 40.0, 35.0, 47.0, 46.0, 43.0, 35.0, 36.0, 30.0, 32.0, 30.0, 40.0, 23.0, 26.0, 17.0, 18.0, 17.0, 17.0, 13.0, 16.0, 11.0, 10.0, 6.0, 5.0, 5.0, 4.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.615243911743164, -24.830129623413086, -24.045015335083008, -23.25990104675293, -22.47478675842285, -21.689672470092773, -20.904560089111328, -20.11944580078125, -19.334331512451172, -18.549217224121094, -17.764102935791016, -16.978988647460938, -16.19387435913086, -15.408760070800781, -14.62364673614502, -13.838532447814941, -13.053417205810547, -12.268302917480469, -11.48318862915039, -10.698074340820312, -9.912960052490234, -9.127845764160156, -8.342732429504395, -7.557618141174316, -6.772503852844238, -5.98738956451416, -5.202275276184082, -4.417161464691162, -3.632047176361084, -2.846932888031006, -2.061819076538086, -1.2767047882080078, -0.4915924072265625, 0.2935217618942261, 1.0786359310150146, 1.8637499809265137, 2.648864269256592, 3.43397855758667, 4.21909236907959, 5.004206657409668, 5.789320945739746, 6.574435234069824, 7.359549522399902, 8.144662857055664, 8.929777145385742, 9.71489143371582, 10.500005722045898, 11.285120010375977, 12.070234298706055, 12.855348587036133, 13.640462875366211, 14.425577163696289, 15.210691452026367, 15.995805740356445, 16.78091812133789, 17.56603240966797, 18.351146697998047, 19.136260986328125, 19.921375274658203, 20.70648956298828, 21.49160385131836, 22.276718139648438, 23.061832427978516, 23.846946716308594, 24.632061004638672]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 12.0, 15.0, 26.0, 20.0, 43.0, 62.0, 91.0, 164.0, 251.0, 385.0, 580.0, 864.0, 1248.0, 2018.0, 3241.0, 5210.0, 8410.0, 13471.0, 21555.0, 34992.0, 58269.0, 94223.0, 149020.0, 199817.0, 168677.0, 109294.0, 68190.0, 41451.0, 25132.0, 15603.0, 9572.0, 6009.0, 3821.0, 2369.0, 1590.0, 984.0, 631.0, 403.0, 285.0, 187.0, 129.0, 73.0, 52.0, 41.0, 26.0, 17.0, 12.0, 12.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.830078125, -2.740692138671875, -2.65130615234375, -2.561920166015625, -2.4725341796875, -2.383148193359375, -2.29376220703125, -2.204376220703125, -2.114990234375, -2.025604248046875, -1.93621826171875, -1.846832275390625, -1.7574462890625, -1.668060302734375, -1.57867431640625, -1.489288330078125, -1.39990234375, -1.310516357421875, -1.22113037109375, -1.131744384765625, -1.0423583984375, -0.952972412109375, -0.86358642578125, -0.774200439453125, -0.684814453125, -0.595428466796875, -0.50604248046875, -0.416656494140625, -0.3272705078125, -0.237884521484375, -0.14849853515625, -0.059112548828125, 0.0302734375, 0.119659423828125, 0.20904541015625, 0.298431396484375, 0.3878173828125, 0.477203369140625, 0.56658935546875, 0.655975341796875, 0.745361328125, 0.834747314453125, 0.92413330078125, 1.013519287109375, 1.1029052734375, 1.192291259765625, 1.28167724609375, 1.371063232421875, 1.46044921875, 1.549835205078125, 1.63922119140625, 1.728607177734375, 1.8179931640625, 1.907379150390625, 1.99676513671875, 2.086151123046875, 2.175537109375, 2.264923095703125, 2.35430908203125, 2.443695068359375, 2.5330810546875, 2.622467041015625, 2.71185302734375, 2.801239013671875, 2.890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 6.0, 14.0, 14.0, 22.0, 29.0, 19.0, 22.0, 32.0, 20.0, 24.0, 43.0, 29.0, 37.0, 37.0, 45.0, 42.0, 36.0, 52.0, 45.0, 49.0, 43.0, 37.0, 35.0, 32.0, 20.0, 30.0, 24.0, 17.0, 14.0, 21.0, 19.0, 21.0, 9.0, 7.0, 9.0, 6.0, 3.0, 2.0, 10.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.453125, -26.599853515625, -25.74658203125, -24.893310546875, -24.0400390625, -23.186767578125, -22.33349609375, -21.480224609375, -20.626953125, -19.773681640625, -18.92041015625, -18.067138671875, -17.2138671875, -16.360595703125, -15.50732421875, -14.654052734375, -13.80078125, -12.947509765625, -12.09423828125, -11.240966796875, -10.3876953125, -9.534423828125, -8.68115234375, -7.827880859375, -6.974609375, -6.121337890625, -5.26806640625, -4.414794921875, -3.5615234375, -2.708251953125, -1.85498046875, -1.001708984375, -0.1484375, 0.704833984375, 1.55810546875, 2.411376953125, 3.2646484375, 4.117919921875, 4.97119140625, 5.824462890625, 6.677734375, 7.531005859375, 8.38427734375, 9.237548828125, 10.0908203125, 10.944091796875, 11.79736328125, 12.650634765625, 13.50390625, 14.357177734375, 15.21044921875, 16.063720703125, 16.9169921875, 17.770263671875, 18.62353515625, 19.476806640625, 20.330078125, 21.183349609375, 22.03662109375, 22.889892578125, 23.7431640625, 24.596435546875, 25.44970703125, 26.302978515625, 27.15625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 4.0, 4.0, 13.0, 11.0, 22.0, 30.0, 42.0, 63.0, 90.0, 161.0, 179.0, 273.0, 406.0, 572.0, 784.0, 1092.0, 1532.0, 2102.0, 3084.0, 4444.0, 6628.0, 9629.0, 14619.0, 21747.0, 32931.0, 51203.0, 78019.0, 115358.0, 159933.0, 167497.0, 125082.0, 85731.0, 55596.0, 36086.0, 23551.0, 15885.0, 10661.0, 7186.0, 4927.0, 3428.0, 2302.0, 1639.0, 1137.0, 851.0, 569.0, 421.0, 325.0, 217.0, 139.0, 124.0, 85.0, 41.0, 37.0, 27.0, 16.0, 14.0, 10.0, 2.0, 1.0, 3.0, 2.0], "bins": [-2.642578125, -2.560272216796875, -2.47796630859375, -2.395660400390625, -2.3133544921875, -2.231048583984375, -2.14874267578125, -2.066436767578125, -1.984130859375, -1.901824951171875, -1.81951904296875, -1.737213134765625, -1.6549072265625, -1.572601318359375, -1.49029541015625, -1.407989501953125, -1.32568359375, -1.243377685546875, -1.16107177734375, -1.078765869140625, -0.9964599609375, -0.914154052734375, -0.83184814453125, -0.749542236328125, -0.667236328125, -0.584930419921875, -0.50262451171875, -0.420318603515625, -0.3380126953125, -0.255706787109375, -0.17340087890625, -0.091094970703125, -0.0087890625, 0.073516845703125, 0.15582275390625, 0.238128662109375, 0.3204345703125, 0.402740478515625, 0.48504638671875, 0.567352294921875, 0.649658203125, 0.731964111328125, 0.81427001953125, 0.896575927734375, 0.9788818359375, 1.061187744140625, 1.14349365234375, 1.225799560546875, 1.30810546875, 1.390411376953125, 1.47271728515625, 1.555023193359375, 1.6373291015625, 1.719635009765625, 1.80194091796875, 1.884246826171875, 1.966552734375, 2.048858642578125, 2.13116455078125, 2.213470458984375, 2.2957763671875, 2.378082275390625, 2.46038818359375, 2.542694091796875, 2.625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 9.0, 10.0, 16.0, 8.0, 17.0, 14.0, 24.0, 17.0, 25.0, 29.0, 30.0, 34.0, 26.0, 32.0, 31.0, 32.0, 28.0, 40.0, 33.0, 29.0, 42.0, 35.0, 31.0, 32.0, 29.0, 38.0, 35.0, 30.0, 24.0, 33.0, 26.0, 27.0, 21.0, 14.0, 18.0, 11.0, 13.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 5.0, 5.0, 6.0, 0.0, 0.0, 1.0], "bins": [-16.34375, -15.8681640625, -15.392578125, -14.9169921875, -14.44140625, -13.9658203125, -13.490234375, -13.0146484375, -12.5390625, -12.0634765625, -11.587890625, -11.1123046875, -10.63671875, -10.1611328125, -9.685546875, -9.2099609375, -8.734375, -8.2587890625, -7.783203125, -7.3076171875, -6.83203125, -6.3564453125, -5.880859375, -5.4052734375, -4.9296875, -4.4541015625, -3.978515625, -3.5029296875, -3.02734375, -2.5517578125, -2.076171875, -1.6005859375, -1.125, -0.6494140625, -0.173828125, 0.3017578125, 0.77734375, 1.2529296875, 1.728515625, 2.2041015625, 2.6796875, 3.1552734375, 3.630859375, 4.1064453125, 4.58203125, 5.0576171875, 5.533203125, 6.0087890625, 6.484375, 6.9599609375, 7.435546875, 7.9111328125, 8.38671875, 8.8623046875, 9.337890625, 9.8134765625, 10.2890625, 10.7646484375, 11.240234375, 11.7158203125, 12.19140625, 12.6669921875, 13.142578125, 13.6181640625, 14.09375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 12.0, 19.0, 16.0, 30.0, 43.0, 66.0, 89.0, 137.0, 208.0, 302.0, 454.0, 646.0, 985.0, 1504.0, 2183.0, 3327.0, 4950.0, 7618.0, 12255.0, 19416.0, 31987.0, 54819.0, 98731.0, 188241.0, 255512.0, 158853.0, 83971.0, 46461.0, 27557.0, 17016.0, 10642.0, 7018.0, 4419.0, 2981.0, 2000.0, 1339.0, 879.0, 624.0, 373.0, 280.0, 161.0, 131.0, 84.0, 61.0, 44.0, 39.0, 29.0, 10.0, 13.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0933837890625, -0.09040641784667969, -0.08742904663085938, -0.08445167541503906, -0.08147430419921875, -0.07849693298339844, -0.07551956176757812, -0.07254219055175781, -0.0695648193359375, -0.06658744812011719, -0.06361007690429688, -0.06063270568847656, -0.05765533447265625, -0.05467796325683594, -0.051700592041015625, -0.04872322082519531, -0.045745849609375, -0.04276847839355469, -0.039791107177734375, -0.03681373596191406, -0.03383636474609375, -0.030858993530273438, -0.027881622314453125, -0.024904251098632812, -0.0219268798828125, -0.018949508666992188, -0.015972137451171875, -0.012994766235351562, -0.01001739501953125, -0.0070400238037109375, -0.004062652587890625, -0.0010852813720703125, 0.00189208984375, 0.0048694610595703125, 0.007846832275390625, 0.010824203491210938, 0.01380157470703125, 0.016778945922851562, 0.019756317138671875, 0.022733688354492188, 0.0257110595703125, 0.028688430786132812, 0.031665802001953125, 0.03464317321777344, 0.03762054443359375, 0.04059791564941406, 0.043575286865234375, 0.04655265808105469, 0.049530029296875, 0.05250740051269531, 0.055484771728515625, 0.05846214294433594, 0.06143951416015625, 0.06441688537597656, 0.06739425659179688, 0.07037162780761719, 0.0733489990234375, 0.07632637023925781, 0.07930374145507812, 0.08228111267089844, 0.08525848388671875, 0.08823585510253906, 0.09121322631835938, 0.09419059753417969, 0.09716796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 13.0, 10.0, 6.0, 7.0, 17.0, 13.0, 18.0, 18.0, 23.0, 23.0, 28.0, 26.0, 36.0, 38.0, 35.0, 34.0, 47.0, 37.0, 48.0, 55.0, 35.0, 39.0, 45.0, 58.0, 31.0, 28.0, 19.0, 23.0, 29.0, 25.0, 16.0, 20.0, 16.0, 15.0, 14.0, 8.0, 9.0, 10.0, 6.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9371509552001953e-05, -1.8822960555553436e-05, -1.827441155910492e-05, -1.7725862562656403e-05, -1.7177313566207886e-05, -1.662876456975937e-05, -1.6080215573310852e-05, -1.5531666576862335e-05, -1.4983117580413818e-05, -1.4434568583965302e-05, -1.3886019587516785e-05, -1.3337470591068268e-05, -1.2788921594619751e-05, -1.2240372598171234e-05, -1.1691823601722717e-05, -1.11432746052742e-05, -1.0594725608825684e-05, -1.0046176612377167e-05, -9.49762761592865e-06, -8.949078619480133e-06, -8.400529623031616e-06, -7.8519806265831e-06, -7.3034316301345825e-06, -6.754882633686066e-06, -6.206333637237549e-06, -5.657784640789032e-06, -5.109235644340515e-06, -4.560686647891998e-06, -4.0121376514434814e-06, -3.4635886549949646e-06, -2.9150396585464478e-06, -2.366490662097931e-06, -1.817941665649414e-06, -1.2693926692008972e-06, -7.208436727523804e-07, -1.7229467630386353e-07, 3.762543201446533e-07, 9.248033165931702e-07, 1.473352313041687e-06, 2.021901309490204e-06, 2.5704503059387207e-06, 3.1189993023872375e-06, 3.6675482988357544e-06, 4.216097295284271e-06, 4.764646291732788e-06, 5.313195288181305e-06, 5.861744284629822e-06, 6.410293281078339e-06, 6.9588422775268555e-06, 7.507391273975372e-06, 8.05594027042389e-06, 8.604489266872406e-06, 9.153038263320923e-06, 9.70158725976944e-06, 1.0250136256217957e-05, 1.0798685252666473e-05, 1.134723424911499e-05, 1.1895783245563507e-05, 1.2444332242012024e-05, 1.299288123846054e-05, 1.3541430234909058e-05, 1.4089979231357574e-05, 1.4638528227806091e-05, 1.5187077224254608e-05, 1.5735626220703125e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 14.0, 32.0, 50.0, 80.0, 140.0, 185.0, 276.0, 438.0, 685.0, 1065.0, 1665.0, 2590.0, 3972.0, 6450.0, 10387.0, 17062.0, 28415.0, 49068.0, 93533.0, 203754.0, 305586.0, 149479.0, 72827.0, 39662.0, 23314.0, 14332.0, 8698.0, 5362.0, 3467.0, 2139.0, 1413.0, 911.0, 517.0, 363.0, 218.0, 170.0, 96.0, 48.0, 34.0, 22.0, 10.0, 9.0, 6.0, 0.0, 3.0, 3.0], "bins": [-0.275634765625, -0.26844024658203125, -0.2612457275390625, -0.25405120849609375, -0.246856689453125, -0.23966217041015625, -0.2324676513671875, -0.22527313232421875, -0.21807861328125, -0.21088409423828125, -0.2036895751953125, -0.19649505615234375, -0.189300537109375, -0.18210601806640625, -0.1749114990234375, -0.16771697998046875, -0.1605224609375, -0.15332794189453125, -0.1461334228515625, -0.13893890380859375, -0.131744384765625, -0.12454986572265625, -0.1173553466796875, -0.11016082763671875, -0.10296630859375, -0.09577178955078125, -0.0885772705078125, -0.08138275146484375, -0.074188232421875, -0.06699371337890625, -0.0597991943359375, -0.05260467529296875, -0.04541015625, -0.03821563720703125, -0.0310211181640625, -0.02382659912109375, -0.016632080078125, -0.00943756103515625, -0.0022430419921875, 0.00495147705078125, 0.01214599609375, 0.01934051513671875, 0.0265350341796875, 0.03372955322265625, 0.040924072265625, 0.04811859130859375, 0.0553131103515625, 0.06250762939453125, 0.0697021484375, 0.07689666748046875, 0.0840911865234375, 0.09128570556640625, 0.098480224609375, 0.10567474365234375, 0.1128692626953125, 0.12006378173828125, 0.12725830078125, 0.13445281982421875, 0.1416473388671875, 0.14884185791015625, 0.156036376953125, 0.16323089599609375, 0.1704254150390625, 0.17761993408203125, 0.184814453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 1.0, 6.0, 10.0, 5.0, 5.0, 7.0, 6.0, 17.0, 10.0, 20.0, 19.0, 21.0, 26.0, 32.0, 37.0, 29.0, 46.0, 43.0, 55.0, 65.0, 73.0, 61.0, 56.0, 40.0, 40.0, 47.0, 30.0, 21.0, 25.0, 22.0, 22.0, 11.0, 11.0, 14.0, 12.0, 6.0, 5.0, 9.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.106201171875, -0.10307502746582031, -0.09994888305664062, -0.09682273864746094, -0.09369659423828125, -0.09057044982910156, -0.08744430541992188, -0.08431816101074219, -0.0811920166015625, -0.07806587219238281, -0.07493972778320312, -0.07181358337402344, -0.06868743896484375, -0.06556129455566406, -0.062435150146484375, -0.05930900573730469, -0.056182861328125, -0.05305671691894531, -0.049930572509765625, -0.04680442810058594, -0.04367828369140625, -0.04055213928222656, -0.037425994873046875, -0.03429985046386719, -0.0311737060546875, -0.028047561645507812, -0.024921417236328125, -0.021795272827148438, -0.01866912841796875, -0.015542984008789062, -0.012416839599609375, -0.009290695190429688, -0.00616455078125, -0.0030384063720703125, 8.7738037109375e-05, 0.0032138824462890625, 0.00634002685546875, 0.009466171264648438, 0.012592315673828125, 0.015718460083007812, 0.0188446044921875, 0.021970748901367188, 0.025096893310546875, 0.028223037719726562, 0.03134918212890625, 0.03447532653808594, 0.037601470947265625, 0.04072761535644531, 0.043853759765625, 0.04697990417480469, 0.050106048583984375, 0.05323219299316406, 0.05635833740234375, 0.05948448181152344, 0.06261062622070312, 0.06573677062988281, 0.0688629150390625, 0.07198905944824219, 0.07511520385742188, 0.07824134826660156, 0.08136749267578125, 0.08449363708496094, 0.08761978149414062, 0.09074592590332031, 0.0938720703125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 4.0, 4.0, 7.0, 16.0, 9.0, 8.0, 16.0, 11.0, 17.0, 17.0, 28.0, 29.0, 34.0, 38.0, 51.0, 38.0, 57.0, 46.0, 43.0, 48.0, 43.0, 58.0, 43.0, 41.0, 42.0, 41.0, 34.0, 33.0, 32.0, 23.0, 17.0, 10.0, 6.0, 11.0, 8.0, 2.0, 10.0, 8.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.042255401611328, -24.314136505126953, -23.58601951599121, -22.85790252685547, -22.129783630371094, -21.40166473388672, -20.673547744750977, -19.945430755615234, -19.21731185913086, -18.489192962646484, -17.761075973510742, -17.032958984375, -16.304840087890625, -15.576722145080566, -14.848604202270508, -14.12048625946045, -13.39236831665039, -12.664250373840332, -11.936132431030273, -11.208014488220215, -10.479896545410156, -9.751778602600098, -9.023660659790039, -8.29554271697998, -7.567424774169922, -6.839306831359863, -6.111188888549805, -5.383070945739746, -4.6549530029296875, -3.926835060119629, -3.1987171173095703, -2.4705991744995117, -1.742483139038086, -1.0143651962280273, -0.28624725341796875, 0.44187068939208984, 1.1699886322021484, 1.898106575012207, 2.6262245178222656, 3.354342460632324, 4.082460403442383, 4.810578346252441, 5.5386962890625, 6.266814231872559, 6.994932174682617, 7.723050117492676, 8.451168060302734, 9.179286003112793, 9.907403945922852, 10.63552188873291, 11.363639831542969, 12.091757774353027, 12.819875717163086, 13.547993659973145, 14.276111602783203, 15.004229545593262, 15.73234748840332, 16.460464477539062, 17.188583374023438, 17.916702270507812, 18.644819259643555, 19.372936248779297, 20.101055145263672, 20.829174041748047, 21.55729103088379]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 10.0, 11.0, 15.0, 17.0, 30.0, 22.0, 28.0, 28.0, 16.0, 36.0, 26.0, 25.0, 36.0, 36.0, 36.0, 41.0, 36.0, 47.0, 45.0, 41.0, 37.0, 37.0, 29.0, 31.0, 32.0, 40.0, 24.0, 23.0, 17.0, 20.0, 16.0, 18.0, 13.0, 15.0, 12.0, 9.0, 6.0, 6.0, 4.0, 4.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.85509490966797, -25.070707321166992, -24.286319732666016, -23.50193214416504, -22.717544555664062, -21.933156967163086, -21.14876937866211, -20.364381790161133, -19.579994201660156, -18.79560661315918, -18.011219024658203, -17.226831436157227, -16.44244384765625, -15.658056259155273, -14.873668670654297, -14.08928108215332, -13.304893493652344, -12.520505905151367, -11.73611831665039, -10.951730728149414, -10.167343139648438, -9.382955551147461, -8.598567962646484, -7.814180374145508, -7.029792785644531, -6.245405197143555, -5.461017608642578, -4.676630020141602, -3.892242431640625, -3.1078548431396484, -2.323467254638672, -1.5390796661376953, -0.7546939849853516, 0.029693603515625, 0.8140811920166016, 1.5984687805175781, 2.3828563690185547, 3.1672439575195312, 3.951631546020508, 4.736019134521484, 5.520406723022461, 6.3047943115234375, 7.089181900024414, 7.873569488525391, 8.657957077026367, 9.442344665527344, 10.22673225402832, 11.011119842529297, 11.795507431030273, 12.57989501953125, 13.364282608032227, 14.148670196533203, 14.93305778503418, 15.717445373535156, 16.501832962036133, 17.28622055053711, 18.070608139038086, 18.854995727539062, 19.63938331604004, 20.423770904541016, 21.208158493041992, 21.99254608154297, 22.776933670043945, 23.561321258544922, 24.3457088470459]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 10.0, 16.0, 26.0, 36.0, 69.0, 116.0, 182.0, 343.0, 542.0, 885.0, 1366.0, 2077.0, 3521.0, 5352.0, 8537.0, 12293.0, 17913.0, 25969.0, 36104.0, 47952.0, 60978.0, 74454.0, 85743.0, 93836.0, 96337.0, 93719.0, 85383.0, 73733.0, 60256.0, 47184.0, 35443.0, 25692.0, 18029.0, 12094.0, 8138.0, 5296.0, 3402.0, 2072.0, 1384.0, 832.0, 491.0, 313.0, 178.0, 106.0, 70.0, 27.0, 24.0, 17.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3046875, -9.966552734375, -9.62841796875, -9.290283203125, -8.9521484375, -8.614013671875, -8.27587890625, -7.937744140625, -7.599609375, -7.261474609375, -6.92333984375, -6.585205078125, -6.2470703125, -5.908935546875, -5.57080078125, -5.232666015625, -4.89453125, -4.556396484375, -4.21826171875, -3.880126953125, -3.5419921875, -3.203857421875, -2.86572265625, -2.527587890625, -2.189453125, -1.851318359375, -1.51318359375, -1.175048828125, -0.8369140625, -0.498779296875, -0.16064453125, 0.177490234375, 0.515625, 0.853759765625, 1.19189453125, 1.530029296875, 1.8681640625, 2.206298828125, 2.54443359375, 2.882568359375, 3.220703125, 3.558837890625, 3.89697265625, 4.235107421875, 4.5732421875, 4.911376953125, 5.24951171875, 5.587646484375, 5.92578125, 6.263916015625, 6.60205078125, 6.940185546875, 7.2783203125, 7.616455078125, 7.95458984375, 8.292724609375, 8.630859375, 8.968994140625, 9.30712890625, 9.645263671875, 9.9833984375, 10.321533203125, 10.65966796875, 10.997802734375, 11.3359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 13.0, 16.0, 13.0, 30.0, 26.0, 30.0, 30.0, 21.0, 34.0, 35.0, 34.0, 41.0, 31.0, 47.0, 45.0, 44.0, 46.0, 36.0, 48.0, 46.0, 27.0, 41.0, 36.0, 32.0, 23.0, 20.0, 19.0, 20.0, 18.0, 13.0, 16.0, 17.0, 10.0, 5.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.9375, -28.05810546875, -27.1787109375, -26.29931640625, -25.419921875, -24.54052734375, -23.6611328125, -22.78173828125, -21.90234375, -21.02294921875, -20.1435546875, -19.26416015625, -18.384765625, -17.50537109375, -16.6259765625, -15.74658203125, -14.8671875, -13.98779296875, -13.1083984375, -12.22900390625, -11.349609375, -10.47021484375, -9.5908203125, -8.71142578125, -7.83203125, -6.95263671875, -6.0732421875, -5.19384765625, -4.314453125, -3.43505859375, -2.5556640625, -1.67626953125, -0.796875, 0.08251953125, 0.9619140625, 1.84130859375, 2.720703125, 3.60009765625, 4.4794921875, 5.35888671875, 6.23828125, 7.11767578125, 7.9970703125, 8.87646484375, 9.755859375, 10.63525390625, 11.5146484375, 12.39404296875, 13.2734375, 14.15283203125, 15.0322265625, 15.91162109375, 16.791015625, 17.67041015625, 18.5498046875, 19.42919921875, 20.30859375, 21.18798828125, 22.0673828125, 22.94677734375, 23.826171875, 24.70556640625, 25.5849609375, 26.46435546875, 27.34375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 9.0, 14.0, 15.0, 33.0, 40.0, 81.0, 96.0, 172.0, 240.0, 429.0, 652.0, 1012.0, 1542.0, 2438.0, 3622.0, 5541.0, 8310.0, 12013.0, 17286.0, 24413.0, 32866.0, 43691.0, 54914.0, 66543.0, 77582.0, 85413.0, 90327.0, 89510.0, 84564.0, 76325.0, 65325.0, 53752.0, 42145.0, 32106.0, 23383.0, 16673.0, 11863.0, 8124.0, 5340.0, 3597.0, 2335.0, 1544.0, 1001.0, 587.0, 398.0, 250.0, 155.0, 109.0, 58.0, 53.0, 24.0, 17.0, 15.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.3125, -9.98974609375, -9.6669921875, -9.34423828125, -9.021484375, -8.69873046875, -8.3759765625, -8.05322265625, -7.73046875, -7.40771484375, -7.0849609375, -6.76220703125, -6.439453125, -6.11669921875, -5.7939453125, -5.47119140625, -5.1484375, -4.82568359375, -4.5029296875, -4.18017578125, -3.857421875, -3.53466796875, -3.2119140625, -2.88916015625, -2.56640625, -2.24365234375, -1.9208984375, -1.59814453125, -1.275390625, -0.95263671875, -0.6298828125, -0.30712890625, 0.015625, 0.33837890625, 0.6611328125, 0.98388671875, 1.306640625, 1.62939453125, 1.9521484375, 2.27490234375, 2.59765625, 2.92041015625, 3.2431640625, 3.56591796875, 3.888671875, 4.21142578125, 4.5341796875, 4.85693359375, 5.1796875, 5.50244140625, 5.8251953125, 6.14794921875, 6.470703125, 6.79345703125, 7.1162109375, 7.43896484375, 7.76171875, 8.08447265625, 8.4072265625, 8.72998046875, 9.052734375, 9.37548828125, 9.6982421875, 10.02099609375, 10.34375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 15.0, 18.0, 15.0, 17.0, 19.0, 25.0, 29.0, 18.0, 37.0, 40.0, 39.0, 28.0, 24.0, 49.0, 56.0, 43.0, 57.0, 36.0, 48.0, 49.0, 45.0, 26.0, 37.0, 35.0, 37.0, 26.0, 17.0, 24.0, 20.0, 17.0, 10.0, 8.0, 9.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.208251953125, -15.60400390625, -14.999755859375, -14.3955078125, -13.791259765625, -13.18701171875, -12.582763671875, -11.978515625, -11.374267578125, -10.77001953125, -10.165771484375, -9.5615234375, -8.957275390625, -8.35302734375, -7.748779296875, -7.14453125, -6.540283203125, -5.93603515625, -5.331787109375, -4.7275390625, -4.123291015625, -3.51904296875, -2.914794921875, -2.310546875, -1.706298828125, -1.10205078125, -0.497802734375, 0.1064453125, 0.710693359375, 1.31494140625, 1.919189453125, 2.5234375, 3.127685546875, 3.73193359375, 4.336181640625, 4.9404296875, 5.544677734375, 6.14892578125, 6.753173828125, 7.357421875, 7.961669921875, 8.56591796875, 9.170166015625, 9.7744140625, 10.378662109375, 10.98291015625, 11.587158203125, 12.19140625, 12.795654296875, 13.39990234375, 14.004150390625, 14.6083984375, 15.212646484375, 15.81689453125, 16.421142578125, 17.025390625, 17.629638671875, 18.23388671875, 18.838134765625, 19.4423828125, 20.046630859375, 20.65087890625, 21.255126953125, 21.859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 10.0, 15.0, 22.0, 29.0, 41.0, 82.0, 128.0, 252.0, 351.0, 578.0, 1047.0, 1687.0, 2844.0, 4905.0, 7755.0, 12535.0, 19481.0, 29299.0, 41941.0, 57225.0, 74204.0, 89198.0, 101029.0, 106255.0, 104127.0, 95746.0, 81612.0, 66352.0, 49463.0, 35529.0, 24039.0, 15714.0, 9996.0, 6055.0, 3579.0, 2235.0, 1261.0, 792.0, 436.0, 281.0, 156.0, 97.0, 66.0, 36.0, 31.0, 14.0, 11.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.0078125, -3.88543701171875, -3.7630615234375, -3.64068603515625, -3.518310546875, -3.39593505859375, -3.2735595703125, -3.15118408203125, -3.02880859375, -2.90643310546875, -2.7840576171875, -2.66168212890625, -2.539306640625, -2.41693115234375, -2.2945556640625, -2.17218017578125, -2.0498046875, -1.92742919921875, -1.8050537109375, -1.68267822265625, -1.560302734375, -1.43792724609375, -1.3155517578125, -1.19317626953125, -1.07080078125, -0.94842529296875, -0.8260498046875, -0.70367431640625, -0.581298828125, -0.45892333984375, -0.3365478515625, -0.21417236328125, -0.091796875, 0.03057861328125, 0.1529541015625, 0.27532958984375, 0.397705078125, 0.52008056640625, 0.6424560546875, 0.76483154296875, 0.88720703125, 1.00958251953125, 1.1319580078125, 1.25433349609375, 1.376708984375, 1.49908447265625, 1.6214599609375, 1.74383544921875, 1.8662109375, 1.98858642578125, 2.1109619140625, 2.23333740234375, 2.355712890625, 2.47808837890625, 2.6004638671875, 2.72283935546875, 2.84521484375, 2.96759033203125, 3.0899658203125, 3.21234130859375, 3.334716796875, 3.45709228515625, 3.5794677734375, 3.70184326171875, 3.82421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 12.0, 8.0, 12.0, 11.0, 12.0, 14.0, 10.0, 27.0, 11.0, 25.0, 34.0, 38.0, 37.0, 33.0, 49.0, 37.0, 31.0, 47.0, 50.0, 51.0, 32.0, 49.0, 47.0, 30.0, 34.0, 37.0, 27.0, 27.0, 26.0, 18.0, 17.0, 13.0, 9.0, 10.0, 9.0, 15.0, 5.0, 10.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00044083595275878906, -0.0004268437623977661, -0.00041285157203674316, -0.0003988593816757202, -0.00038486719131469727, -0.0003708750009536743, -0.00035688281059265137, -0.0003428906202316284, -0.00032889842987060547, -0.0003149062395095825, -0.00030091404914855957, -0.0002869218587875366, -0.00027292966842651367, -0.0002589374780654907, -0.0002449452877044678, -0.00023095309734344482, -0.00021696090698242188, -0.00020296871662139893, -0.00018897652626037598, -0.00017498433589935303, -0.00016099214553833008, -0.00014699995517730713, -0.00013300776481628418, -0.00011901557445526123, -0.00010502338409423828, -9.103119373321533e-05, -7.703900337219238e-05, -6.304681301116943e-05, -4.9054622650146484e-05, -3.5062432289123535e-05, -2.1070241928100586e-05, -7.078051567077637e-06, 6.9141387939453125e-06, 2.0906329154968262e-05, 3.489851951599121e-05, 4.889070987701416e-05, 6.288290023803711e-05, 7.687509059906006e-05, 9.086728096008301e-05, 0.00010485947132110596, 0.0001188516616821289, 0.00013284385204315186, 0.0001468360424041748, 0.00016082823276519775, 0.0001748204231262207, 0.00018881261348724365, 0.0002028048038482666, 0.00021679699420928955, 0.0002307891845703125, 0.00024478137493133545, 0.0002587735652923584, 0.00027276575565338135, 0.0002867579460144043, 0.00030075013637542725, 0.0003147423267364502, 0.00032873451709747314, 0.0003427267074584961, 0.00035671889781951904, 0.000370711088180542, 0.00038470327854156494, 0.0003986954689025879, 0.00041268765926361084, 0.0004266798496246338, 0.00044067203998565674, 0.0004546642303466797]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 8.0, 12.0, 14.0, 22.0, 24.0, 49.0, 85.0, 123.0, 177.0, 317.0, 502.0, 733.0, 1257.0, 2094.0, 3463.0, 5720.0, 9661.0, 15390.0, 24832.0, 38024.0, 54360.0, 73719.0, 93306.0, 108417.0, 115994.0, 114644.0, 102980.0, 85164.0, 66177.0, 46756.0, 31776.0, 20581.0, 12736.0, 7647.0, 4735.0, 2831.0, 1636.0, 927.0, 618.0, 385.0, 223.0, 162.0, 94.0, 64.0, 36.0, 30.0, 21.0, 17.0, 9.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.4375, -4.29791259765625, -4.1583251953125, -4.01873779296875, -3.879150390625, -3.73956298828125, -3.5999755859375, -3.46038818359375, -3.32080078125, -3.18121337890625, -3.0416259765625, -2.90203857421875, -2.762451171875, -2.62286376953125, -2.4832763671875, -2.34368896484375, -2.2041015625, -2.06451416015625, -1.9249267578125, -1.78533935546875, -1.645751953125, -1.50616455078125, -1.3665771484375, -1.22698974609375, -1.08740234375, -0.94781494140625, -0.8082275390625, -0.66864013671875, -0.529052734375, -0.38946533203125, -0.2498779296875, -0.11029052734375, 0.029296875, 0.16888427734375, 0.3084716796875, 0.44805908203125, 0.587646484375, 0.72723388671875, 0.8668212890625, 1.00640869140625, 1.14599609375, 1.28558349609375, 1.4251708984375, 1.56475830078125, 1.704345703125, 1.84393310546875, 1.9835205078125, 2.12310791015625, 2.2626953125, 2.40228271484375, 2.5418701171875, 2.68145751953125, 2.821044921875, 2.96063232421875, 3.1002197265625, 3.23980712890625, 3.37939453125, 3.51898193359375, 3.6585693359375, 3.79815673828125, 3.937744140625, 4.07733154296875, 4.2169189453125, 4.35650634765625, 4.49609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 3.0, 11.0, 7.0, 15.0, 22.0, 27.0, 34.0, 40.0, 40.0, 50.0, 61.0, 63.0, 55.0, 74.0, 57.0, 60.0, 58.0, 67.0, 52.0, 31.0, 38.0, 19.0, 27.0, 24.0, 20.0, 9.0, 5.0, 1.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.541015625, -2.455780029296875, -2.37054443359375, -2.285308837890625, -2.2000732421875, -2.114837646484375, -2.02960205078125, -1.944366455078125, -1.859130859375, -1.773895263671875, -1.68865966796875, -1.603424072265625, -1.5181884765625, -1.432952880859375, -1.34771728515625, -1.262481689453125, -1.17724609375, -1.092010498046875, -1.00677490234375, -0.921539306640625, -0.8363037109375, -0.751068115234375, -0.66583251953125, -0.580596923828125, -0.495361328125, -0.410125732421875, -0.32489013671875, -0.239654541015625, -0.1544189453125, -0.069183349609375, 0.01605224609375, 0.101287841796875, 0.1865234375, 0.271759033203125, 0.35699462890625, 0.442230224609375, 0.5274658203125, 0.612701416015625, 0.69793701171875, 0.783172607421875, 0.868408203125, 0.953643798828125, 1.03887939453125, 1.124114990234375, 1.2093505859375, 1.294586181640625, 1.37982177734375, 1.465057373046875, 1.55029296875, 1.635528564453125, 1.72076416015625, 1.805999755859375, 1.8912353515625, 1.976470947265625, 2.06170654296875, 2.146942138671875, 2.232177734375, 2.317413330078125, 2.40264892578125, 2.487884521484375, 2.5731201171875, 2.658355712890625, 2.74359130859375, 2.828826904296875, 2.9140625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 7.0, 2.0, 3.0, 3.0, 8.0, 10.0, 9.0, 11.0, 15.0, 18.0, 16.0, 15.0, 29.0, 32.0, 31.0, 28.0, 48.0, 49.0, 42.0, 39.0, 32.0, 44.0, 44.0, 56.0, 56.0, 47.0, 43.0, 33.0, 24.0, 32.0, 37.0, 25.0, 29.0, 16.0, 15.0, 10.0, 8.0, 5.0, 4.0, 7.0, 7.0, 9.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.956127166748047, -23.24897575378418, -22.541824340820312, -21.834674835205078, -21.12752342224121, -20.420372009277344, -19.713220596313477, -19.00606918334961, -18.298919677734375, -17.591768264770508, -16.88461685180664, -16.177467346191406, -15.470315933227539, -14.763164520263672, -14.056013107299805, -13.348862648010254, -12.641711235046387, -11.93455982208252, -11.227409362792969, -10.520257949829102, -9.81310749053955, -9.105956077575684, -8.398805618286133, -7.691654205322266, -6.984503269195557, -6.277352333068848, -5.570201396942139, -4.86305046081543, -4.1558990478515625, -3.4487483501434326, -2.7415971755981445, -2.0344462394714355, -1.3272953033447266, -0.6201443076133728, 0.08700668811798096, 0.7941577434539795, 1.5013086795806885, 2.2084596157073975, 2.9156107902526855, 3.6227617263793945, 4.3299126625061035, 5.0370635986328125, 5.7442145347595215, 6.4513654708862305, 7.158516883850098, 7.865667343139648, 8.572818756103516, 9.279970169067383, 9.987120628356934, 10.6942720413208, 11.401422500610352, 12.108573913574219, 12.81572437286377, 13.522875785827637, 14.230026245117188, 14.937177658081055, 15.644329071044922, 16.35148048400879, 17.058631896972656, 17.76578140258789, 18.472932815551758, 19.180084228515625, 19.887235641479492, 20.59438705444336, 21.301536560058594]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 8.0, 7.0, 9.0, 12.0, 9.0, 15.0, 25.0, 20.0, 31.0, 30.0, 34.0, 28.0, 34.0, 36.0, 31.0, 25.0, 47.0, 45.0, 35.0, 39.0, 41.0, 41.0, 31.0, 36.0, 23.0, 40.0, 30.0, 31.0, 27.0, 25.0, 26.0, 20.0, 15.0, 9.0, 11.0, 14.0, 8.0, 12.0, 6.0, 5.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.08310890197754, -26.21101951599121, -25.338930130004883, -24.466840744018555, -23.594751358032227, -22.72266387939453, -21.850574493408203, -20.978485107421875, -20.106395721435547, -19.23430633544922, -18.36221694946289, -17.490127563476562, -16.618038177490234, -15.745949745178223, -14.873860359191895, -14.001771926879883, -13.129681587219238, -12.25759220123291, -11.385502815246582, -10.51341438293457, -9.641324996948242, -8.769235610961914, -7.897146224975586, -7.025057315826416, -6.152967929840088, -5.28087854385376, -4.40878963470459, -3.5367002487182617, -2.6646111011505127, -1.7925219535827637, -0.9204325675964355, -0.048343658447265625, 0.8237457275390625, 1.6958348751068115, 2.5679240226745605, 3.4400134086608887, 4.312102317810059, 5.184191703796387, 6.056281089782715, 6.928369998931885, 7.800459384918213, 8.672548294067383, 9.544637680053711, 10.416727066040039, 11.288816452026367, 12.160905838012695, 13.032995223999023, 13.905083656311035, 14.777173042297363, 15.649262428283691, 16.521350860595703, 17.39344024658203, 18.26552963256836, 19.137619018554688, 20.009708404541016, 20.881797790527344, 21.753887176513672, 22.6259765625, 23.498065948486328, 24.370155334472656, 25.242244720458984, 26.114334106445312, 26.98642349243164, 27.858510971069336, 28.730600357055664]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 21.0, 59.0, 104.0, 157.0, 304.0, 550.0, 1018.0, 1762.0, 2982.0, 5187.0, 8743.0, 15033.0, 24482.0, 39851.0, 63770.0, 99411.0, 148066.0, 210314.0, 283273.0, 358261.0, 419378.0, 451482.0, 446545.0, 408927.0, 344271.0, 270687.0, 199546.0, 139534.0, 93210.0, 60768.0, 38139.0, 23420.0, 14305.0, 8580.0, 5029.0, 2931.0, 1741.0, 1030.0, 586.0, 372.0, 192.0, 115.0, 57.0, 27.0, 24.0, 18.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.703369140625, -18.07861328125, -17.453857421875, -16.8291015625, -16.204345703125, -15.57958984375, -14.954833984375, -14.330078125, -13.705322265625, -13.08056640625, -12.455810546875, -11.8310546875, -11.206298828125, -10.58154296875, -9.956787109375, -9.33203125, -8.707275390625, -8.08251953125, -7.457763671875, -6.8330078125, -6.208251953125, -5.58349609375, -4.958740234375, -4.333984375, -3.709228515625, -3.08447265625, -2.459716796875, -1.8349609375, -1.210205078125, -0.58544921875, 0.039306640625, 0.6640625, 1.288818359375, 1.91357421875, 2.538330078125, 3.1630859375, 3.787841796875, 4.41259765625, 5.037353515625, 5.662109375, 6.286865234375, 6.91162109375, 7.536376953125, 8.1611328125, 8.785888671875, 9.41064453125, 10.035400390625, 10.66015625, 11.284912109375, 11.90966796875, 12.534423828125, 13.1591796875, 13.783935546875, 14.40869140625, 15.033447265625, 15.658203125, 16.282958984375, 16.90771484375, 17.532470703125, 18.1572265625, 18.781982421875, 19.40673828125, 20.031494140625, 20.65625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 1.0, 5.0, 6.0, 4.0, 3.0, 11.0, 10.0, 15.0, 14.0, 11.0, 16.0, 29.0, 22.0, 21.0, 33.0, 31.0, 37.0, 26.0, 34.0, 36.0, 42.0, 38.0, 34.0, 34.0, 36.0, 41.0, 37.0, 25.0, 32.0, 40.0, 25.0, 21.0, 39.0, 22.0, 20.0, 18.0, 19.0, 19.0, 12.0, 12.0, 11.0, 11.0, 6.0, 9.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-23.578125, -22.855712890625, -22.13330078125, -21.410888671875, -20.6884765625, -19.966064453125, -19.24365234375, -18.521240234375, -17.798828125, -17.076416015625, -16.35400390625, -15.631591796875, -14.9091796875, -14.186767578125, -13.46435546875, -12.741943359375, -12.01953125, -11.297119140625, -10.57470703125, -9.852294921875, -9.1298828125, -8.407470703125, -7.68505859375, -6.962646484375, -6.240234375, -5.517822265625, -4.79541015625, -4.072998046875, -3.3505859375, -2.628173828125, -1.90576171875, -1.183349609375, -0.4609375, 0.261474609375, 0.98388671875, 1.706298828125, 2.4287109375, 3.151123046875, 3.87353515625, 4.595947265625, 5.318359375, 6.040771484375, 6.76318359375, 7.485595703125, 8.2080078125, 8.930419921875, 9.65283203125, 10.375244140625, 11.09765625, 11.820068359375, 12.54248046875, 13.264892578125, 13.9873046875, 14.709716796875, 15.43212890625, 16.154541015625, 16.876953125, 17.599365234375, 18.32177734375, 19.044189453125, 19.7666015625, 20.489013671875, 21.21142578125, 21.933837890625, 22.65625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 11.0, 17.0, 29.0, 48.0, 82.0, 153.0, 237.0, 432.0, 657.0, 1046.0, 1823.0, 3252.0, 5338.0, 8809.0, 14470.0, 23970.0, 37332.0, 58328.0, 88078.0, 128398.0, 178496.0, 238227.0, 299969.0, 357312.0, 398994.0, 415457.0, 405786.0, 366649.0, 313454.0, 251700.0, 190159.0, 138586.0, 94907.0, 64015.0, 41352.0, 26057.0, 16287.0, 9740.0, 5884.0, 3465.0, 2180.0, 1269.0, 720.0, 449.0, 278.0, 141.0, 104.0, 63.0, 31.0, 19.0, 8.0, 8.0, 6.0, 3.0, 2.0], "bins": [-21.796875, -21.1669921875, -20.537109375, -19.9072265625, -19.27734375, -18.6474609375, -18.017578125, -17.3876953125, -16.7578125, -16.1279296875, -15.498046875, -14.8681640625, -14.23828125, -13.6083984375, -12.978515625, -12.3486328125, -11.71875, -11.0888671875, -10.458984375, -9.8291015625, -9.19921875, -8.5693359375, -7.939453125, -7.3095703125, -6.6796875, -6.0498046875, -5.419921875, -4.7900390625, -4.16015625, -3.5302734375, -2.900390625, -2.2705078125, -1.640625, -1.0107421875, -0.380859375, 0.2490234375, 0.87890625, 1.5087890625, 2.138671875, 2.7685546875, 3.3984375, 4.0283203125, 4.658203125, 5.2880859375, 5.91796875, 6.5478515625, 7.177734375, 7.8076171875, 8.4375, 9.0673828125, 9.697265625, 10.3271484375, 10.95703125, 11.5869140625, 12.216796875, 12.8466796875, 13.4765625, 14.1064453125, 14.736328125, 15.3662109375, 15.99609375, 16.6259765625, 17.255859375, 17.8857421875, 18.515625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 18.0, 23.0, 21.0, 37.0, 44.0, 58.0, 67.0, 80.0, 102.0, 112.0, 125.0, 160.0, 177.0, 202.0, 214.0, 222.0, 234.0, 207.0, 210.0, 212.0, 187.0, 193.0, 168.0, 176.0, 146.0, 123.0, 116.0, 80.0, 74.0, 61.0, 41.0, 39.0, 30.0, 22.0, 19.0, 15.0, 17.0, 6.0, 6.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.90625, -12.4854736328125, -12.064697265625, -11.6439208984375, -11.22314453125, -10.8023681640625, -10.381591796875, -9.9608154296875, -9.5400390625, -9.1192626953125, -8.698486328125, -8.2777099609375, -7.85693359375, -7.4361572265625, -7.015380859375, -6.5946044921875, -6.173828125, -5.7530517578125, -5.332275390625, -4.9114990234375, -4.49072265625, -4.0699462890625, -3.649169921875, -3.2283935546875, -2.8076171875, -2.3868408203125, -1.966064453125, -1.5452880859375, -1.12451171875, -0.7037353515625, -0.282958984375, 0.1378173828125, 0.55859375, 0.9793701171875, 1.400146484375, 1.8209228515625, 2.24169921875, 2.6624755859375, 3.083251953125, 3.5040283203125, 3.9248046875, 4.3455810546875, 4.766357421875, 5.1871337890625, 5.60791015625, 6.0286865234375, 6.449462890625, 6.8702392578125, 7.291015625, 7.7117919921875, 8.132568359375, 8.5533447265625, 8.97412109375, 9.3948974609375, 9.815673828125, 10.2364501953125, 10.6572265625, 11.0780029296875, 11.498779296875, 11.9195556640625, 12.34033203125, 12.7611083984375, 13.181884765625, 13.6026611328125, 14.0234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 10.0, 5.0, 12.0, 10.0, 14.0, 19.0, 25.0, 29.0, 40.0, 37.0, 44.0, 44.0, 55.0, 51.0, 62.0, 56.0, 50.0, 61.0, 59.0, 49.0, 45.0, 34.0, 36.0, 32.0, 18.0, 18.0, 23.0, 8.0, 9.0, 13.0, 8.0, 1.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.709590911865234, -33.64313888549805, -32.57668685913086, -31.510234832763672, -30.443784713745117, -29.37733268737793, -28.310880661010742, -27.244428634643555, -26.177978515625, -25.111526489257812, -24.045074462890625, -22.978622436523438, -21.912172317504883, -20.845720291137695, -19.779268264770508, -18.71281623840332, -17.646364212036133, -16.579912185668945, -15.513461112976074, -14.447009086608887, -13.380558013916016, -12.314105987548828, -11.24765396118164, -10.181201934814453, -9.114750862121582, -8.048298835754395, -6.981847763061523, -5.915395736694336, -4.848944187164307, -3.7824926376342773, -2.71604061126709, -1.6495890617370605, -0.5831375122070312, 0.4833141565322876, 1.5497658252716064, 2.616217613220215, 3.682669162750244, 4.749120712280273, 5.815572738647461, 6.88202428817749, 7.9484758377075195, 9.014927864074707, 10.081378936767578, 11.147830963134766, 12.214282989501953, 13.280734062194824, 14.347186088562012, 15.413637161254883, 16.48008918762207, 17.546541213989258, 18.612993240356445, 19.679443359375, 20.745895385742188, 21.812347412109375, 22.878799438476562, 23.94525146484375, 25.011703491210938, 26.078155517578125, 27.144607543945312, 28.2110595703125, 29.277509689331055, 30.343961715698242, 31.41041374206543, 32.476863861083984, 33.54331588745117]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 9.0, 16.0, 13.0, 12.0, 16.0, 11.0, 22.0, 28.0, 30.0, 20.0, 33.0, 27.0, 32.0, 36.0, 39.0, 43.0, 26.0, 39.0, 45.0, 37.0, 46.0, 35.0, 26.0, 39.0, 33.0, 24.0, 25.0, 30.0, 22.0, 22.0, 19.0, 15.0, 17.0, 22.0, 11.0, 12.0, 8.0, 5.0, 6.0, 7.0, 2.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-31.980066299438477, -30.99169158935547, -30.003314971923828, -29.01494026184082, -28.026565551757812, -27.038188934326172, -26.049814224243164, -25.061439514160156, -24.073062896728516, -23.084688186645508, -22.096311569213867, -21.10793685913086, -20.11956214904785, -19.131187438964844, -18.142810821533203, -17.154436111450195, -16.166061401367188, -15.177685737609863, -14.189311027526855, -13.200935363769531, -12.212560653686523, -11.2241849899292, -10.235809326171875, -9.247434616088867, -8.259058952331543, -7.270683765411377, -6.282308578491211, -5.293932914733887, -4.305557727813721, -3.3171825408935547, -2.3288068771362305, -1.3404316902160645, -0.35205841064453125, 0.6363168954849243, 1.6246922016143799, 2.613067626953125, 3.601442813873291, 4.589818000793457, 5.578193664550781, 6.566568851470947, 7.554944038391113, 8.543319702148438, 9.531694412231445, 10.52007007598877, 11.508445739746094, 12.496820449829102, 13.485196113586426, 14.47357177734375, 15.461946487426758, 16.450321197509766, 17.438697814941406, 18.427072525024414, 19.415447235107422, 20.403823852539062, 21.39219856262207, 22.380573272705078, 23.36894989013672, 24.357324600219727, 25.345701217651367, 26.334075927734375, 27.322450637817383, 28.31082534790039, 29.29920196533203, 30.28757667541504, 31.275951385498047]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 11.0, 10.0, 22.0, 28.0, 33.0, 47.0, 72.0, 151.0, 233.0, 314.0, 504.0, 740.0, 1321.0, 1948.0, 3129.0, 4961.0, 8449.0, 13930.0, 23484.0, 39217.0, 67090.0, 113082.0, 181086.0, 213717.0, 150940.0, 90591.0, 53603.0, 31949.0, 18774.0, 11212.0, 6703.0, 4181.0, 2551.0, 1572.0, 994.0, 657.0, 420.0, 312.0, 173.0, 129.0, 81.0, 47.0, 38.0, 18.0, 12.0, 8.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33984375, -3.229583740234375, -3.11932373046875, -3.009063720703125, -2.8988037109375, -2.788543701171875, -2.67828369140625, -2.568023681640625, -2.457763671875, -2.347503662109375, -2.23724365234375, -2.126983642578125, -2.0167236328125, -1.906463623046875, -1.79620361328125, -1.685943603515625, -1.57568359375, -1.465423583984375, -1.35516357421875, -1.244903564453125, -1.1346435546875, -1.024383544921875, -0.91412353515625, -0.803863525390625, -0.693603515625, -0.583343505859375, -0.47308349609375, -0.362823486328125, -0.2525634765625, -0.142303466796875, -0.03204345703125, 0.078216552734375, 0.1884765625, 0.298736572265625, 0.40899658203125, 0.519256591796875, 0.6295166015625, 0.739776611328125, 0.85003662109375, 0.960296630859375, 1.070556640625, 1.180816650390625, 1.29107666015625, 1.401336669921875, 1.5115966796875, 1.621856689453125, 1.73211669921875, 1.842376708984375, 1.95263671875, 2.062896728515625, 2.17315673828125, 2.283416748046875, 2.3936767578125, 2.503936767578125, 2.61419677734375, 2.724456787109375, 2.834716796875, 2.944976806640625, 3.05523681640625, 3.165496826171875, 3.2757568359375, 3.386016845703125, 3.49627685546875, 3.606536865234375, 3.716796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 6.0, 8.0, 16.0, 12.0, 12.0, 13.0, 11.0, 16.0, 19.0, 31.0, 28.0, 38.0, 32.0, 37.0, 39.0, 43.0, 33.0, 39.0, 37.0, 46.0, 33.0, 53.0, 34.0, 41.0, 40.0, 30.0, 36.0, 31.0, 22.0, 25.0, 22.0, 20.0, 16.0, 16.0, 15.0, 12.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.1875, -33.05859375, -31.9296875, -30.80078125, -29.671875, -28.54296875, -27.4140625, -26.28515625, -25.15625, -24.02734375, -22.8984375, -21.76953125, -20.640625, -19.51171875, -18.3828125, -17.25390625, -16.125, -14.99609375, -13.8671875, -12.73828125, -11.609375, -10.48046875, -9.3515625, -8.22265625, -7.09375, -5.96484375, -4.8359375, -3.70703125, -2.578125, -1.44921875, -0.3203125, 0.80859375, 1.9375, 3.06640625, 4.1953125, 5.32421875, 6.453125, 7.58203125, 8.7109375, 9.83984375, 10.96875, 12.09765625, 13.2265625, 14.35546875, 15.484375, 16.61328125, 17.7421875, 18.87109375, 20.0, 21.12890625, 22.2578125, 23.38671875, 24.515625, 25.64453125, 26.7734375, 27.90234375, 29.03125, 30.16015625, 31.2890625, 32.41796875, 33.546875, 34.67578125, 35.8046875, 36.93359375, 38.0625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 10.0, 11.0, 17.0, 29.0, 38.0, 44.0, 67.0, 94.0, 133.0, 188.0, 321.0, 453.0, 646.0, 989.0, 1451.0, 2197.0, 3475.0, 5602.0, 8905.0, 14347.0, 23160.0, 38332.0, 62848.0, 101035.0, 156368.0, 199579.0, 158780.0, 102869.0, 63858.0, 39327.0, 23908.0, 14395.0, 9024.0, 5665.0, 3550.0, 2251.0, 1462.0, 1019.0, 692.0, 438.0, 302.0, 207.0, 127.0, 106.0, 65.0, 39.0, 43.0, 22.0, 22.0, 15.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.71875, -3.60076904296875, -3.4827880859375, -3.36480712890625, -3.246826171875, -3.12884521484375, -3.0108642578125, -2.89288330078125, -2.77490234375, -2.65692138671875, -2.5389404296875, -2.42095947265625, -2.302978515625, -2.18499755859375, -2.0670166015625, -1.94903564453125, -1.8310546875, -1.71307373046875, -1.5950927734375, -1.47711181640625, -1.359130859375, -1.24114990234375, -1.1231689453125, -1.00518798828125, -0.88720703125, -0.76922607421875, -0.6512451171875, -0.53326416015625, -0.415283203125, -0.29730224609375, -0.1793212890625, -0.06134033203125, 0.056640625, 0.17462158203125, 0.2926025390625, 0.41058349609375, 0.528564453125, 0.64654541015625, 0.7645263671875, 0.88250732421875, 1.00048828125, 1.11846923828125, 1.2364501953125, 1.35443115234375, 1.472412109375, 1.59039306640625, 1.7083740234375, 1.82635498046875, 1.9443359375, 2.06231689453125, 2.1802978515625, 2.29827880859375, 2.416259765625, 2.53424072265625, 2.6522216796875, 2.77020263671875, 2.88818359375, 3.00616455078125, 3.1241455078125, 3.24212646484375, 3.360107421875, 3.47808837890625, 3.5960693359375, 3.71405029296875, 3.83203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 9.0, 6.0, 12.0, 17.0, 10.0, 16.0, 16.0, 25.0, 26.0, 37.0, 20.0, 23.0, 27.0, 34.0, 42.0, 31.0, 41.0, 36.0, 45.0, 49.0, 36.0, 24.0, 37.0, 36.0, 35.0, 39.0, 37.0, 32.0, 30.0, 21.0, 15.0, 22.0, 13.0, 9.0, 10.0, 19.0, 12.0, 7.0, 7.0, 8.0, 3.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-22.71875, -22.06005859375, -21.4013671875, -20.74267578125, -20.083984375, -19.42529296875, -18.7666015625, -18.10791015625, -17.44921875, -16.79052734375, -16.1318359375, -15.47314453125, -14.814453125, -14.15576171875, -13.4970703125, -12.83837890625, -12.1796875, -11.52099609375, -10.8623046875, -10.20361328125, -9.544921875, -8.88623046875, -8.2275390625, -7.56884765625, -6.91015625, -6.25146484375, -5.5927734375, -4.93408203125, -4.275390625, -3.61669921875, -2.9580078125, -2.29931640625, -1.640625, -0.98193359375, -0.3232421875, 0.33544921875, 0.994140625, 1.65283203125, 2.3115234375, 2.97021484375, 3.62890625, 4.28759765625, 4.9462890625, 5.60498046875, 6.263671875, 6.92236328125, 7.5810546875, 8.23974609375, 8.8984375, 9.55712890625, 10.2158203125, 10.87451171875, 11.533203125, 12.19189453125, 12.8505859375, 13.50927734375, 14.16796875, 14.82666015625, 15.4853515625, 16.14404296875, 16.802734375, 17.46142578125, 18.1201171875, 18.77880859375, 19.4375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 13.0, 13.0, 15.0, 25.0, 35.0, 47.0, 93.0, 119.0, 186.0, 295.0, 410.0, 648.0, 966.0, 1495.0, 2197.0, 3411.0, 5557.0, 9309.0, 15294.0, 26141.0, 46025.0, 85157.0, 165816.0, 267319.0, 192081.0, 99200.0, 52805.0, 29358.0, 16817.0, 10026.0, 6392.0, 4097.0, 2544.0, 1588.0, 1068.0, 641.0, 429.0, 303.0, 166.0, 143.0, 104.0, 65.0, 49.0, 30.0, 21.0, 15.0, 7.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10355091094970703, -0.10016822814941406, -0.0967855453491211, -0.09340286254882812, -0.09002017974853516, -0.08663749694824219, -0.08325481414794922, -0.07987213134765625, -0.07648944854736328, -0.07310676574707031, -0.06972408294677734, -0.06634140014648438, -0.0629587173461914, -0.05957603454589844, -0.05619335174560547, -0.0528106689453125, -0.04942798614501953, -0.04604530334472656, -0.042662620544433594, -0.039279937744140625, -0.035897254943847656, -0.03251457214355469, -0.02913188934326172, -0.02574920654296875, -0.02236652374267578, -0.018983840942382812, -0.015601158142089844, -0.012218475341796875, -0.008835792541503906, -0.0054531097412109375, -0.0020704269409179688, 0.001312255859375, 0.004694938659667969, 0.008077621459960938, 0.011460304260253906, 0.014842987060546875, 0.018225669860839844, 0.021608352661132812, 0.02499103546142578, 0.02837371826171875, 0.03175640106201172, 0.03513908386230469, 0.038521766662597656, 0.041904449462890625, 0.045287132263183594, 0.04866981506347656, 0.05205249786376953, 0.0554351806640625, 0.05881786346435547, 0.06220054626464844, 0.0655832290649414, 0.06896591186523438, 0.07234859466552734, 0.07573127746582031, 0.07911396026611328, 0.08249664306640625, 0.08587932586669922, 0.08926200866699219, 0.09264469146728516, 0.09602737426757812, 0.0994100570678711, 0.10279273986816406, 0.10617542266845703, 0.10955810546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 8.0, 12.0, 11.0, 20.0, 11.0, 17.0, 27.0, 23.0, 39.0, 38.0, 25.0, 43.0, 36.0, 42.0, 36.0, 48.0, 38.0, 72.0, 49.0, 44.0, 44.0, 50.0, 50.0, 37.0, 33.0, 30.0, 22.0, 15.0, 14.0, 12.0, 12.0, 10.0, 9.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.014636993408203e-05, -1.9420869648456573e-05, -1.8695369362831116e-05, -1.7969869077205658e-05, -1.72443687915802e-05, -1.6518868505954742e-05, -1.5793368220329285e-05, -1.5067867934703827e-05, -1.4342367649078369e-05, -1.3616867363452911e-05, -1.2891367077827454e-05, -1.2165866792201996e-05, -1.1440366506576538e-05, -1.071486622095108e-05, -9.989365935325623e-06, -9.263865649700165e-06, -8.538365364074707e-06, -7.81286507844925e-06, -7.0873647928237915e-06, -6.361864507198334e-06, -5.636364221572876e-06, -4.910863935947418e-06, -4.1853636503219604e-06, -3.4598633646965027e-06, -2.734363079071045e-06, -2.008862793445587e-06, -1.2833625078201294e-06, -5.578622221946716e-07, 1.6763806343078613e-07, 8.931383490562439e-07, 1.6186386346817017e-06, 2.3441389203071594e-06, 3.069639205932617e-06, 3.795139491558075e-06, 4.520639777183533e-06, 5.2461400628089905e-06, 5.971640348434448e-06, 6.697140634059906e-06, 7.422640919685364e-06, 8.148141205310822e-06, 8.87364149093628e-06, 9.599141776561737e-06, 1.0324642062187195e-05, 1.1050142347812653e-05, 1.177564263343811e-05, 1.2501142919063568e-05, 1.3226643204689026e-05, 1.3952143490314484e-05, 1.4677643775939941e-05, 1.54031440615654e-05, 1.6128644347190857e-05, 1.6854144632816315e-05, 1.7579644918441772e-05, 1.830514520406723e-05, 1.9030645489692688e-05, 1.9756145775318146e-05, 2.0481646060943604e-05, 2.120714634656906e-05, 2.193264663219452e-05, 2.2658146917819977e-05, 2.3383647203445435e-05, 2.4109147489070892e-05, 2.483464777469635e-05, 2.5560148060321808e-05, 2.6285648345947266e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 11.0, 9.0, 9.0, 14.0, 27.0, 53.0, 72.0, 84.0, 160.0, 226.0, 357.0, 577.0, 843.0, 1302.0, 1834.0, 2833.0, 4054.0, 6375.0, 9344.0, 14303.0, 21926.0, 35116.0, 56797.0, 99546.0, 195624.0, 262268.0, 136738.0, 74039.0, 44202.0, 27525.0, 17843.0, 11398.0, 7671.0, 5118.0, 3502.0, 2286.0, 1472.0, 1035.0, 670.0, 439.0, 309.0, 200.0, 124.0, 86.0, 56.0, 31.0, 24.0, 11.0, 9.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.2342529296875, -0.22720718383789062, -0.22016143798828125, -0.21311569213867188, -0.2060699462890625, -0.19902420043945312, -0.19197845458984375, -0.18493270874023438, -0.177886962890625, -0.17084121704101562, -0.16379547119140625, -0.15674972534179688, -0.1497039794921875, -0.14265823364257812, -0.13561248779296875, -0.12856674194335938, -0.12152099609375, -0.11447525024414062, -0.10742950439453125, -0.10038375854492188, -0.0933380126953125, -0.08629226684570312, -0.07924652099609375, -0.07220077514648438, -0.065155029296875, -0.058109283447265625, -0.05106353759765625, -0.044017791748046875, -0.0369720458984375, -0.029926300048828125, -0.02288055419921875, -0.015834808349609375, -0.0087890625, -0.001743316650390625, 0.00530242919921875, 0.012348175048828125, 0.0193939208984375, 0.026439666748046875, 0.03348541259765625, 0.040531158447265625, 0.047576904296875, 0.054622650146484375, 0.06166839599609375, 0.06871414184570312, 0.0757598876953125, 0.08280563354492188, 0.08985137939453125, 0.09689712524414062, 0.10394287109375, 0.11098861694335938, 0.11803436279296875, 0.12508010864257812, 0.1321258544921875, 0.13917160034179688, 0.14621734619140625, 0.15326309204101562, 0.160308837890625, 0.16735458374023438, 0.17440032958984375, 0.18144607543945312, 0.1884918212890625, 0.19553756713867188, 0.20258331298828125, 0.20962905883789062, 0.2166748046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 5.0, 7.0, 9.0, 8.0, 9.0, 17.0, 8.0, 15.0, 21.0, 18.0, 26.0, 28.0, 39.0, 69.0, 99.0, 176.0, 115.0, 89.0, 48.0, 34.0, 18.0, 24.0, 18.0, 19.0, 14.0, 17.0, 7.0, 8.0, 8.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10791587829589844, -0.10401535034179688, -0.10011482238769531, -0.09621429443359375, -0.09231376647949219, -0.08841323852539062, -0.08451271057128906, -0.0806121826171875, -0.07671165466308594, -0.07281112670898438, -0.06891059875488281, -0.06501007080078125, -0.06110954284667969, -0.057209014892578125, -0.05330848693847656, -0.049407958984375, -0.04550743103027344, -0.041606903076171875, -0.03770637512207031, -0.03380584716796875, -0.029905319213867188, -0.026004791259765625, -0.022104263305664062, -0.0182037353515625, -0.014303207397460938, -0.010402679443359375, -0.0065021514892578125, -0.00260162353515625, 0.0012989044189453125, 0.005199432373046875, 0.009099960327148438, 0.01300048828125, 0.016901016235351562, 0.020801544189453125, 0.024702072143554688, 0.02860260009765625, 0.03250312805175781, 0.036403656005859375, 0.04030418395996094, 0.0442047119140625, 0.04810523986816406, 0.052005767822265625, 0.05590629577636719, 0.05980682373046875, 0.06370735168457031, 0.06760787963867188, 0.07150840759277344, 0.075408935546875, 0.07930946350097656, 0.08320999145507812, 0.08711051940917969, 0.09101104736328125, 0.09491157531738281, 0.09881210327148438, 0.10271263122558594, 0.1066131591796875, 0.11051368713378906, 0.11441421508789062, 0.11831474304199219, 0.12221527099609375, 0.1261157989501953, 0.13001632690429688, 0.13391685485839844, 0.1378173828125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 2.0, 15.0, 9.0, 15.0, 14.0, 33.0, 25.0, 41.0, 33.0, 47.0, 44.0, 56.0, 57.0, 58.0, 58.0, 53.0, 59.0, 59.0, 46.0, 44.0, 39.0, 34.0, 33.0, 14.0, 21.0, 18.0, 14.0, 8.0, 11.0, 7.0, 2.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.00875473022461, -33.93449401855469, -32.860233306884766, -31.785972595214844, -30.711711883544922, -29.637451171875, -28.563190460205078, -27.488929748535156, -26.414669036865234, -25.340408325195312, -24.26614761352539, -23.19188690185547, -22.117626190185547, -21.043365478515625, -19.969104766845703, -18.89484405517578, -17.82058334350586, -16.746322631835938, -15.672061920166016, -14.597801208496094, -13.523540496826172, -12.44927978515625, -11.375019073486328, -10.300758361816406, -9.226497650146484, -8.152236938476562, -7.077976226806641, -6.003715515136719, -4.929454803466797, -3.855194091796875, -2.780933380126953, -1.7066726684570312, -0.6324119567871094, 0.4418487548828125, 1.5161094665527344, 2.5903701782226562, 3.664630889892578, 4.7388916015625, 5.813152313232422, 6.887413024902344, 7.961673736572266, 9.035934448242188, 10.11019515991211, 11.184455871582031, 12.258716583251953, 13.332977294921875, 14.407238006591797, 15.481498718261719, 16.55575942993164, 17.630020141601562, 18.704280853271484, 19.778541564941406, 20.852802276611328, 21.92706298828125, 23.001323699951172, 24.075584411621094, 25.149845123291016, 26.224105834960938, 27.29836654663086, 28.37262725830078, 29.446887969970703, 30.521148681640625, 31.595409393310547, 32.66967010498047, 33.74393081665039]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 8.0, 8.0, 11.0, 8.0, 16.0, 14.0, 11.0, 16.0, 11.0, 23.0, 27.0, 29.0, 23.0, 30.0, 28.0, 33.0, 36.0, 37.0, 44.0, 28.0, 40.0, 41.0, 40.0, 45.0, 34.0, 29.0, 37.0, 33.0, 25.0, 24.0, 31.0, 22.0, 23.0, 18.0, 15.0, 18.0, 20.0, 11.0, 11.0, 9.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-31.977569580078125, -30.98874855041504, -29.999929428100586, -29.0111083984375, -28.022289276123047, -27.03346824645996, -26.044647216796875, -25.055828094482422, -24.067007064819336, -23.07818603515625, -22.089366912841797, -21.10054588317871, -20.111726760864258, -19.122905731201172, -18.13408660888672, -17.145265579223633, -16.156444549560547, -15.167624473571777, -14.178804397583008, -13.189983367919922, -12.201163291931152, -11.212343215942383, -10.223523139953613, -9.234703063964844, -8.24588394165039, -7.257063865661621, -6.268243312835693, -5.279423236846924, -4.290602684020996, -3.3017826080322266, -2.312962532043457, -1.3241419792175293, -0.33532142639160156, 0.6534988284111023, 1.6423190832138062, 2.6311392784118652, 3.619959592819214, 4.6087799072265625, 5.597599983215332, 6.58642053604126, 7.575240612030029, 8.564061164855957, 9.552881240844727, 10.541701316833496, 11.530521392822266, 12.519342422485352, 13.508161544799805, 14.49698257446289, 15.48580265045166, 16.47462272644043, 17.463443756103516, 18.45226287841797, 19.441083908081055, 20.42990493774414, 21.418724060058594, 22.40754508972168, 23.396364212036133, 24.38518524169922, 25.374004364013672, 26.362825393676758, 27.35164451599121, 28.340465545654297, 29.32928466796875, 30.318105697631836, 31.306926727294922]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 19.0, 34.0, 39.0, 74.0, 133.0, 194.0, 301.0, 514.0, 806.0, 1257.0, 2074.0, 3368.0, 5091.0, 8117.0, 12402.0, 18308.0, 27098.0, 38227.0, 51872.0, 66952.0, 82201.0, 94042.0, 101037.0, 101200.0, 95985.0, 84438.0, 69959.0, 55008.0, 40737.0, 29190.0, 20193.0, 13505.0, 8840.0, 5651.0, 3613.0, 2291.0, 1406.0, 925.0, 580.0, 338.0, 187.0, 116.0, 93.0, 39.0, 31.0, 26.0, 15.0, 14.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.421875, -13.0037841796875, -12.585693359375, -12.1676025390625, -11.74951171875, -11.3314208984375, -10.913330078125, -10.4952392578125, -10.0771484375, -9.6590576171875, -9.240966796875, -8.8228759765625, -8.40478515625, -7.9866943359375, -7.568603515625, -7.1505126953125, -6.732421875, -6.3143310546875, -5.896240234375, -5.4781494140625, -5.06005859375, -4.6419677734375, -4.223876953125, -3.8057861328125, -3.3876953125, -2.9696044921875, -2.551513671875, -2.1334228515625, -1.71533203125, -1.2972412109375, -0.879150390625, -0.4610595703125, -0.04296875, 0.3751220703125, 0.793212890625, 1.2113037109375, 1.62939453125, 2.0474853515625, 2.465576171875, 2.8836669921875, 3.3017578125, 3.7198486328125, 4.137939453125, 4.5560302734375, 4.97412109375, 5.3922119140625, 5.810302734375, 6.2283935546875, 6.646484375, 7.0645751953125, 7.482666015625, 7.9007568359375, 8.31884765625, 8.7369384765625, 9.155029296875, 9.5731201171875, 9.9912109375, 10.4093017578125, 10.827392578125, 11.2454833984375, 11.66357421875, 12.0816650390625, 12.499755859375, 12.9178466796875, 13.3359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 7.0, 4.0, 12.0, 11.0, 13.0, 17.0, 16.0, 10.0, 24.0, 25.0, 25.0, 33.0, 31.0, 31.0, 44.0, 38.0, 28.0, 49.0, 49.0, 45.0, 53.0, 44.0, 45.0, 34.0, 25.0, 37.0, 31.0, 34.0, 24.0, 23.0, 19.0, 21.0, 22.0, 19.0, 15.0, 12.0, 6.0, 5.0, 5.0, 3.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -35.92578125, -34.7890625, -33.65234375, -32.515625, -31.37890625, -30.2421875, -29.10546875, -27.96875, -26.83203125, -25.6953125, -24.55859375, -23.421875, -22.28515625, -21.1484375, -20.01171875, -18.875, -17.73828125, -16.6015625, -15.46484375, -14.328125, -13.19140625, -12.0546875, -10.91796875, -9.78125, -8.64453125, -7.5078125, -6.37109375, -5.234375, -4.09765625, -2.9609375, -1.82421875, -0.6875, 0.44921875, 1.5859375, 2.72265625, 3.859375, 4.99609375, 6.1328125, 7.26953125, 8.40625, 9.54296875, 10.6796875, 11.81640625, 12.953125, 14.08984375, 15.2265625, 16.36328125, 17.5, 18.63671875, 19.7734375, 20.91015625, 22.046875, 23.18359375, 24.3203125, 25.45703125, 26.59375, 27.73046875, 28.8671875, 30.00390625, 31.140625, 32.27734375, 33.4140625, 34.55078125, 35.6875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 19.0, 20.0, 35.0, 57.0, 83.0, 121.0, 207.0, 320.0, 504.0, 773.0, 1243.0, 2052.0, 3124.0, 4717.0, 7047.0, 10915.0, 15641.0, 22365.0, 30727.0, 41619.0, 53389.0, 66370.0, 78724.0, 88020.0, 93264.0, 93518.0, 88688.0, 79080.0, 66990.0, 54658.0, 42158.0, 31387.0, 22777.0, 15984.0, 10913.0, 7346.0, 4952.0, 3089.0, 2026.0, 1311.0, 829.0, 569.0, 347.0, 207.0, 129.0, 83.0, 58.0, 39.0, 25.0, 11.0, 5.0, 5.0, 8.0, 5.0, 1.0, 1.0], "bins": [-13.2890625, -12.88671875, -12.484375, -12.08203125, -11.6796875, -11.27734375, -10.875, -10.47265625, -10.0703125, -9.66796875, -9.265625, -8.86328125, -8.4609375, -8.05859375, -7.65625, -7.25390625, -6.8515625, -6.44921875, -6.046875, -5.64453125, -5.2421875, -4.83984375, -4.4375, -4.03515625, -3.6328125, -3.23046875, -2.828125, -2.42578125, -2.0234375, -1.62109375, -1.21875, -0.81640625, -0.4140625, -0.01171875, 0.390625, 0.79296875, 1.1953125, 1.59765625, 2.0, 2.40234375, 2.8046875, 3.20703125, 3.609375, 4.01171875, 4.4140625, 4.81640625, 5.21875, 5.62109375, 6.0234375, 6.42578125, 6.828125, 7.23046875, 7.6328125, 8.03515625, 8.4375, 8.83984375, 9.2421875, 9.64453125, 10.046875, 10.44921875, 10.8515625, 11.25390625, 11.65625, 12.05859375, 12.4609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 8.0, 2.0, 9.0, 5.0, 11.0, 14.0, 13.0, 15.0, 24.0, 24.0, 18.0, 22.0, 34.0, 37.0, 41.0, 36.0, 49.0, 37.0, 43.0, 41.0, 46.0, 41.0, 25.0, 34.0, 52.0, 37.0, 37.0, 25.0, 35.0, 28.0, 30.0, 16.0, 21.0, 11.0, 14.0, 18.0, 9.0, 9.0, 3.0, 12.0, 1.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.859375, -20.1533203125, -19.447265625, -18.7412109375, -18.03515625, -17.3291015625, -16.623046875, -15.9169921875, -15.2109375, -14.5048828125, -13.798828125, -13.0927734375, -12.38671875, -11.6806640625, -10.974609375, -10.2685546875, -9.5625, -8.8564453125, -8.150390625, -7.4443359375, -6.73828125, -6.0322265625, -5.326171875, -4.6201171875, -3.9140625, -3.2080078125, -2.501953125, -1.7958984375, -1.08984375, -0.3837890625, 0.322265625, 1.0283203125, 1.734375, 2.4404296875, 3.146484375, 3.8525390625, 4.55859375, 5.2646484375, 5.970703125, 6.6767578125, 7.3828125, 8.0888671875, 8.794921875, 9.5009765625, 10.20703125, 10.9130859375, 11.619140625, 12.3251953125, 13.03125, 13.7373046875, 14.443359375, 15.1494140625, 15.85546875, 16.5615234375, 17.267578125, 17.9736328125, 18.6796875, 19.3857421875, 20.091796875, 20.7978515625, 21.50390625, 22.2099609375, 22.916015625, 23.6220703125, 24.328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 16.0, 16.0, 26.0, 36.0, 63.0, 105.0, 174.0, 268.0, 443.0, 683.0, 1165.0, 1910.0, 3173.0, 4831.0, 7921.0, 12156.0, 18099.0, 26837.0, 37353.0, 50313.0, 64637.0, 78492.0, 89566.0, 96863.0, 98521.0, 94657.0, 85255.0, 72748.0, 58752.0, 44892.0, 32798.0, 22990.0, 15397.0, 10231.0, 6430.0, 4068.0, 2542.0, 1597.0, 953.0, 601.0, 367.0, 251.0, 118.0, 87.0, 47.0, 43.0, 25.0, 16.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.8984375, -4.74676513671875, -4.5950927734375, -4.44342041015625, -4.291748046875, -4.14007568359375, -3.9884033203125, -3.83673095703125, -3.68505859375, -3.53338623046875, -3.3817138671875, -3.23004150390625, -3.078369140625, -2.92669677734375, -2.7750244140625, -2.62335205078125, -2.4716796875, -2.32000732421875, -2.1683349609375, -2.01666259765625, -1.864990234375, -1.71331787109375, -1.5616455078125, -1.40997314453125, -1.25830078125, -1.10662841796875, -0.9549560546875, -0.80328369140625, -0.651611328125, -0.49993896484375, -0.3482666015625, -0.19659423828125, -0.044921875, 0.10675048828125, 0.2584228515625, 0.41009521484375, 0.561767578125, 0.71343994140625, 0.8651123046875, 1.01678466796875, 1.16845703125, 1.32012939453125, 1.4718017578125, 1.62347412109375, 1.775146484375, 1.92681884765625, 2.0784912109375, 2.23016357421875, 2.3818359375, 2.53350830078125, 2.6851806640625, 2.83685302734375, 2.988525390625, 3.14019775390625, 3.2918701171875, 3.44354248046875, 3.59521484375, 3.74688720703125, 3.8985595703125, 4.05023193359375, 4.201904296875, 4.35357666015625, 4.5052490234375, 4.65692138671875, 4.80859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 4.0, 8.0, 4.0, 10.0, 10.0, 11.0, 19.0, 17.0, 18.0, 22.0, 30.0, 25.0, 28.0, 19.0, 30.0, 38.0, 28.0, 34.0, 39.0, 48.0, 39.0, 39.0, 34.0, 37.0, 43.0, 42.0, 38.0, 38.0, 27.0, 20.0, 22.0, 27.0, 20.0, 18.0, 10.0, 13.0, 19.0, 18.0, 8.0, 5.0, 4.0, 7.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.0006222724914550781, -0.0006042718887329102, -0.0005862712860107422, -0.0005682706832885742, -0.0005502700805664062, -0.0005322694778442383, -0.0005142688751220703, -0.0004962682723999023, -0.0004782676696777344, -0.0004602670669555664, -0.00044226646423339844, -0.00042426586151123047, -0.0004062652587890625, -0.00038826465606689453, -0.00037026405334472656, -0.0003522634506225586, -0.0003342628479003906, -0.00031626224517822266, -0.0002982616424560547, -0.0002802610397338867, -0.00026226043701171875, -0.0002442598342895508, -0.0002262592315673828, -0.00020825862884521484, -0.00019025802612304688, -0.0001722574234008789, -0.00015425682067871094, -0.00013625621795654297, -0.000118255615234375, -0.00010025501251220703, -8.225440979003906e-05, -6.42538070678711e-05, -4.6253204345703125e-05, -2.8252601623535156e-05, -1.0251998901367188e-05, 7.748603820800781e-06, 2.574920654296875e-05, 4.374980926513672e-05, 6.175041198730469e-05, 7.975101470947266e-05, 9.775161743164062e-05, 0.0001157522201538086, 0.00013375282287597656, 0.00015175342559814453, 0.0001697540283203125, 0.00018775463104248047, 0.00020575523376464844, 0.0002237558364868164, 0.00024175643920898438, 0.00025975704193115234, 0.0002777576446533203, 0.0002957582473754883, 0.00031375885009765625, 0.0003317594528198242, 0.0003497600555419922, 0.00036776065826416016, 0.0003857612609863281, 0.0004037618637084961, 0.00042176246643066406, 0.00043976306915283203, 0.000457763671875, 0.00047576427459716797, 0.0004937648773193359, 0.0005117654800415039, 0.0005297660827636719]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 16.0, 16.0, 30.0, 41.0, 85.0, 113.0, 169.0, 306.0, 473.0, 697.0, 1163.0, 1894.0, 3047.0, 5241.0, 8184.0, 13226.0, 20747.0, 31492.0, 45651.0, 63095.0, 81437.0, 97597.0, 108033.0, 111929.0, 106316.0, 93811.0, 76008.0, 58564.0, 41577.0, 28594.0, 18312.0, 11876.0, 7285.0, 4377.0, 2772.0, 1658.0, 1040.0, 644.0, 392.0, 217.0, 175.0, 100.0, 63.0, 40.0, 22.0, 16.0, 6.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.83984375, -5.659423828125, -5.47900390625, -5.298583984375, -5.1181640625, -4.937744140625, -4.75732421875, -4.576904296875, -4.396484375, -4.216064453125, -4.03564453125, -3.855224609375, -3.6748046875, -3.494384765625, -3.31396484375, -3.133544921875, -2.953125, -2.772705078125, -2.59228515625, -2.411865234375, -2.2314453125, -2.051025390625, -1.87060546875, -1.690185546875, -1.509765625, -1.329345703125, -1.14892578125, -0.968505859375, -0.7880859375, -0.607666015625, -0.42724609375, -0.246826171875, -0.06640625, 0.114013671875, 0.29443359375, 0.474853515625, 0.6552734375, 0.835693359375, 1.01611328125, 1.196533203125, 1.376953125, 1.557373046875, 1.73779296875, 1.918212890625, 2.0986328125, 2.279052734375, 2.45947265625, 2.639892578125, 2.8203125, 3.000732421875, 3.18115234375, 3.361572265625, 3.5419921875, 3.722412109375, 3.90283203125, 4.083251953125, 4.263671875, 4.444091796875, 4.62451171875, 4.804931640625, 4.9853515625, 5.165771484375, 5.34619140625, 5.526611328125, 5.70703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 4.0, 10.0, 12.0, 8.0, 15.0, 18.0, 17.0, 28.0, 25.0, 31.0, 30.0, 33.0, 46.0, 55.0, 46.0, 44.0, 47.0, 54.0, 41.0, 41.0, 47.0, 52.0, 33.0, 42.0, 23.0, 23.0, 27.0, 21.0, 18.0, 21.0, 9.0, 12.0, 8.0, 11.0, 2.0, 5.0, 6.0, 1.0, 4.0, 9.0, 1.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-3.060546875, -2.9644775390625, -2.868408203125, -2.7723388671875, -2.67626953125, -2.5802001953125, -2.484130859375, -2.3880615234375, -2.2919921875, -2.1959228515625, -2.099853515625, -2.0037841796875, -1.90771484375, -1.8116455078125, -1.715576171875, -1.6195068359375, -1.5234375, -1.4273681640625, -1.331298828125, -1.2352294921875, -1.13916015625, -1.0430908203125, -0.947021484375, -0.8509521484375, -0.7548828125, -0.6588134765625, -0.562744140625, -0.4666748046875, -0.37060546875, -0.2745361328125, -0.178466796875, -0.0823974609375, 0.013671875, 0.1097412109375, 0.205810546875, 0.3018798828125, 0.39794921875, 0.4940185546875, 0.590087890625, 0.6861572265625, 0.7822265625, 0.8782958984375, 0.974365234375, 1.0704345703125, 1.16650390625, 1.2625732421875, 1.358642578125, 1.4547119140625, 1.55078125, 1.6468505859375, 1.742919921875, 1.8389892578125, 1.93505859375, 2.0311279296875, 2.127197265625, 2.2232666015625, 2.3193359375, 2.4154052734375, 2.511474609375, 2.6075439453125, 2.70361328125, 2.7996826171875, 2.895751953125, 2.9918212890625, 3.087890625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 16.0, 11.0, 16.0, 25.0, 20.0, 25.0, 36.0, 39.0, 44.0, 49.0, 42.0, 46.0, 51.0, 48.0, 62.0, 57.0, 54.0, 46.0, 48.0, 40.0, 33.0, 35.0, 33.0, 15.0, 19.0, 18.0, 11.0, 13.0, 7.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.38981628417969, -33.34634780883789, -32.302879333496094, -31.25940704345703, -30.215938568115234, -29.172470092773438, -28.128999710083008, -27.085529327392578, -26.04206085205078, -24.998592376708984, -23.955121994018555, -22.911651611328125, -21.868183135986328, -20.82471466064453, -19.7812442779541, -18.737773895263672, -17.694305419921875, -16.650836944580078, -15.607366561889648, -14.563897132873535, -13.520427703857422, -12.476958274841309, -11.433488845825195, -10.390019416809082, -9.346549987792969, -8.303080558776855, -7.259611129760742, -6.216141700744629, -5.172672271728516, -4.129202842712402, -3.085733413696289, -2.042263984680176, -0.9987983703613281, 0.044671058654785156, 1.0881404876708984, 2.1316099166870117, 3.175079345703125, 4.218548774719238, 5.262018203735352, 6.305487632751465, 7.348957061767578, 8.392426490783691, 9.435895919799805, 10.479365348815918, 11.522834777832031, 12.566304206848145, 13.609773635864258, 14.653243064880371, 15.696712493896484, 16.74018096923828, 17.78365135192871, 18.82712173461914, 19.870590209960938, 20.914058685302734, 21.957529067993164, 23.000999450683594, 24.04446792602539, 25.087936401367188, 26.131406784057617, 27.174877166748047, 28.218345642089844, 29.26181411743164, 30.30528450012207, 31.3487548828125, 32.3922233581543]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 8.0, 14.0, 17.0, 14.0, 26.0, 18.0, 16.0, 29.0, 25.0, 31.0, 33.0, 45.0, 35.0, 39.0, 43.0, 38.0, 44.0, 56.0, 37.0, 45.0, 42.0, 29.0, 36.0, 37.0, 32.0, 29.0, 23.0, 23.0, 20.0, 19.0, 13.0, 13.0, 9.0, 15.0, 9.0, 9.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.09646224975586, -42.79240417480469, -41.488346099853516, -40.184288024902344, -38.88023376464844, -37.576175689697266, -36.272117614746094, -34.96805953979492, -33.66400146484375, -32.35994338989258, -31.055885314941406, -29.751829147338867, -28.447771072387695, -27.143712997436523, -25.839656829833984, -24.535598754882812, -23.23154067993164, -21.92748260498047, -20.623424530029297, -19.319368362426758, -18.015310287475586, -16.711252212524414, -15.407195091247559, -14.103137969970703, -12.799079895019531, -11.49502182006836, -10.190964698791504, -8.886907577514648, -7.582849502563477, -6.278791904449463, -4.974734306335449, -3.6706771850585938, -2.3666152954101562, -1.0625576972961426, 0.2414999008178711, 1.5455574989318848, 2.8496150970458984, 4.153672695159912, 5.457730293273926, 6.761787414550781, 8.065845489501953, 9.369903564453125, 10.67396068572998, 11.978017807006836, 13.282075881958008, 14.58613395690918, 15.890191078186035, 17.19424819946289, 18.498306274414062, 19.802364349365234, 21.106422424316406, 22.410478591918945, 23.714536666870117, 25.01859474182129, 26.322650909423828, 27.626708984375, 28.930767059326172, 30.234825134277344, 31.538883209228516, 32.84294128417969, 34.146995544433594, 35.451053619384766, 36.75511169433594, 38.05916976928711, 39.36322784423828]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 12.0, 14.0, 28.0, 40.0, 66.0, 120.0, 155.0, 258.0, 434.0, 678.0, 1046.0, 1699.0, 2582.0, 4253.0, 6704.0, 10714.0, 16490.0, 25650.0, 39476.0, 59770.0, 88193.0, 126751.0, 176667.0, 236538.0, 301726.0, 360497.0, 403562.0, 420144.0, 406825.0, 364230.0, 307038.0, 241676.0, 182192.0, 132353.0, 92761.0, 63300.0, 42078.0, 27462.0, 18109.0, 11595.0, 7555.0, 4814.0, 2978.0, 1905.0, 1179.0, 733.0, 442.0, 304.0, 185.0, 111.0, 73.0, 60.0, 23.0, 18.0, 8.0, 12.0, 6.0, 2.0], "bins": [-25.828125, -25.058837890625, -24.28955078125, -23.520263671875, -22.7509765625, -21.981689453125, -21.21240234375, -20.443115234375, -19.673828125, -18.904541015625, -18.13525390625, -17.365966796875, -16.5966796875, -15.827392578125, -15.05810546875, -14.288818359375, -13.51953125, -12.750244140625, -11.98095703125, -11.211669921875, -10.4423828125, -9.673095703125, -8.90380859375, -8.134521484375, -7.365234375, -6.595947265625, -5.82666015625, -5.057373046875, -4.2880859375, -3.518798828125, -2.74951171875, -1.980224609375, -1.2109375, -0.441650390625, 0.32763671875, 1.096923828125, 1.8662109375, 2.635498046875, 3.40478515625, 4.174072265625, 4.943359375, 5.712646484375, 6.48193359375, 7.251220703125, 8.0205078125, 8.789794921875, 9.55908203125, 10.328369140625, 11.09765625, 11.866943359375, 12.63623046875, 13.405517578125, 14.1748046875, 14.944091796875, 15.71337890625, 16.482666015625, 17.251953125, 18.021240234375, 18.79052734375, 19.559814453125, 20.3291015625, 21.098388671875, 21.86767578125, 22.636962890625, 23.40625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 11.0, 6.0, 9.0, 9.0, 14.0, 20.0, 18.0, 18.0, 18.0, 22.0, 19.0, 20.0, 38.0, 25.0, 29.0, 37.0, 36.0, 44.0, 39.0, 39.0, 41.0, 53.0, 36.0, 30.0, 33.0, 26.0, 35.0, 34.0, 32.0, 27.0, 22.0, 22.0, 15.0, 22.0, 15.0, 15.0, 13.0, 11.0, 6.0, 7.0, 10.0, 9.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-35.15625, -34.078125, -33.0, -31.921875, -30.84375, -29.765625, -28.6875, -27.609375, -26.53125, -25.453125, -24.375, -23.296875, -22.21875, -21.140625, -20.0625, -18.984375, -17.90625, -16.828125, -15.75, -14.671875, -13.59375, -12.515625, -11.4375, -10.359375, -9.28125, -8.203125, -7.125, -6.046875, -4.96875, -3.890625, -2.8125, -1.734375, -0.65625, 0.421875, 1.5, 2.578125, 3.65625, 4.734375, 5.8125, 6.890625, 7.96875, 9.046875, 10.125, 11.203125, 12.28125, 13.359375, 14.4375, 15.515625, 16.59375, 17.671875, 18.75, 19.828125, 20.90625, 21.984375, 23.0625, 24.140625, 25.21875, 26.296875, 27.375, 28.453125, 29.53125, 30.609375, 31.6875, 32.765625, 33.84375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 11.0, 7.0, 30.0, 43.0, 72.0, 114.0, 196.0, 317.0, 504.0, 877.0, 1462.0, 2360.0, 3945.0, 6330.0, 10304.0, 16790.0, 26721.0, 41941.0, 64373.0, 96580.0, 140106.0, 195467.0, 259375.0, 325622.0, 382360.0, 418656.0, 426410.0, 403447.0, 354188.0, 291336.0, 225636.0, 164738.0, 116133.0, 78285.0, 51922.0, 33115.0, 20798.0, 13028.0, 8046.0, 5061.0, 2951.0, 1852.0, 1083.0, 693.0, 367.0, 220.0, 146.0, 101.0, 56.0, 40.0, 25.0, 12.0, 12.0, 6.0, 5.0, 0.0, 3.0, 2.0], "bins": [-28.46875, -27.585693359375, -26.70263671875, -25.819580078125, -24.9365234375, -24.053466796875, -23.17041015625, -22.287353515625, -21.404296875, -20.521240234375, -19.63818359375, -18.755126953125, -17.8720703125, -16.989013671875, -16.10595703125, -15.222900390625, -14.33984375, -13.456787109375, -12.57373046875, -11.690673828125, -10.8076171875, -9.924560546875, -9.04150390625, -8.158447265625, -7.275390625, -6.392333984375, -5.50927734375, -4.626220703125, -3.7431640625, -2.860107421875, -1.97705078125, -1.093994140625, -0.2109375, 0.672119140625, 1.55517578125, 2.438232421875, 3.3212890625, 4.204345703125, 5.08740234375, 5.970458984375, 6.853515625, 7.736572265625, 8.61962890625, 9.502685546875, 10.3857421875, 11.268798828125, 12.15185546875, 13.034912109375, 13.91796875, 14.801025390625, 15.68408203125, 16.567138671875, 17.4501953125, 18.333251953125, 19.21630859375, 20.099365234375, 20.982421875, 21.865478515625, 22.74853515625, 23.631591796875, 24.5146484375, 25.397705078125, 26.28076171875, 27.163818359375, 28.046875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 6.0, 4.0, 12.0, 15.0, 20.0, 17.0, 34.0, 41.0, 45.0, 48.0, 73.0, 94.0, 94.0, 118.0, 118.0, 146.0, 140.0, 161.0, 179.0, 199.0, 211.0, 199.0, 230.0, 183.0, 209.0, 198.0, 154.0, 159.0, 153.0, 119.0, 113.0, 102.0, 81.0, 76.0, 70.0, 56.0, 38.0, 33.0, 29.0, 29.0, 23.0, 10.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-17.328125, -16.766845703125, -16.20556640625, -15.644287109375, -15.0830078125, -14.521728515625, -13.96044921875, -13.399169921875, -12.837890625, -12.276611328125, -11.71533203125, -11.154052734375, -10.5927734375, -10.031494140625, -9.47021484375, -8.908935546875, -8.34765625, -7.786376953125, -7.22509765625, -6.663818359375, -6.1025390625, -5.541259765625, -4.97998046875, -4.418701171875, -3.857421875, -3.296142578125, -2.73486328125, -2.173583984375, -1.6123046875, -1.051025390625, -0.48974609375, 0.071533203125, 0.6328125, 1.194091796875, 1.75537109375, 2.316650390625, 2.8779296875, 3.439208984375, 4.00048828125, 4.561767578125, 5.123046875, 5.684326171875, 6.24560546875, 6.806884765625, 7.3681640625, 7.929443359375, 8.49072265625, 9.052001953125, 9.61328125, 10.174560546875, 10.73583984375, 11.297119140625, 11.8583984375, 12.419677734375, 12.98095703125, 13.542236328125, 14.103515625, 14.664794921875, 15.22607421875, 15.787353515625, 16.3486328125, 16.909912109375, 17.47119140625, 18.032470703125, 18.59375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 6.0, 10.0, 18.0, 22.0, 24.0, 29.0, 40.0, 48.0, 54.0, 54.0, 63.0, 69.0, 76.0, 65.0, 67.0, 66.0, 59.0, 47.0, 32.0, 29.0, 23.0, 18.0, 15.0, 18.0, 15.0, 10.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.15007781982422, -63.26443862915039, -61.37879943847656, -59.49315643310547, -57.60751724243164, -55.72187805175781, -53.836238861083984, -51.950599670410156, -50.06495666503906, -48.179317474365234, -46.293678283691406, -44.40803527832031, -42.522396087646484, -40.636756896972656, -38.75111770629883, -36.865478515625, -34.97983932495117, -33.094200134277344, -31.208559036254883, -29.322919845581055, -27.437278747558594, -25.551639556884766, -23.666000366210938, -21.78036117553711, -19.89472007751465, -18.00908088684082, -16.12343978881836, -14.237800598144531, -12.352160453796387, -10.466520309448242, -8.580881118774414, -6.6952409744262695, -4.809597015380859, -2.923957109451294, -1.0383172035217285, 0.8473224639892578, 2.7329626083374023, 4.618602752685547, 6.504241943359375, 8.38988208770752, 10.275522232055664, 12.161162376403809, 14.046802520751953, 15.932441711425781, 17.81808090209961, 19.70372200012207, 21.5893611907959, 23.47500228881836, 25.360641479492188, 27.246280670166016, 29.131921768188477, 31.017560958862305, 32.903202056884766, 34.788841247558594, 36.67448043823242, 38.56011962890625, 40.445762634277344, 42.33140182495117, 44.217041015625, 46.102684020996094, 47.98832321166992, 49.87396240234375, 51.75960159301758, 53.645240783691406, 55.530879974365234]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 8.0, 0.0, 11.0, 9.0, 17.0, 10.0, 10.0, 14.0, 27.0, 27.0, 22.0, 27.0, 30.0, 41.0, 42.0, 33.0, 42.0, 51.0, 40.0, 31.0, 31.0, 40.0, 40.0, 39.0, 37.0, 45.0, 33.0, 47.0, 21.0, 22.0, 26.0, 18.0, 16.0, 23.0, 11.0, 10.0, 9.0, 13.0, 10.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.76868438720703, -51.064918518066406, -49.361148834228516, -47.65738296508789, -45.95361328125, -44.249847412109375, -42.54608154296875, -40.842315673828125, -39.138545989990234, -37.43478012084961, -35.73101043701172, -34.027244567871094, -32.32347869873047, -30.619709014892578, -28.915943145751953, -27.212175369262695, -25.508407592773438, -23.80463981628418, -22.100872039794922, -20.397106170654297, -18.69333839416504, -16.98957061767578, -15.28580379486084, -13.582036972045898, -11.87826919555664, -10.174501419067383, -8.470734596252441, -6.766967296600342, -5.063199996948242, -3.3594322204589844, -1.655665397644043, 0.04810142517089844, 1.7518692016601562, 3.455636501312256, 5.1594038009643555, 6.863171100616455, 8.566938400268555, 10.270706176757812, 11.974472999572754, 13.678239822387695, 15.382007598876953, 17.08577537536621, 18.78954315185547, 20.493309020996094, 22.19707679748535, 23.90084457397461, 25.604610443115234, 27.308378219604492, 29.01214599609375, 30.715913772583008, 32.419681549072266, 34.12344741821289, 35.82721710205078, 37.530982971191406, 39.23474884033203, 40.938514709472656, 42.64228439331055, 44.34605026245117, 46.04981994628906, 47.75358581542969, 49.45735168457031, 51.1611213684082, 52.86488723754883, 54.56865692138672, 56.272422790527344]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 13.0, 18.0, 19.0, 36.0, 47.0, 97.0, 147.0, 217.0, 378.0, 648.0, 1088.0, 1877.0, 3134.0, 5627.0, 9568.0, 16687.0, 29597.0, 52634.0, 93312.0, 160563.0, 232146.0, 185785.0, 110371.0, 62543.0, 35311.0, 19897.0, 11242.0, 6521.0, 3724.0, 2151.0, 1295.0, 741.0, 436.0, 249.0, 175.0, 90.0, 58.0, 47.0, 21.0, 11.0, 12.0, 6.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.59173583984375, -4.4256591796875, -4.25958251953125, -4.093505859375, -3.92742919921875, -3.7613525390625, -3.59527587890625, -3.42919921875, -3.26312255859375, -3.0970458984375, -2.93096923828125, -2.764892578125, -2.59881591796875, -2.4327392578125, -2.26666259765625, -2.1005859375, -1.93450927734375, -1.7684326171875, -1.60235595703125, -1.436279296875, -1.27020263671875, -1.1041259765625, -0.93804931640625, -0.77197265625, -0.60589599609375, -0.4398193359375, -0.27374267578125, -0.107666015625, 0.05841064453125, 0.2244873046875, 0.39056396484375, 0.556640625, 0.72271728515625, 0.8887939453125, 1.05487060546875, 1.220947265625, 1.38702392578125, 1.5531005859375, 1.71917724609375, 1.88525390625, 2.05133056640625, 2.2174072265625, 2.38348388671875, 2.549560546875, 2.71563720703125, 2.8817138671875, 3.04779052734375, 3.2138671875, 3.37994384765625, 3.5460205078125, 3.71209716796875, 3.878173828125, 4.04425048828125, 4.2103271484375, 4.37640380859375, 4.54248046875, 4.70855712890625, 4.8746337890625, 5.04071044921875, 5.206787109375, 5.37286376953125, 5.5389404296875, 5.70501708984375, 5.87109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 11.0, 8.0, 5.0, 15.0, 16.0, 17.0, 18.0, 29.0, 38.0, 33.0, 35.0, 41.0, 28.0, 46.0, 33.0, 51.0, 43.0, 50.0, 46.0, 35.0, 32.0, 41.0, 42.0, 35.0, 38.0, 26.0, 27.0, 24.0, 17.0, 12.0, 20.0, 18.0, 16.0, 5.0, 16.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.90625, -52.07958984375, -50.2529296875, -48.42626953125, -46.599609375, -44.77294921875, -42.9462890625, -41.11962890625, -39.29296875, -37.46630859375, -35.6396484375, -33.81298828125, -31.986328125, -30.15966796875, -28.3330078125, -26.50634765625, -24.6796875, -22.85302734375, -21.0263671875, -19.19970703125, -17.373046875, -15.54638671875, -13.7197265625, -11.89306640625, -10.06640625, -8.23974609375, -6.4130859375, -4.58642578125, -2.759765625, -0.93310546875, 0.8935546875, 2.72021484375, 4.546875, 6.37353515625, 8.2001953125, 10.02685546875, 11.853515625, 13.68017578125, 15.5068359375, 17.33349609375, 19.16015625, 20.98681640625, 22.8134765625, 24.64013671875, 26.466796875, 28.29345703125, 30.1201171875, 31.94677734375, 33.7734375, 35.60009765625, 37.4267578125, 39.25341796875, 41.080078125, 42.90673828125, 44.7333984375, 46.56005859375, 48.38671875, 50.21337890625, 52.0400390625, 53.86669921875, 55.693359375, 57.52001953125, 59.3466796875, 61.17333984375, 63.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 17.0, 16.0, 27.0, 30.0, 52.0, 72.0, 105.0, 153.0, 197.0, 285.0, 430.0, 697.0, 1001.0, 1474.0, 2272.0, 3230.0, 4933.0, 7635.0, 11790.0, 17889.0, 27723.0, 43167.0, 67090.0, 101481.0, 146042.0, 179393.0, 144119.0, 99916.0, 65997.0, 42475.0, 27345.0, 17687.0, 11575.0, 7390.0, 4867.0, 3244.0, 2130.0, 1484.0, 959.0, 686.0, 491.0, 318.0, 219.0, 126.0, 103.0, 75.0, 38.0, 26.0, 32.0, 18.0, 13.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.26171875, -4.1263427734375, -3.990966796875, -3.8555908203125, -3.72021484375, -3.5848388671875, -3.449462890625, -3.3140869140625, -3.1787109375, -3.0433349609375, -2.907958984375, -2.7725830078125, -2.63720703125, -2.5018310546875, -2.366455078125, -2.2310791015625, -2.095703125, -1.9603271484375, -1.824951171875, -1.6895751953125, -1.55419921875, -1.4188232421875, -1.283447265625, -1.1480712890625, -1.0126953125, -0.8773193359375, -0.741943359375, -0.6065673828125, -0.47119140625, -0.3358154296875, -0.200439453125, -0.0650634765625, 0.0703125, 0.2056884765625, 0.341064453125, 0.4764404296875, 0.61181640625, 0.7471923828125, 0.882568359375, 1.0179443359375, 1.1533203125, 1.2886962890625, 1.424072265625, 1.5594482421875, 1.69482421875, 1.8302001953125, 1.965576171875, 2.1009521484375, 2.236328125, 2.3717041015625, 2.507080078125, 2.6424560546875, 2.77783203125, 2.9132080078125, 3.048583984375, 3.1839599609375, 3.3193359375, 3.4547119140625, 3.590087890625, 3.7254638671875, 3.86083984375, 3.9962158203125, 4.131591796875, 4.2669677734375, 4.40234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 7.0, 2.0, 14.0, 5.0, 13.0, 15.0, 16.0, 16.0, 21.0, 18.0, 27.0, 33.0, 29.0, 32.0, 42.0, 26.0, 46.0, 37.0, 43.0, 38.0, 49.0, 44.0, 34.0, 34.0, 40.0, 47.0, 27.0, 34.0, 31.0, 21.0, 18.0, 25.0, 19.0, 17.0, 10.0, 14.0, 16.0, 7.0, 8.0, 6.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.375, -32.31884765625, -31.2626953125, -30.20654296875, -29.150390625, -28.09423828125, -27.0380859375, -25.98193359375, -24.92578125, -23.86962890625, -22.8134765625, -21.75732421875, -20.701171875, -19.64501953125, -18.5888671875, -17.53271484375, -16.4765625, -15.42041015625, -14.3642578125, -13.30810546875, -12.251953125, -11.19580078125, -10.1396484375, -9.08349609375, -8.02734375, -6.97119140625, -5.9150390625, -4.85888671875, -3.802734375, -2.74658203125, -1.6904296875, -0.63427734375, 0.421875, 1.47802734375, 2.5341796875, 3.59033203125, 4.646484375, 5.70263671875, 6.7587890625, 7.81494140625, 8.87109375, 9.92724609375, 10.9833984375, 12.03955078125, 13.095703125, 14.15185546875, 15.2080078125, 16.26416015625, 17.3203125, 18.37646484375, 19.4326171875, 20.48876953125, 21.544921875, 22.60107421875, 23.6572265625, 24.71337890625, 25.76953125, 26.82568359375, 27.8818359375, 28.93798828125, 29.994140625, 31.05029296875, 32.1064453125, 33.16259765625, 34.21875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 12.0, 10.0, 23.0, 36.0, 39.0, 62.0, 74.0, 111.0, 147.0, 196.0, 283.0, 409.0, 639.0, 944.0, 1284.0, 1814.0, 2813.0, 4130.0, 6171.0, 9820.0, 15755.0, 25638.0, 45435.0, 86973.0, 187168.0, 301762.0, 168705.0, 79110.0, 42260.0, 24233.0, 14779.0, 9285.0, 5849.0, 3950.0, 2735.0, 1802.0, 1246.0, 846.0, 598.0, 393.0, 293.0, 200.0, 130.0, 114.0, 90.0, 53.0, 45.0, 28.0, 22.0, 19.0, 10.0, 5.0, 3.0, 7.0, 3.0, 2.0], "bins": [-0.2159423828125, -0.20948410034179688, -0.20302581787109375, -0.19656753540039062, -0.1901092529296875, -0.18365097045898438, -0.17719268798828125, -0.17073440551757812, -0.164276123046875, -0.15781784057617188, -0.15135955810546875, -0.14490127563476562, -0.1384429931640625, -0.13198471069335938, -0.12552642822265625, -0.11906814575195312, -0.11260986328125, -0.10615158081054688, -0.09969329833984375, -0.09323501586914062, -0.0867767333984375, -0.08031845092773438, -0.07386016845703125, -0.06740188598632812, -0.060943603515625, -0.054485321044921875, -0.04802703857421875, -0.041568756103515625, -0.0351104736328125, -0.028652191162109375, -0.02219390869140625, -0.015735626220703125, -0.00927734375, -0.002819061279296875, 0.00363922119140625, 0.010097503662109375, 0.0165557861328125, 0.023014068603515625, 0.02947235107421875, 0.035930633544921875, 0.042388916015625, 0.048847198486328125, 0.05530548095703125, 0.061763763427734375, 0.0682220458984375, 0.07468032836914062, 0.08113861083984375, 0.08759689331054688, 0.09405517578125, 0.10051345825195312, 0.10697174072265625, 0.11343002319335938, 0.1198883056640625, 0.12634658813476562, 0.13280487060546875, 0.13926315307617188, 0.145721435546875, 0.15217971801757812, 0.15863800048828125, 0.16509628295898438, 0.1715545654296875, 0.17801284790039062, 0.18447113037109375, 0.19092941284179688, 0.1973876953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 9.0, 7.0, 23.0, 15.0, 22.0, 26.0, 30.0, 34.0, 40.0, 46.0, 51.0, 54.0, 40.0, 50.0, 56.0, 57.0, 67.0, 48.0, 41.0, 47.0, 37.0, 38.0, 24.0, 25.0, 25.0, 21.0, 9.0, 13.0, 9.0, 4.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.892183303833008e-05, -3.7590041756629944e-05, -3.625825047492981e-05, -3.4926459193229675e-05, -3.359466791152954e-05, -3.226287662982941e-05, -3.093108534812927e-05, -2.9599294066429138e-05, -2.8267502784729004e-05, -2.693571150302887e-05, -2.5603920221328735e-05, -2.42721289396286e-05, -2.2940337657928467e-05, -2.1608546376228333e-05, -2.0276755094528198e-05, -1.8944963812828064e-05, -1.761317253112793e-05, -1.6281381249427795e-05, -1.4949589967727661e-05, -1.3617798686027527e-05, -1.2286007404327393e-05, -1.0954216122627258e-05, -9.622424840927124e-06, -8.29063355922699e-06, -6.9588422775268555e-06, -5.627050995826721e-06, -4.295259714126587e-06, -2.9634684324264526e-06, -1.6316771507263184e-06, -2.998858690261841e-07, 1.0319054126739502e-06, 2.3636966943740845e-06, 3.6954879760742188e-06, 5.027279257774353e-06, 6.359070539474487e-06, 7.690861821174622e-06, 9.022653102874756e-06, 1.035444438457489e-05, 1.1686235666275024e-05, 1.3018026947975159e-05, 1.4349818229675293e-05, 1.5681609511375427e-05, 1.701340079307556e-05, 1.8345192074775696e-05, 1.967698335647583e-05, 2.1008774638175964e-05, 2.23405659198761e-05, 2.3672357201576233e-05, 2.5004148483276367e-05, 2.63359397649765e-05, 2.7667731046676636e-05, 2.899952232837677e-05, 3.0331313610076904e-05, 3.166310489177704e-05, 3.299489617347717e-05, 3.432668745517731e-05, 3.565847873687744e-05, 3.6990270018577576e-05, 3.832206130027771e-05, 3.9653852581977844e-05, 4.098564386367798e-05, 4.231743514537811e-05, 4.364922642707825e-05, 4.498101770877838e-05, 4.6312808990478516e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 13.0, 15.0, 32.0, 30.0, 58.0, 49.0, 91.0, 123.0, 165.0, 256.0, 340.0, 457.0, 626.0, 907.0, 1345.0, 1861.0, 2778.0, 4056.0, 6044.0, 9290.0, 14621.0, 23472.0, 36911.0, 63514.0, 118299.0, 265799.0, 235773.0, 106804.0, 58262.0, 34440.0, 21315.0, 13565.0, 8755.0, 5871.0, 3927.0, 2630.0, 1789.0, 1245.0, 837.0, 615.0, 413.0, 333.0, 244.0, 176.0, 95.0, 91.0, 54.0, 42.0, 39.0, 17.0, 17.0, 14.0, 10.0, 9.0, 6.0, 3.0, 4.0], "bins": [-0.5478515625, -0.5312118530273438, -0.5145721435546875, -0.49793243408203125, -0.481292724609375, -0.46465301513671875, -0.4480133056640625, -0.43137359619140625, -0.41473388671875, -0.39809417724609375, -0.3814544677734375, -0.36481475830078125, -0.348175048828125, -0.33153533935546875, -0.3148956298828125, -0.29825592041015625, -0.2816162109375, -0.26497650146484375, -0.2483367919921875, -0.23169708251953125, -0.215057373046875, -0.19841766357421875, -0.1817779541015625, -0.16513824462890625, -0.14849853515625, -0.13185882568359375, -0.1152191162109375, -0.09857940673828125, -0.081939697265625, -0.06529998779296875, -0.0486602783203125, -0.03202056884765625, -0.015380859375, 0.00125885009765625, 0.0178985595703125, 0.03453826904296875, 0.051177978515625, 0.06781768798828125, 0.0844573974609375, 0.10109710693359375, 0.11773681640625, 0.13437652587890625, 0.1510162353515625, 0.16765594482421875, 0.184295654296875, 0.20093536376953125, 0.2175750732421875, 0.23421478271484375, 0.2508544921875, 0.26749420166015625, 0.2841339111328125, 0.30077362060546875, 0.317413330078125, 0.33405303955078125, 0.3506927490234375, 0.36733245849609375, 0.38397216796875, 0.40061187744140625, 0.4172515869140625, 0.43389129638671875, 0.450531005859375, 0.46717071533203125, 0.4838104248046875, 0.5004501342773438, 0.51708984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 3.0, 9.0, 10.0, 18.0, 12.0, 15.0, 27.0, 20.0, 30.0, 41.0, 38.0, 53.0, 46.0, 54.0, 76.0, 75.0, 92.0, 54.0, 60.0, 35.0, 28.0, 24.0, 27.0, 28.0, 18.0, 14.0, 17.0, 15.0, 9.0, 6.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.42236328125, -0.4100303649902344, -0.39769744873046875, -0.3853645324707031, -0.3730316162109375, -0.3606986999511719, -0.34836578369140625, -0.3360328674316406, -0.323699951171875, -0.3113670349121094, -0.29903411865234375, -0.2867012023925781, -0.2743682861328125, -0.2620353698730469, -0.24970245361328125, -0.23736953735351562, -0.22503662109375, -0.21270370483398438, -0.20037078857421875, -0.18803787231445312, -0.1757049560546875, -0.16337203979492188, -0.15103912353515625, -0.13870620727539062, -0.126373291015625, -0.11404037475585938, -0.10170745849609375, -0.08937454223632812, -0.0770416259765625, -0.06470870971679688, -0.05237579345703125, -0.040042877197265625, -0.0277099609375, -0.015377044677734375, -0.00304412841796875, 0.009288787841796875, 0.0216217041015625, 0.033954620361328125, 0.04628753662109375, 0.058620452880859375, 0.070953369140625, 0.08328628540039062, 0.09561920166015625, 0.10795211791992188, 0.1202850341796875, 0.13261795043945312, 0.14495086669921875, 0.15728378295898438, 0.16961669921875, 0.18194961547851562, 0.19428253173828125, 0.20661544799804688, 0.2189483642578125, 0.23128128051757812, 0.24361419677734375, 0.2559471130371094, 0.268280029296875, 0.2806129455566406, 0.29294586181640625, 0.3052787780761719, 0.3176116943359375, 0.3299446105957031, 0.34227752685546875, 0.3546104431152344, 0.366943359375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 7.0, 10.0, 22.0, 20.0, 24.0, 33.0, 37.0, 49.0, 57.0, 56.0, 66.0, 66.0, 72.0, 68.0, 69.0, 69.0, 48.0, 51.0, 26.0, 32.0, 21.0, 18.0, 13.0, 19.0, 14.0, 11.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.27672576904297, -63.38839340209961, -61.50006103515625, -59.611732482910156, -57.7234001159668, -55.83506774902344, -53.94673538208008, -52.05840301513672, -50.17007064819336, -48.28173828125, -46.39340591430664, -44.50507354736328, -42.61674499511719, -40.72841262817383, -38.84008026123047, -36.95174789428711, -35.06341552734375, -33.17508316040039, -31.286752700805664, -29.398420333862305, -27.510087966918945, -25.62175750732422, -23.73342514038086, -21.8450927734375, -19.956764221191406, -18.068431854248047, -16.18010139465332, -14.291769027709961, -12.403436660766602, -10.515105247497559, -8.626773834228516, -6.738441467285156, -4.850109100341797, -2.9617772102355957, -1.0734455585479736, 0.8148860931396484, 2.7032179832458496, 4.591549873352051, 6.479881286621094, 8.368213653564453, 10.256545066833496, 12.144876480102539, 14.033208847045898, 15.921540260314941, 17.809871673583984, 19.698204040527344, 21.586536407470703, 23.474868774414062, 25.36319923400879, 27.25153160095215, 29.139862060546875, 31.028194427490234, 32.916526794433594, 34.80485916137695, 36.69319152832031, 38.581520080566406, 40.469852447509766, 42.358184814453125, 44.246517181396484, 46.134849548339844, 48.02317810058594, 49.9115104675293, 51.799842834472656, 53.688175201416016, 55.576507568359375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 7.0, 2.0, 10.0, 9.0, 16.0, 12.0, 9.0, 14.0, 26.0, 29.0, 21.0, 28.0, 30.0, 41.0, 41.0, 39.0, 37.0, 52.0, 41.0, 27.0, 31.0, 42.0, 42.0, 37.0, 38.0, 46.0, 33.0, 44.0, 21.0, 24.0, 27.0, 18.0, 15.0, 22.0, 13.0, 8.0, 8.0, 12.0, 11.0, 3.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.08054733276367, -51.367488861083984, -49.6544303894043, -47.94137191772461, -46.22831344604492, -44.515254974365234, -42.80219268798828, -41.089134216308594, -39.376075744628906, -37.66301727294922, -35.94995880126953, -34.236900329589844, -32.523841857910156, -30.81078338623047, -29.09772300720215, -27.38466453552246, -25.671607971191406, -23.95854949951172, -22.24549102783203, -20.532432556152344, -18.819374084472656, -17.10631561279297, -15.393255233764648, -13.680196762084961, -11.967138290405273, -10.254079818725586, -8.541021347045898, -6.8279619216918945, -5.114903450012207, -3.4018449783325195, -1.6887855529785156, 0.024272918701171875, 1.7373275756835938, 3.4503862857818604, 5.163444995880127, 6.876503944396973, 8.58956241607666, 10.302620887756348, 12.015680313110352, 13.728738784790039, 15.441797256469727, 17.154855728149414, 18.8679141998291, 20.580974578857422, 22.29403305053711, 24.007091522216797, 25.720149993896484, 27.433208465576172, 29.14626693725586, 30.859325408935547, 32.572383880615234, 34.28544235229492, 35.99850082397461, 37.7115592956543, 39.42462158203125, 41.13768005371094, 42.850738525390625, 44.56379699707031, 46.27685546875, 47.98991394042969, 49.702972412109375, 51.41603088378906, 53.12908935546875, 54.84214782714844, 56.555206298828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 21.0, 28.0, 41.0, 91.0, 157.0, 166.0, 318.0, 459.0, 741.0, 1132.0, 1765.0, 2841.0, 4360.0, 6856.0, 10604.0, 15942.0, 24131.0, 35836.0, 50087.0, 67493.0, 85575.0, 101329.0, 110274.0, 110864.0, 102100.0, 86894.0, 68967.0, 51010.0, 36746.0, 24783.0, 16635.0, 10747.0, 6957.0, 4536.0, 2836.0, 1829.0, 1155.0, 775.0, 543.0, 339.0, 204.0, 134.0, 74.0, 72.0, 34.0, 20.0, 14.0, 13.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.578125, -18.947265625, -18.31640625, -17.685546875, -17.0546875, -16.423828125, -15.79296875, -15.162109375, -14.53125, -13.900390625, -13.26953125, -12.638671875, -12.0078125, -11.376953125, -10.74609375, -10.115234375, -9.484375, -8.853515625, -8.22265625, -7.591796875, -6.9609375, -6.330078125, -5.69921875, -5.068359375, -4.4375, -3.806640625, -3.17578125, -2.544921875, -1.9140625, -1.283203125, -0.65234375, -0.021484375, 0.609375, 1.240234375, 1.87109375, 2.501953125, 3.1328125, 3.763671875, 4.39453125, 5.025390625, 5.65625, 6.287109375, 6.91796875, 7.548828125, 8.1796875, 8.810546875, 9.44140625, 10.072265625, 10.703125, 11.333984375, 11.96484375, 12.595703125, 13.2265625, 13.857421875, 14.48828125, 15.119140625, 15.75, 16.380859375, 17.01171875, 17.642578125, 18.2734375, 18.904296875, 19.53515625, 20.166015625, 20.796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 15.0, 12.0, 11.0, 12.0, 16.0, 25.0, 25.0, 31.0, 27.0, 35.0, 39.0, 42.0, 49.0, 48.0, 40.0, 45.0, 34.0, 38.0, 41.0, 45.0, 42.0, 45.0, 38.0, 40.0, 26.0, 24.0, 13.0, 19.0, 26.0, 21.0, 11.0, 15.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 6.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.0, -52.2314453125, -50.462890625, -48.6943359375, -46.92578125, -45.1572265625, -43.388671875, -41.6201171875, -39.8515625, -38.0830078125, -36.314453125, -34.5458984375, -32.77734375, -31.0087890625, -29.240234375, -27.4716796875, -25.703125, -23.9345703125, -22.166015625, -20.3974609375, -18.62890625, -16.8603515625, -15.091796875, -13.3232421875, -11.5546875, -9.7861328125, -8.017578125, -6.2490234375, -4.48046875, -2.7119140625, -0.943359375, 0.8251953125, 2.59375, 4.3623046875, 6.130859375, 7.8994140625, 9.66796875, 11.4365234375, 13.205078125, 14.9736328125, 16.7421875, 18.5107421875, 20.279296875, 22.0478515625, 23.81640625, 25.5849609375, 27.353515625, 29.1220703125, 30.890625, 32.6591796875, 34.427734375, 36.1962890625, 37.96484375, 39.7333984375, 41.501953125, 43.2705078125, 45.0390625, 46.8076171875, 48.576171875, 50.3447265625, 52.11328125, 53.8818359375, 55.650390625, 57.4189453125, 59.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 19.0, 16.0, 22.0, 44.0, 60.0, 83.0, 123.0, 145.0, 234.0, 360.0, 551.0, 814.0, 1250.0, 1836.0, 2973.0, 4630.0, 7289.0, 11199.0, 17448.0, 26423.0, 39439.0, 56020.0, 76027.0, 96106.0, 111634.0, 117790.0, 113858.0, 99613.0, 79728.0, 59177.0, 41811.0, 28487.0, 18747.0, 12368.0, 7855.0, 5118.0, 3174.0, 2108.0, 1335.0, 888.0, 600.0, 399.0, 246.0, 168.0, 105.0, 64.0, 54.0, 43.0, 25.0, 13.0, 9.0, 9.0, 6.0, 1.0, 5.0, 0.0, 3.0, 1.0], "bins": [-23.9375, -23.1796875, -22.421875, -21.6640625, -20.90625, -20.1484375, -19.390625, -18.6328125, -17.875, -17.1171875, -16.359375, -15.6015625, -14.84375, -14.0859375, -13.328125, -12.5703125, -11.8125, -11.0546875, -10.296875, -9.5390625, -8.78125, -8.0234375, -7.265625, -6.5078125, -5.75, -4.9921875, -4.234375, -3.4765625, -2.71875, -1.9609375, -1.203125, -0.4453125, 0.3125, 1.0703125, 1.828125, 2.5859375, 3.34375, 4.1015625, 4.859375, 5.6171875, 6.375, 7.1328125, 7.890625, 8.6484375, 9.40625, 10.1640625, 10.921875, 11.6796875, 12.4375, 13.1953125, 13.953125, 14.7109375, 15.46875, 16.2265625, 16.984375, 17.7421875, 18.5, 19.2578125, 20.015625, 20.7734375, 21.53125, 22.2890625, 23.046875, 23.8046875, 24.5625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 4.0, 10.0, 5.0, 9.0, 7.0, 14.0, 11.0, 14.0, 21.0, 31.0, 16.0, 19.0, 35.0, 36.0, 33.0, 35.0, 38.0, 44.0, 45.0, 35.0, 44.0, 47.0, 42.0, 35.0, 34.0, 36.0, 35.0, 31.0, 37.0, 29.0, 26.0, 19.0, 20.0, 15.0, 22.0, 16.0, 11.0, 10.0, 3.0, 4.0, 3.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-34.5, -33.44873046875, -32.3974609375, -31.34619140625, -30.294921875, -29.24365234375, -28.1923828125, -27.14111328125, -26.08984375, -25.03857421875, -23.9873046875, -22.93603515625, -21.884765625, -20.83349609375, -19.7822265625, -18.73095703125, -17.6796875, -16.62841796875, -15.5771484375, -14.52587890625, -13.474609375, -12.42333984375, -11.3720703125, -10.32080078125, -9.26953125, -8.21826171875, -7.1669921875, -6.11572265625, -5.064453125, -4.01318359375, -2.9619140625, -1.91064453125, -0.859375, 0.19189453125, 1.2431640625, 2.29443359375, 3.345703125, 4.39697265625, 5.4482421875, 6.49951171875, 7.55078125, 8.60205078125, 9.6533203125, 10.70458984375, 11.755859375, 12.80712890625, 13.8583984375, 14.90966796875, 15.9609375, 17.01220703125, 18.0634765625, 19.11474609375, 20.166015625, 21.21728515625, 22.2685546875, 23.31982421875, 24.37109375, 25.42236328125, 26.4736328125, 27.52490234375, 28.576171875, 29.62744140625, 30.6787109375, 31.72998046875, 32.78125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 13.0, 16.0, 28.0, 61.0, 81.0, 130.0, 277.0, 400.0, 736.0, 1223.0, 1989.0, 3359.0, 5640.0, 9215.0, 14941.0, 23041.0, 34540.0, 48988.0, 65776.0, 83441.0, 99303.0, 108278.0, 110289.0, 103473.0, 90602.0, 73492.0, 56003.0, 39530.0, 27473.0, 17615.0, 11272.0, 7056.0, 4162.0, 2442.0, 1537.0, 873.0, 513.0, 300.0, 160.0, 115.0, 76.0, 39.0, 17.0, 18.0, 6.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.15625, -8.8885498046875, -8.620849609375, -8.3531494140625, -8.08544921875, -7.8177490234375, -7.550048828125, -7.2823486328125, -7.0146484375, -6.7469482421875, -6.479248046875, -6.2115478515625, -5.94384765625, -5.6761474609375, -5.408447265625, -5.1407470703125, -4.873046875, -4.6053466796875, -4.337646484375, -4.0699462890625, -3.80224609375, -3.5345458984375, -3.266845703125, -2.9991455078125, -2.7314453125, -2.4637451171875, -2.196044921875, -1.9283447265625, -1.66064453125, -1.3929443359375, -1.125244140625, -0.8575439453125, -0.58984375, -0.3221435546875, -0.054443359375, 0.2132568359375, 0.48095703125, 0.7486572265625, 1.016357421875, 1.2840576171875, 1.5517578125, 1.8194580078125, 2.087158203125, 2.3548583984375, 2.62255859375, 2.8902587890625, 3.157958984375, 3.4256591796875, 3.693359375, 3.9610595703125, 4.228759765625, 4.4964599609375, 4.76416015625, 5.0318603515625, 5.299560546875, 5.5672607421875, 5.8349609375, 6.1026611328125, 6.370361328125, 6.6380615234375, 6.90576171875, 7.1734619140625, 7.441162109375, 7.7088623046875, 7.9765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 6.0, 9.0, 10.0, 19.0, 17.0, 23.0, 20.0, 26.0, 24.0, 28.0, 19.0, 34.0, 38.0, 46.0, 47.0, 46.0, 47.0, 45.0, 42.0, 37.0, 49.0, 41.0, 46.0, 23.0, 34.0, 38.0, 21.0, 26.0, 27.0, 26.0, 13.0, 13.0, 13.0, 15.0, 8.0, 3.0, 7.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0010652542114257812, -0.0010346770286560059, -0.0010040998458862305, -0.0009735226631164551, -0.0009429454803466797, -0.0009123682975769043, -0.0008817911148071289, -0.0008512139320373535, -0.0008206367492675781, -0.0007900595664978027, -0.0007594823837280273, -0.000728905200958252, -0.0006983280181884766, -0.0006677508354187012, -0.0006371736526489258, -0.0006065964698791504, -0.000576019287109375, -0.0005454421043395996, -0.0005148649215698242, -0.00048428773880004883, -0.00045371055603027344, -0.00042313337326049805, -0.00039255619049072266, -0.00036197900772094727, -0.0003314018249511719, -0.0003008246421813965, -0.0002702474594116211, -0.0002396702766418457, -0.0002090930938720703, -0.00017851591110229492, -0.00014793872833251953, -0.00011736154556274414, -8.678436279296875e-05, -5.620718002319336e-05, -2.562999725341797e-05, 4.947185516357422e-06, 3.552436828613281e-05, 6.61015510559082e-05, 9.66787338256836e-05, 0.00012725591659545898, 0.00015783309936523438, 0.00018841028213500977, 0.00021898746490478516, 0.00024956464767456055, 0.00028014183044433594, 0.00031071901321411133, 0.0003412961959838867, 0.0003718733787536621, 0.0004024505615234375, 0.0004330277442932129, 0.0004636049270629883, 0.0004941821098327637, 0.0005247592926025391, 0.0005553364753723145, 0.0005859136581420898, 0.0006164908409118652, 0.0006470680236816406, 0.000677645206451416, 0.0007082223892211914, 0.0007387995719909668, 0.0007693767547607422, 0.0007999539375305176, 0.000830531120300293, 0.0008611083030700684, 0.0008916854858398438]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 7.0, 11.0, 13.0, 32.0, 36.0, 50.0, 81.0, 160.0, 233.0, 338.0, 654.0, 1083.0, 1858.0, 3166.0, 5708.0, 9558.0, 16109.0, 26567.0, 41004.0, 60908.0, 83586.0, 105027.0, 120090.0, 125515.0, 117192.0, 100428.0, 78121.0, 55719.0, 37398.0, 23558.0, 14198.0, 8368.0, 4928.0, 2831.0, 1639.0, 926.0, 580.0, 347.0, 197.0, 128.0, 73.0, 56.0, 28.0, 20.0, 12.0, 8.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.620849609375, -9.30419921875, -8.987548828125, -8.6708984375, -8.354248046875, -8.03759765625, -7.720947265625, -7.404296875, -7.087646484375, -6.77099609375, -6.454345703125, -6.1376953125, -5.821044921875, -5.50439453125, -5.187744140625, -4.87109375, -4.554443359375, -4.23779296875, -3.921142578125, -3.6044921875, -3.287841796875, -2.97119140625, -2.654541015625, -2.337890625, -2.021240234375, -1.70458984375, -1.387939453125, -1.0712890625, -0.754638671875, -0.43798828125, -0.121337890625, 0.1953125, 0.511962890625, 0.82861328125, 1.145263671875, 1.4619140625, 1.778564453125, 2.09521484375, 2.411865234375, 2.728515625, 3.045166015625, 3.36181640625, 3.678466796875, 3.9951171875, 4.311767578125, 4.62841796875, 4.945068359375, 5.26171875, 5.578369140625, 5.89501953125, 6.211669921875, 6.5283203125, 6.844970703125, 7.16162109375, 7.478271484375, 7.794921875, 8.111572265625, 8.42822265625, 8.744873046875, 9.0615234375, 9.378173828125, 9.69482421875, 10.011474609375, 10.328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 4.0, 3.0, 9.0, 9.0, 14.0, 16.0, 18.0, 27.0, 28.0, 34.0, 47.0, 43.0, 45.0, 49.0, 46.0, 63.0, 72.0, 74.0, 54.0, 48.0, 45.0, 55.0, 28.0, 25.0, 37.0, 26.0, 15.0, 22.0, 15.0, 9.0, 7.0, 8.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.38671875, -5.2247314453125, -5.062744140625, -4.9007568359375, -4.73876953125, -4.5767822265625, -4.414794921875, -4.2528076171875, -4.0908203125, -3.9288330078125, -3.766845703125, -3.6048583984375, -3.44287109375, -3.2808837890625, -3.118896484375, -2.9569091796875, -2.794921875, -2.6329345703125, -2.470947265625, -2.3089599609375, -2.14697265625, -1.9849853515625, -1.822998046875, -1.6610107421875, -1.4990234375, -1.3370361328125, -1.175048828125, -1.0130615234375, -0.85107421875, -0.6890869140625, -0.527099609375, -0.3651123046875, -0.203125, -0.0411376953125, 0.120849609375, 0.2828369140625, 0.44482421875, 0.6068115234375, 0.768798828125, 0.9307861328125, 1.0927734375, 1.2547607421875, 1.416748046875, 1.5787353515625, 1.74072265625, 1.9027099609375, 2.064697265625, 2.2266845703125, 2.388671875, 2.5506591796875, 2.712646484375, 2.8746337890625, 3.03662109375, 3.1986083984375, 3.360595703125, 3.5225830078125, 3.6845703125, 3.8465576171875, 4.008544921875, 4.1705322265625, 4.33251953125, 4.4945068359375, 4.656494140625, 4.8184814453125, 4.98046875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 5.0, 7.0, 7.0, 12.0, 13.0, 18.0, 16.0, 23.0, 34.0, 44.0, 65.0, 58.0, 63.0, 64.0, 86.0, 70.0, 65.0, 58.0, 59.0, 64.0, 39.0, 30.0, 29.0, 16.0, 20.0, 11.0, 9.0, 11.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.45816802978516, -67.41261291503906, -65.36705780029297, -63.32150650024414, -61.27595138549805, -59.23039627075195, -57.184844970703125, -55.13928985595703, -53.09373474121094, -51.048179626464844, -49.00262451171875, -46.95707321166992, -44.91151809692383, -42.865962982177734, -40.820411682128906, -38.77485656738281, -36.72930145263672, -34.683746337890625, -32.63819122314453, -30.592639923095703, -28.54708480834961, -26.501529693603516, -24.455976486206055, -22.410423278808594, -20.3648681640625, -18.319313049316406, -16.273759841918945, -14.228205680847168, -12.18265151977539, -10.137097358703613, -8.091543197631836, -6.045989036560059, -4.000438690185547, -1.9548845291137695, 0.09066963195800781, 2.136223793029785, 4.1817779541015625, 6.22733211517334, 8.272886276245117, 10.318440437316895, 12.363994598388672, 14.40954875946045, 16.455102920532227, 18.500656127929688, 20.54621124267578, 22.591766357421875, 24.637319564819336, 26.682872772216797, 28.72842788696289, 30.773983001708984, 32.81953430175781, 34.865089416503906, 36.91064453125, 38.956199645996094, 41.00175476074219, 43.047306060791016, 45.09286117553711, 47.1384162902832, 49.18396759033203, 51.229522705078125, 53.27507781982422, 55.32063293457031, 57.366188049316406, 59.411739349365234, 61.45729446411133]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 7.0, 12.0, 5.0, 8.0, 9.0, 17.0, 12.0, 14.0, 23.0, 20.0, 34.0, 32.0, 38.0, 37.0, 33.0, 46.0, 43.0, 39.0, 42.0, 48.0, 44.0, 49.0, 37.0, 39.0, 37.0, 26.0, 37.0, 34.0, 35.0, 14.0, 24.0, 18.0, 24.0, 13.0, 10.0, 10.0, 10.0, 6.0, 3.0, 2.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.278377532958984, -60.16998291015625, -58.061588287353516, -55.95319366455078, -53.84479904174805, -51.73640441894531, -49.628013610839844, -47.519615173339844, -45.411224365234375, -43.30282974243164, -41.194435119628906, -39.08604049682617, -36.97764587402344, -34.8692512512207, -32.76085662841797, -30.652463912963867, -28.5440673828125, -26.435672760009766, -24.32727813720703, -22.218883514404297, -20.110488891601562, -18.002094268798828, -15.893701553344727, -13.785306930541992, -11.676912307739258, -9.568517684936523, -7.460123538970947, -5.351729393005371, -3.2433347702026367, -1.1349401473999023, 0.9734535217285156, 3.08184814453125, 5.19024658203125, 7.298641204833984, 9.407035827636719, 11.515429496765137, 13.623824119567871, 15.732218742370605, 17.840612411499023, 19.949007034301758, 22.057401657104492, 24.165796279907227, 26.27419090270996, 28.382583618164062, 30.490978240966797, 32.59937286376953, 34.707767486572266, 36.816162109375, 38.924556732177734, 41.03295135498047, 43.1413459777832, 45.24974060058594, 47.35813522338867, 49.466529846191406, 51.574920654296875, 53.683319091796875, 55.791709899902344, 57.90010452270508, 60.00849914550781, 62.11689376831055, 64.22528839111328, 66.33367919921875, 68.44207763671875, 70.55046844482422, 72.65886688232422]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 10.0, 19.0, 25.0, 47.0, 47.0, 73.0, 133.0, 147.0, 220.0, 303.0, 410.0, 644.0, 837.0, 1200.0, 1648.0, 2229.0, 2930.0, 3976.0, 5010.0, 6410.0, 1002349.0, 5539.0, 4209.0, 3225.0, 2522.0, 1765.0, 1328.0, 967.0, 673.0, 470.0, 354.0, 253.0, 187.0, 119.0, 92.0, 64.0, 54.0, 37.0, 23.0, 12.0, 8.0, 12.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-445.0298767089844, -431.61474609375, -418.19964599609375, -404.7845153808594, -391.3694152832031, -377.95428466796875, -364.5391845703125, -351.1240539550781, -337.70892333984375, -324.2937927246094, -310.8786926269531, -297.46356201171875, -284.0484619140625, -270.6333312988281, -257.21820068359375, -243.8031005859375, -230.38800048828125, -216.97288513183594, -203.55776977539062, -190.14263916015625, -176.7275390625, -163.31240844726562, -149.8972930908203, -136.482177734375, -123.06706237792969, -109.65194702148438, -96.23683166503906, -82.82170867919922, -69.4065933227539, -55.991477966308594, -42.57635498046875, -29.161239624023438, -15.746124267578125, -2.3310070037841797, 11.084110260009766, 24.499229431152344, 37.914344787597656, 51.32946014404297, 64.74458312988281, 78.15969848632812, 91.57481384277344, 104.98992919921875, 118.40504455566406, 131.82015991210938, 145.23529052734375, 158.650390625, 172.06552124023438, 185.4806365966797, 198.895751953125, 212.3108673095703, 225.72598266601562, 239.14111328125, 252.55621337890625, 265.9713439941406, 279.386474609375, 292.80157470703125, 306.2166748046875, 319.6318054199219, 333.0469055175781, 346.4620361328125, 359.87713623046875, 373.2922668457031, 386.7073974609375, 400.12249755859375, 413.5376281738281]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 3.0, 9.0, 11.0, 16.0, 20.0, 28.0, 27.0, 25.0, 35.0, 50.0, 36.0, 51.0, 55.0, 79.0, 78.0, 131.0, 222.0, 388.0, 667.0, 1119.0, 2091.0, 3698.0, 7303.0, 15105.0, 27565.0, 56314.0, 51245740.0, 53498.0, 27203.0, 14238.0, 7138.0, 3511.0, 1936.0, 1064.0, 655.0, 354.0, 209.0, 148.0, 93.0, 61.0, 60.0, 44.0, 34.0, 38.0, 42.0, 22.0, 36.0, 20.0, 18.0, 10.0, 11.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-858.0, -831.578125, -805.15625, -778.734375, -752.3125, -725.890625, -699.46875, -673.046875, -646.625, -620.203125, -593.78125, -567.359375, -540.9375, -514.515625, -488.09375, -461.671875, -435.25, -408.828125, -382.40625, -355.984375, -329.5625, -303.140625, -276.71875, -250.296875, -223.875, -197.453125, -171.03125, -144.609375, -118.1875, -91.765625, -65.34375, -38.921875, -12.5, 13.921875, 40.34375, 66.765625, 93.1875, 119.609375, 146.03125, 172.453125, 198.875, 225.296875, 251.71875, 278.140625, 304.5625, 330.984375, 357.40625, 383.828125, 410.25, 436.671875, 463.09375, 489.515625, 515.9375, 542.359375, 568.78125, 595.203125, 621.625, 648.046875, 674.46875, 700.890625, 727.3125, 753.734375, 780.15625, 806.578125, 833.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 10.0, 27.0, 38.0, 28.0, 46.0, 70.0, 89.0, 133.0, 186.0, 240.0, 405.0, 543.0, 763.0, 1017.0, 1736.0, 2413.0, 3424.0, 5581.0, 9158.0, 15032.0, 25363.0, 46589.0, 90378.0, 185955.0, 425608.0, 2757793.0, 1945058.0, 399962.0, 177455.0, 86596.0, 45182.0, 25295.0, 14265.0, 8534.0, 5519.0, 3465.0, 2345.0, 1529.0, 1096.0, 743.0, 546.0, 357.0, 221.0, 179.0, 129.0, 94.0, 67.0, 48.0, 34.0, 20.0, 16.0, 22.0, 13.0, 7.0, 3.0, 10.0], "bins": [-9.2265625, -8.9549560546875, -8.683349609375, -8.4117431640625, -8.14013671875, -7.8685302734375, -7.596923828125, -7.3253173828125, -7.0537109375, -6.7821044921875, -6.510498046875, -6.2388916015625, -5.96728515625, -5.6956787109375, -5.424072265625, -5.1524658203125, -4.880859375, -4.6092529296875, -4.337646484375, -4.0660400390625, -3.79443359375, -3.5228271484375, -3.251220703125, -2.9796142578125, -2.7080078125, -2.4364013671875, -2.164794921875, -1.8931884765625, -1.62158203125, -1.3499755859375, -1.078369140625, -0.8067626953125, -0.53515625, -0.2635498046875, 0.008056640625, 0.2796630859375, 0.55126953125, 0.8228759765625, 1.094482421875, 1.3660888671875, 1.6376953125, 1.9093017578125, 2.180908203125, 2.4525146484375, 2.72412109375, 2.9957275390625, 3.267333984375, 3.5389404296875, 3.810546875, 4.0821533203125, 4.353759765625, 4.6253662109375, 4.89697265625, 5.1685791015625, 5.440185546875, 5.7117919921875, 5.9833984375, 6.2550048828125, 6.526611328125, 6.7982177734375, 7.06982421875, 7.3414306640625, 7.613037109375, 7.8846435546875, 8.15625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 11.0, 16.0, 15.0, 28.0, 24.0, 16.0, 23.0, 26.0, 22.0, 51.0, 39.0, 48.0, 41.0, 40.0, 44.0, 378.0, 620.0, 111.0, 78.0, 41.0, 48.0, 29.0, 27.0, 37.0, 28.0, 20.0, 29.0, 20.0, 23.0, 15.0, 12.0, 10.0, 6.0, 3.0, 7.0, 5.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-40.78125, -39.647705078125, -38.51416015625, -37.380615234375, -36.2470703125, -35.113525390625, -33.97998046875, -32.846435546875, -31.712890625, -30.579345703125, -29.44580078125, -28.312255859375, -27.1787109375, -26.045166015625, -24.91162109375, -23.778076171875, -22.64453125, -21.510986328125, -20.37744140625, -19.243896484375, -18.1103515625, -16.976806640625, -15.84326171875, -14.709716796875, -13.576171875, -12.442626953125, -11.30908203125, -10.175537109375, -9.0419921875, -7.908447265625, -6.77490234375, -5.641357421875, -4.5078125, -3.374267578125, -2.24072265625, -1.107177734375, 0.0263671875, 1.159912109375, 2.29345703125, 3.427001953125, 4.560546875, 5.694091796875, 6.82763671875, 7.961181640625, 9.0947265625, 10.228271484375, 11.36181640625, 12.495361328125, 13.62890625, 14.762451171875, 15.89599609375, 17.029541015625, 18.1630859375, 19.296630859375, 20.43017578125, 21.563720703125, 22.697265625, 23.830810546875, 24.96435546875, 26.097900390625, 27.2314453125, 28.364990234375, 29.49853515625, 30.632080078125, 31.765625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 8.0, 8.0, 1.0, 8.0, 19.0, 11.0, 11.0, 20.0, 33.0, 42.0, 73.0, 146.0, 159.0, 236.0, 311.0, 433.0, 623.0, 1058.0, 1552.0, 2384.0, 3692.0, 5738.0, 10076.0, 17485.0, 31531.0, 61108.0, 127712.0, 318995.0, 1881770.0, 3208185.0, 342085.0, 133423.0, 63046.0, 32864.0, 18142.0, 10552.0, 6389.0, 4062.0, 2452.0, 1617.0, 1094.0, 740.0, 503.0, 383.0, 233.0, 145.0, 79.0, 68.0, 37.0, 29.0, 30.0, 17.0, 6.0, 8.0, 9.0, 4.0, 2.0, 0.0, 3.0], "bins": [-15.9609375, -15.491943359375, -15.02294921875, -14.553955078125, -14.0849609375, -13.615966796875, -13.14697265625, -12.677978515625, -12.208984375, -11.739990234375, -11.27099609375, -10.802001953125, -10.3330078125, -9.864013671875, -9.39501953125, -8.926025390625, -8.45703125, -7.988037109375, -7.51904296875, -7.050048828125, -6.5810546875, -6.112060546875, -5.64306640625, -5.174072265625, -4.705078125, -4.236083984375, -3.76708984375, -3.298095703125, -2.8291015625, -2.360107421875, -1.89111328125, -1.422119140625, -0.953125, -0.484130859375, -0.01513671875, 0.453857421875, 0.9228515625, 1.391845703125, 1.86083984375, 2.329833984375, 2.798828125, 3.267822265625, 3.73681640625, 4.205810546875, 4.6748046875, 5.143798828125, 5.61279296875, 6.081787109375, 6.55078125, 7.019775390625, 7.48876953125, 7.957763671875, 8.4267578125, 8.895751953125, 9.36474609375, 9.833740234375, 10.302734375, 10.771728515625, 11.24072265625, 11.709716796875, 12.1787109375, 12.647705078125, 13.11669921875, 13.585693359375, 14.0546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 3.0, 7.0, 9.0, 12.0, 16.0, 15.0, 10.0, 24.0, 14.0, 28.0, 24.0, 35.0, 37.0, 35.0, 36.0, 49.0, 52.0, 49.0, 171.0, 838.0, 161.0, 66.0, 51.0, 49.0, 31.0, 28.0, 20.0, 26.0, 14.0, 27.0, 19.0, 14.0, 14.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.9375, -34.65869140625, -33.3798828125, -32.10107421875, -30.822265625, -29.54345703125, -28.2646484375, -26.98583984375, -25.70703125, -24.42822265625, -23.1494140625, -21.87060546875, -20.591796875, -19.31298828125, -18.0341796875, -16.75537109375, -15.4765625, -14.19775390625, -12.9189453125, -11.64013671875, -10.361328125, -9.08251953125, -7.8037109375, -6.52490234375, -5.24609375, -3.96728515625, -2.6884765625, -1.40966796875, -0.130859375, 1.14794921875, 2.4267578125, 3.70556640625, 4.984375, 6.26318359375, 7.5419921875, 8.82080078125, 10.099609375, 11.37841796875, 12.6572265625, 13.93603515625, 15.21484375, 16.49365234375, 17.7724609375, 19.05126953125, 20.330078125, 21.60888671875, 22.8876953125, 24.16650390625, 25.4453125, 26.72412109375, 28.0029296875, 29.28173828125, 30.560546875, 31.83935546875, 33.1181640625, 34.39697265625, 35.67578125, 36.95458984375, 38.2333984375, 39.51220703125, 40.791015625, 42.06982421875, 43.3486328125, 44.62744140625, 45.90625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 10.0, 6.0, 1.0, 14.0, 13.0, 8.0, 10.0, 28.0, 29.0, 34.0, 35.0, 51.0, 75.0, 82.0, 75.0, 115.0, 126.0, 217.0, 336.0, 488.0, 662.0, 1027.0, 1640.0, 2813.0, 5433.0, 12493.0, 38300.0, 5651095.0, 514611.0, 36406.0, 11924.0, 5330.0, 2806.0, 1699.0, 1019.0, 686.0, 465.0, 335.0, 245.0, 146.0, 123.0, 94.0, 58.0, 71.0, 39.0, 38.0, 27.0, 26.0, 9.0, 13.0, 6.0, 8.0, 12.0, 9.0, 6.0, 6.0, 3.0, 10.0, 1.0], "bins": [-103.0, -99.876953125, -96.75390625, -93.630859375, -90.5078125, -87.384765625, -84.26171875, -81.138671875, -78.015625, -74.892578125, -71.76953125, -68.646484375, -65.5234375, -62.400390625, -59.27734375, -56.154296875, -53.03125, -49.908203125, -46.78515625, -43.662109375, -40.5390625, -37.416015625, -34.29296875, -31.169921875, -28.046875, -24.923828125, -21.80078125, -18.677734375, -15.5546875, -12.431640625, -9.30859375, -6.185546875, -3.0625, 0.060546875, 3.18359375, 6.306640625, 9.4296875, 12.552734375, 15.67578125, 18.798828125, 21.921875, 25.044921875, 28.16796875, 31.291015625, 34.4140625, 37.537109375, 40.66015625, 43.783203125, 46.90625, 50.029296875, 53.15234375, 56.275390625, 59.3984375, 62.521484375, 65.64453125, 68.767578125, 71.890625, 75.013671875, 78.13671875, 81.259765625, 84.3828125, 87.505859375, 90.62890625, 93.751953125, 96.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 1.0, 5.0, 9.0, 7.0, 6.0, 8.0, 7.0, 7.0, 22.0, 28.0, 27.0, 48.0, 31.0, 56.0, 55.0, 61.0, 89.0, 813.0, 274.0, 94.0, 67.0, 48.0, 53.0, 26.0, 41.0, 25.0, 21.0, 17.0, 18.0, 10.0, 7.0, 8.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-54.9375, -53.2509765625, -51.564453125, -49.8779296875, -48.19140625, -46.5048828125, -44.818359375, -43.1318359375, -41.4453125, -39.7587890625, -38.072265625, -36.3857421875, -34.69921875, -33.0126953125, -31.326171875, -29.6396484375, -27.953125, -26.2666015625, -24.580078125, -22.8935546875, -21.20703125, -19.5205078125, -17.833984375, -16.1474609375, -14.4609375, -12.7744140625, -11.087890625, -9.4013671875, -7.71484375, -6.0283203125, -4.341796875, -2.6552734375, -0.96875, 0.7177734375, 2.404296875, 4.0908203125, 5.77734375, 7.4638671875, 9.150390625, 10.8369140625, 12.5234375, 14.2099609375, 15.896484375, 17.5830078125, 19.26953125, 20.9560546875, 22.642578125, 24.3291015625, 26.015625, 27.7021484375, 29.388671875, 31.0751953125, 32.76171875, 34.4482421875, 36.134765625, 37.8212890625, 39.5078125, 41.1943359375, 42.880859375, 44.5673828125, 46.25390625, 47.9404296875, 49.626953125, 51.3134765625, 53.0]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 10.0, 10.0, 36.0, 373.0, 449.0, 50.0, 29.0, 13.0, 8.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.73007202148438, -159.4951171875, -152.2601776123047, -145.0252227783203, -137.79026794433594, -130.55532836914062, -123.32037353515625, -116.0854263305664, -108.85047912597656, -101.61553192138672, -94.38057708740234, -87.1456298828125, -79.91068267822266, -72.67573547363281, -65.44078063964844, -58.205833435058594, -50.97087860107422, -43.73592758178711, -36.500980377197266, -29.266029357910156, -22.03108024597168, -14.796131134033203, -7.561180114746094, -0.32623291015625, 6.908718109130859, 14.143667221069336, 21.378616333007812, 28.613567352294922, 35.84851837158203, 43.083465576171875, 50.318416595458984, 57.55336380004883, 64.78831481933594, 72.02326202392578, 79.25821685791016, 86.4931640625, 93.72811126708984, 100.96305847167969, 108.19801330566406, 115.4329605102539, 122.66790771484375, 129.90286254882812, 137.13780212402344, 144.3727569580078, 151.6077117919922, 158.8426513671875, 166.07760620117188, 173.31256103515625, 180.54751586914062, 187.782470703125, 195.0174102783203, 202.2523651123047, 209.48731994628906, 216.72225952148438, 223.95721435546875, 231.19216918945312, 238.42710876464844, 245.6620635986328, 252.89700317382812, 260.1319580078125, 267.3669128417969, 274.60186767578125, 281.8367919921875, 289.0717468261719, 296.30670166015625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 9.0, 9.0, 11.0, 14.0, 26.0, 30.0, 101.0, 262.0, 312.0, 101.0, 34.0, 24.0, 18.0, 15.0, 9.0, 6.0, 7.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.35198974609375, -267.7244873046875, -259.09698486328125, -250.46946716308594, -241.84194946289062, -233.21444702148438, -224.58694458007812, -215.95944213867188, -207.33192443847656, -198.7044219970703, -190.076904296875, -181.44940185546875, -172.8218994140625, -164.1943817138672, -155.56687927246094, -146.93936157226562, -138.31185913085938, -129.68435668945312, -121.05683898925781, -112.42933654785156, -103.80182647705078, -95.17431640625, -86.54681396484375, -77.91930389404297, -69.29179382324219, -60.664283752441406, -52.03677749633789, -43.409271240234375, -34.781761169433594, -26.154251098632812, -17.526744842529297, -8.899238586425781, -0.271728515625, 8.355779647827148, 16.983287811279297, 25.610795974731445, 34.238304138183594, 42.865814208984375, 51.49332046508789, 60.120826721191406, 68.74833679199219, 77.37584686279297, 86.00335693359375, 94.630859375, 103.25836944580078, 111.88587951660156, 120.51338195800781, 129.14089965820312, 137.76840209960938, 146.39590454101562, 155.02342224121094, 163.6509246826172, 172.2784423828125, 180.90594482421875, 189.533447265625, 198.16094970703125, 206.78846740722656, 215.4159698486328, 224.04348754882812, 232.67098999023438, 241.29849243164062, 249.92601013183594, 258.55352783203125, 267.1810302734375, 275.80853271484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 9.0, 6.0, 15.0, 19.0, 27.0, 34.0, 64.0, 101.0, 190.0, 307.0, 608.0, 1337.0, 3364.0, 10476.0, 55131.0, 4049307.0, 56128.0, 10743.0, 3399.0, 1427.0, 693.0, 332.0, 193.0, 127.0, 68.0, 56.0, 38.0, 15.0, 22.0, 11.0, 10.0, 11.0, 6.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.25958251953125, -2.1773681640625, -2.09515380859375, -2.012939453125, -1.93072509765625, -1.8485107421875, -1.76629638671875, -1.68408203125, -1.60186767578125, -1.5196533203125, -1.43743896484375, -1.355224609375, -1.27301025390625, -1.1907958984375, -1.10858154296875, -1.0263671875, -0.94415283203125, -0.8619384765625, -0.77972412109375, -0.697509765625, -0.61529541015625, -0.5330810546875, -0.45086669921875, -0.36865234375, -0.28643798828125, -0.2042236328125, -0.12200927734375, -0.039794921875, 0.04241943359375, 0.1246337890625, 0.20684814453125, 0.2890625, 0.37127685546875, 0.4534912109375, 0.53570556640625, 0.617919921875, 0.70013427734375, 0.7823486328125, 0.86456298828125, 0.94677734375, 1.02899169921875, 1.1112060546875, 1.19342041015625, 1.275634765625, 1.35784912109375, 1.4400634765625, 1.52227783203125, 1.6044921875, 1.68670654296875, 1.7689208984375, 1.85113525390625, 1.933349609375, 2.01556396484375, 2.0977783203125, 2.17999267578125, 2.26220703125, 2.34442138671875, 2.4266357421875, 2.50885009765625, 2.591064453125, 2.67327880859375, 2.7554931640625, 2.83770751953125, 2.919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 6.0, 3.0, 9.0, 9.0, 12.0, 22.0, 30.0, 787.0, 40.0, 19.0, 22.0, 13.0, 4.0, 10.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3559532165527344, -0.34300994873046875, -0.3300666809082031, -0.3171234130859375, -0.3041801452636719, -0.29123687744140625, -0.2782936096191406, -0.265350341796875, -0.2524070739746094, -0.23946380615234375, -0.22652053833007812, -0.2135772705078125, -0.20063400268554688, -0.18769073486328125, -0.17474746704101562, -0.16180419921875, -0.14886093139648438, -0.13591766357421875, -0.12297439575195312, -0.1100311279296875, -0.09708786010742188, -0.08414459228515625, -0.07120132446289062, -0.058258056640625, -0.045314788818359375, -0.03237152099609375, -0.019428253173828125, -0.0064849853515625, 0.006458282470703125, 0.01940155029296875, 0.032344818115234375, 0.0452880859375, 0.058231353759765625, 0.07117462158203125, 0.08411788940429688, 0.0970611572265625, 0.11000442504882812, 0.12294769287109375, 0.13589096069335938, 0.148834228515625, 0.16177749633789062, 0.17472076416015625, 0.18766403198242188, 0.2006072998046875, 0.21355056762695312, 0.22649383544921875, 0.23943710327148438, 0.25238037109375, 0.2653236389160156, 0.27826690673828125, 0.2912101745605469, 0.3041534423828125, 0.3170967102050781, 0.33003997802734375, 0.3429832458496094, 0.355926513671875, 0.3688697814941406, 0.38181304931640625, 0.3947563171386719, 0.4076995849609375, 0.4206428527832031, 0.43358612060546875, 0.4465293884277344, 0.45947265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 17.0, 8.0, 19.0, 34.0, 24.0, 37.0, 61.0, 79.0, 116.0, 168.0, 262.0, 422.0, 640.0, 1149.0, 1853.0, 3582.0, 6597.0, 13560.0, 30810.0, 84524.0, 358678.0, 3176865.0, 379138.0, 82611.0, 28556.0, 12016.0, 5538.0, 2802.0, 1559.0, 883.0, 497.0, 357.0, 251.0, 156.0, 108.0, 79.0, 57.0, 44.0, 30.0, 24.0, 11.0, 15.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0], "bins": [-1.048828125, -1.0193023681640625, -0.989776611328125, -0.9602508544921875, -0.93072509765625, -0.9011993408203125, -0.871673583984375, -0.8421478271484375, -0.8126220703125, -0.7830963134765625, -0.753570556640625, -0.7240447998046875, -0.69451904296875, -0.6649932861328125, -0.635467529296875, -0.6059417724609375, -0.576416015625, -0.5468902587890625, -0.517364501953125, -0.4878387451171875, -0.45831298828125, -0.4287872314453125, -0.399261474609375, -0.3697357177734375, -0.3402099609375, -0.3106842041015625, -0.281158447265625, -0.2516326904296875, -0.22210693359375, -0.1925811767578125, -0.163055419921875, -0.1335296630859375, -0.10400390625, -0.0744781494140625, -0.044952392578125, -0.0154266357421875, 0.01409912109375, 0.0436248779296875, 0.073150634765625, 0.1026763916015625, 0.1322021484375, 0.1617279052734375, 0.191253662109375, 0.2207794189453125, 0.25030517578125, 0.2798309326171875, 0.309356689453125, 0.3388824462890625, 0.368408203125, 0.3979339599609375, 0.427459716796875, 0.4569854736328125, 0.48651123046875, 0.5160369873046875, 0.545562744140625, 0.5750885009765625, 0.6046142578125, 0.6341400146484375, 0.663665771484375, 0.6931915283203125, 0.72271728515625, 0.7522430419921875, 0.781768798828125, 0.8112945556640625, 0.8408203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 5.0, 9.0, 11.0, 4.0, 8.0, 15.0, 12.0, 20.0, 13.0, 20.0, 31.0, 41.0, 33.0, 59.0, 63.0, 97.0, 121.0, 152.0, 250.0, 429.0, 1044.0, 673.0, 306.0, 202.0, 114.0, 81.0, 69.0, 45.0, 28.0, 23.0, 23.0, 10.0, 14.0, 16.0, 7.0, 2.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36962890625, -0.3586769104003906, -0.34772491455078125, -0.3367729187011719, -0.3258209228515625, -0.3148689270019531, -0.30391693115234375, -0.2929649353027344, -0.282012939453125, -0.2710609436035156, -0.26010894775390625, -0.24915695190429688, -0.2382049560546875, -0.22725296020507812, -0.21630096435546875, -0.20534896850585938, -0.19439697265625, -0.18344497680664062, -0.17249298095703125, -0.16154098510742188, -0.1505889892578125, -0.13963699340820312, -0.12868499755859375, -0.11773300170898438, -0.106781005859375, -0.09582901000976562, -0.08487701416015625, -0.07392501831054688, -0.0629730224609375, -0.052021026611328125, -0.04106903076171875, -0.030117034912109375, -0.0191650390625, -0.008213043212890625, 0.00273895263671875, 0.013690948486328125, 0.0246429443359375, 0.035594940185546875, 0.04654693603515625, 0.057498931884765625, 0.068450927734375, 0.07940292358398438, 0.09035491943359375, 0.10130691528320312, 0.1122589111328125, 0.12321090698242188, 0.13416290283203125, 0.14511489868164062, 0.15606689453125, 0.16701889038085938, 0.17797088623046875, 0.18892288208007812, 0.1998748779296875, 0.21082687377929688, 0.22177886962890625, 0.23273086547851562, 0.243682861328125, 0.2546348571777344, 0.26558685302734375, 0.2765388488769531, 0.2874908447265625, 0.2984428405761719, 0.30939483642578125, 0.3203468322753906, 0.331298828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 8.0, 10.0, 33.0, 47.0, 81.0, 230.0, 415.0, 126.0, 30.0, 15.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.846606254577637, -13.577628135681152, -13.308650016784668, -13.039671897888184, -12.7706937789917, -12.501714706420898, -12.232736587524414, -11.96375846862793, -11.694780349731445, -11.425802230834961, -11.156824111938477, -10.887845993041992, -10.618867874145508, -10.349889755249023, -10.080911636352539, -9.811932563781738, -9.54295539855957, -9.273977279663086, -9.004999160766602, -8.736021041870117, -8.467042922973633, -8.198064804077148, -7.929086208343506, -7.6601080894470215, -7.391129493713379, -7.1221513748168945, -6.85317325592041, -6.584195137023926, -6.315216541290283, -6.046238422393799, -5.7772603034973145, -5.50828218460083, -5.239303112030029, -4.970324993133545, -4.7013468742370605, -4.432368278503418, -4.163390159606934, -3.894412040710449, -3.625433921813965, -3.3564558029174805, -3.087477445602417, -2.8184993267059326, -2.549520969390869, -2.2805428504943848, -2.0115647315979004, -1.742586374282837, -1.4736082553863525, -1.2046300172805786, -0.9356517791748047, -0.6666735410690308, -0.3976953625679016, -0.12871718406677246, 0.14026105403900146, 0.4092392921447754, 0.6782174110412598, 0.9471956491470337, 1.2161738872528076, 1.4851521253585815, 1.7541303634643555, 2.02310848236084, 2.292086601257324, 2.5610649585723877, 2.830043077468872, 3.0990214347839355, 3.36799955368042]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 3.0, 3.0, 9.0, 11.0, 17.0, 14.0, 17.0, 29.0, 32.0, 44.0, 49.0, 44.0, 57.0, 64.0, 72.0, 68.0, 57.0, 57.0, 55.0, 35.0, 45.0, 40.0, 36.0, 34.0, 26.0, 24.0, 14.0, 13.0, 8.0, 7.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.503812551498413, -3.399538040161133, -3.2952632904052734, -3.190988779067993, -3.086714029312134, -2.9824395179748535, -2.878164768218994, -2.773890256881714, -2.6696155071258545, -2.565340995788574, -2.461066246032715, -2.3567917346954346, -2.252516984939575, -2.148242473602295, -2.0439677238464355, -1.9396932125091553, -1.8354185819625854, -1.7311439514160156, -1.6268693208694458, -1.522594690322876, -1.4183200597763062, -1.3140454292297363, -1.209770917892456, -1.1054961681365967, -1.0012216567993164, -0.8969470262527466, -0.7926723957061768, -0.6883977651596069, -0.5841231346130371, -0.47984856367111206, -0.37557393312454224, -0.2712993025779724, -0.1670246124267578, -0.06274998933076859, 0.04152463376522064, 0.14579924941062927, 0.2500738799571991, 0.35434848070144653, 0.45862311124801636, 0.5628977417945862, 0.667172372341156, 0.7714470028877258, 0.8757216334342957, 0.9799962043762207, 1.0842708349227905, 1.1885454654693604, 1.2928200960159302, 1.3970947265625, 1.5013693571090698, 1.6056439876556396, 1.7099186182022095, 1.8141932487487793, 1.9184678792953491, 2.022742509841919, 2.127017021179199, 2.2312917709350586, 2.335566282272339, 2.439840793609619, 2.5441155433654785, 2.648390054702759, 2.752664804458618, 2.8569393157958984, 2.961214065551758, 3.065488576889038, 3.1697633266448975]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 8.0, 9.0, 15.0, 17.0, 26.0, 28.0, 46.0, 67.0, 117.0, 128.0, 201.0, 361.0, 552.0, 1028.0, 2019.0, 4456.0, 12702.0, 85256.0, 894361.0, 32071.0, 8208.0, 3197.0, 1511.0, 786.0, 469.0, 310.0, 180.0, 121.0, 83.0, 57.0, 46.0, 27.0, 21.0, 15.0, 11.0, 8.0, 5.0, 7.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0], "bins": [-2.732421875, -2.65716552734375, -2.5819091796875, -2.50665283203125, -2.431396484375, -2.35614013671875, -2.2808837890625, -2.20562744140625, -2.13037109375, -2.05511474609375, -1.9798583984375, -1.90460205078125, -1.829345703125, -1.75408935546875, -1.6788330078125, -1.60357666015625, -1.5283203125, -1.45306396484375, -1.3778076171875, -1.30255126953125, -1.227294921875, -1.15203857421875, -1.0767822265625, -1.00152587890625, -0.92626953125, -0.85101318359375, -0.7757568359375, -0.70050048828125, -0.625244140625, -0.54998779296875, -0.4747314453125, -0.39947509765625, -0.32421875, -0.24896240234375, -0.1737060546875, -0.09844970703125, -0.023193359375, 0.05206298828125, 0.1273193359375, 0.20257568359375, 0.27783203125, 0.35308837890625, 0.4283447265625, 0.50360107421875, 0.578857421875, 0.65411376953125, 0.7293701171875, 0.80462646484375, 0.8798828125, 0.95513916015625, 1.0303955078125, 1.10565185546875, 1.180908203125, 1.25616455078125, 1.3314208984375, 1.40667724609375, 1.48193359375, 1.55718994140625, 1.6324462890625, 1.70770263671875, 1.782958984375, 1.85821533203125, 1.9334716796875, 2.00872802734375, 2.083984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 3.0, 6.0, 5.0, 11.0, 12.0, 20.0, 88.0, 294.0, 334.0, 119.0, 35.0, 25.0, 9.0, 6.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.36907196044921875, -0.3582611083984375, -0.34745025634765625, -0.336639404296875, -0.32582855224609375, -0.3150177001953125, -0.30420684814453125, -0.29339599609375, -0.28258514404296875, -0.2717742919921875, -0.26096343994140625, -0.250152587890625, -0.23934173583984375, -0.2285308837890625, -0.21772003173828125, -0.2069091796875, -0.19609832763671875, -0.1852874755859375, -0.17447662353515625, -0.163665771484375, -0.15285491943359375, -0.1420440673828125, -0.13123321533203125, -0.12042236328125, -0.10961151123046875, -0.0988006591796875, -0.08798980712890625, -0.077178955078125, -0.06636810302734375, -0.0555572509765625, -0.04474639892578125, -0.033935546875, -0.02312469482421875, -0.0123138427734375, -0.00150299072265625, 0.009307861328125, 0.02011871337890625, 0.0309295654296875, 0.04174041748046875, 0.05255126953125, 0.06336212158203125, 0.0741729736328125, 0.08498382568359375, 0.095794677734375, 0.10660552978515625, 0.1174163818359375, 0.12822723388671875, 0.1390380859375, 0.14984893798828125, 0.1606597900390625, 0.17147064208984375, 0.182281494140625, 0.19309234619140625, 0.2039031982421875, 0.21471405029296875, 0.22552490234375, 0.23633575439453125, 0.2471466064453125, 0.25795745849609375, 0.268768310546875, 0.27957916259765625, 0.2903900146484375, 0.30120086669921875, 0.31201171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 6.0, 14.0, 18.0, 17.0, 34.0, 34.0, 83.0, 136.0, 214.0, 384.0, 765.0, 2068.0, 8886.0, 167181.0, 838591.0, 24328.0, 3476.0, 1077.0, 520.0, 264.0, 145.0, 98.0, 62.0, 26.0, 31.0, 23.0, 20.0, 9.0, 5.0, 4.0, 4.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7734375, -3.6485595703125, -3.523681640625, -3.3988037109375, -3.27392578125, -3.1490478515625, -3.024169921875, -2.8992919921875, -2.7744140625, -2.6495361328125, -2.524658203125, -2.3997802734375, -2.27490234375, -2.1500244140625, -2.025146484375, -1.9002685546875, -1.775390625, -1.6505126953125, -1.525634765625, -1.4007568359375, -1.27587890625, -1.1510009765625, -1.026123046875, -0.9012451171875, -0.7763671875, -0.6514892578125, -0.526611328125, -0.4017333984375, -0.27685546875, -0.1519775390625, -0.027099609375, 0.0977783203125, 0.22265625, 0.3475341796875, 0.472412109375, 0.5972900390625, 0.72216796875, 0.8470458984375, 0.971923828125, 1.0968017578125, 1.2216796875, 1.3465576171875, 1.471435546875, 1.5963134765625, 1.72119140625, 1.8460693359375, 1.970947265625, 2.0958251953125, 2.220703125, 2.3455810546875, 2.470458984375, 2.5953369140625, 2.72021484375, 2.8450927734375, 2.969970703125, 3.0948486328125, 3.2197265625, 3.3446044921875, 3.469482421875, 3.5943603515625, 3.71923828125, 3.8441162109375, 3.968994140625, 4.0938720703125, 4.21875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 5.0, 2.0, 10.0, 6.0, 8.0, 10.0, 12.0, 13.0, 19.0, 19.0, 19.0, 25.0, 21.0, 30.0, 28.0, 32.0, 26.0, 21.0, 31.0, 37.0, 41.0, 28.0, 50.0, 41.0, 43.0, 36.0, 31.0, 35.0, 31.0, 34.0, 30.0, 23.0, 31.0, 27.0, 21.0, 12.0, 12.0, 14.0, 11.0, 13.0, 6.0, 3.0, 10.0, 8.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0], "bins": [-0.96923828125, -0.9406356811523438, -0.9120330810546875, -0.8834304809570312, -0.854827880859375, -0.8262252807617188, -0.7976226806640625, -0.7690200805664062, -0.74041748046875, -0.7118148803710938, -0.6832122802734375, -0.6546096801757812, -0.626007080078125, -0.5974044799804688, -0.5688018798828125, -0.5401992797851562, -0.5115966796875, -0.48299407958984375, -0.4543914794921875, -0.42578887939453125, -0.397186279296875, -0.36858367919921875, -0.3399810791015625, -0.31137847900390625, -0.28277587890625, -0.25417327880859375, -0.2255706787109375, -0.19696807861328125, -0.168365478515625, -0.13976287841796875, -0.1111602783203125, -0.08255767822265625, -0.053955078125, -0.02535247802734375, 0.0032501220703125, 0.03185272216796875, 0.060455322265625, 0.08905792236328125, 0.1176605224609375, 0.14626312255859375, 0.17486572265625, 0.20346832275390625, 0.2320709228515625, 0.26067352294921875, 0.289276123046875, 0.31787872314453125, 0.3464813232421875, 0.37508392333984375, 0.4036865234375, 0.43228912353515625, 0.4608917236328125, 0.48949432373046875, 0.518096923828125, 0.5466995239257812, 0.5753021240234375, 0.6039047241210938, 0.63250732421875, 0.6611099243164062, 0.6897125244140625, 0.7183151245117188, 0.746917724609375, 0.7755203247070312, 0.8041229248046875, 0.8327255249023438, 0.861328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 11.0, 16.0, 20.0, 22.0, 31.0, 55.0, 97.0, 153.0, 341.0, 851.0, 3060.0, 25222.0, 993765.0, 20407.0, 2885.0, 856.0, 311.0, 154.0, 83.0, 59.0, 38.0, 22.0, 20.0, 11.0, 12.0, 7.0, 4.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.16015625, -4.00299072265625, -3.8458251953125, -3.68865966796875, -3.531494140625, -3.37432861328125, -3.2171630859375, -3.05999755859375, -2.90283203125, -2.74566650390625, -2.5885009765625, -2.43133544921875, -2.274169921875, -2.11700439453125, -1.9598388671875, -1.80267333984375, -1.6455078125, -1.48834228515625, -1.3311767578125, -1.17401123046875, -1.016845703125, -0.85968017578125, -0.7025146484375, -0.54534912109375, -0.38818359375, -0.23101806640625, -0.0738525390625, 0.08331298828125, 0.240478515625, 0.39764404296875, 0.5548095703125, 0.71197509765625, 0.869140625, 1.02630615234375, 1.1834716796875, 1.34063720703125, 1.497802734375, 1.65496826171875, 1.8121337890625, 1.96929931640625, 2.12646484375, 2.28363037109375, 2.4407958984375, 2.59796142578125, 2.755126953125, 2.91229248046875, 3.0694580078125, 3.22662353515625, 3.3837890625, 3.54095458984375, 3.6981201171875, 3.85528564453125, 4.012451171875, 4.16961669921875, 4.3267822265625, 4.48394775390625, 4.64111328125, 4.79827880859375, 4.9554443359375, 5.11260986328125, 5.269775390625, 5.42694091796875, 5.5841064453125, 5.74127197265625, 5.8984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 2.0, 6.0, 7.0, 5.0, 13.0, 23.0, 25.0, 67.0, 113.0, 182.0, 203.0, 137.0, 95.0, 41.0, 31.0, 19.0, 12.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00173187255859375, -0.001681312918663025, -0.0016307532787322998, -0.0015801936388015747, -0.0015296339988708496, -0.0014790743589401245, -0.0014285147190093994, -0.0013779550790786743, -0.0013273954391479492, -0.0012768357992172241, -0.001226276159286499, -0.001175716519355774, -0.0011251568794250488, -0.0010745972394943237, -0.0010240375995635986, -0.0009734779596328735, -0.0009229183197021484, -0.0008723586797714233, -0.0008217990398406982, -0.0007712393999099731, -0.000720679759979248, -0.000670120120048523, -0.0006195604801177979, -0.0005690008401870728, -0.0005184412002563477, -0.00046788156032562256, -0.00041732192039489746, -0.00036676228046417236, -0.00031620264053344727, -0.00026564300060272217, -0.00021508336067199707, -0.00016452372074127197, -0.00011396408081054688, -6.340444087982178e-05, -1.284480094909668e-05, 3.771483898162842e-05, 8.827447891235352e-05, 0.0001388341188430786, 0.0001893937587738037, 0.0002399533987045288, 0.0002905130386352539, 0.000341072678565979, 0.0003916323184967041, 0.0004421919584274292, 0.0004927515983581543, 0.0005433112382888794, 0.0005938708782196045, 0.0006444305181503296, 0.0006949901580810547, 0.0007455497980117798, 0.0007961094379425049, 0.00084666907787323, 0.0008972287178039551, 0.0009477883577346802, 0.0009983479976654053, 0.0010489076375961304, 0.0010994672775268555, 0.0011500269174575806, 0.0012005865573883057, 0.0012511461973190308, 0.0013017058372497559, 0.001352265477180481, 0.001402825117111206, 0.0014533847570419312, 0.0015039443969726562]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 7.0, 11.0, 13.0, 21.0, 25.0, 34.0, 57.0, 85.0, 124.0, 201.0, 336.0, 553.0, 995.0, 1966.0, 4840.0, 13859.0, 63337.0, 779833.0, 146771.0, 22733.0, 6858.0, 2842.0, 1275.0, 700.0, 378.0, 238.0, 156.0, 88.0, 62.0, 35.0, 32.0, 23.0, 15.0, 10.0, 8.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9501953125, -1.8845062255859375, -1.818817138671875, -1.7531280517578125, -1.68743896484375, -1.6217498779296875, -1.556060791015625, -1.4903717041015625, -1.4246826171875, -1.3589935302734375, -1.293304443359375, -1.2276153564453125, -1.16192626953125, -1.0962371826171875, -1.030548095703125, -0.9648590087890625, -0.899169921875, -0.8334808349609375, -0.767791748046875, -0.7021026611328125, -0.63641357421875, -0.5707244873046875, -0.505035400390625, -0.4393463134765625, -0.3736572265625, -0.3079681396484375, -0.242279052734375, -0.1765899658203125, -0.11090087890625, -0.0452117919921875, 0.020477294921875, 0.0861663818359375, 0.15185546875, 0.2175445556640625, 0.283233642578125, 0.3489227294921875, 0.41461181640625, 0.4803009033203125, 0.545989990234375, 0.6116790771484375, 0.6773681640625, 0.7430572509765625, 0.808746337890625, 0.8744354248046875, 0.94012451171875, 1.0058135986328125, 1.071502685546875, 1.1371917724609375, 1.202880859375, 1.2685699462890625, 1.334259033203125, 1.3999481201171875, 1.46563720703125, 1.5313262939453125, 1.597015380859375, 1.6627044677734375, 1.7283935546875, 1.7940826416015625, 1.859771728515625, 1.9254608154296875, 1.99114990234375, 2.0568389892578125, 2.122528076171875, 2.1882171630859375, 2.25390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 16.0, 12.0, 18.0, 16.0, 31.0, 24.0, 56.0, 75.0, 111.0, 144.0, 149.0, 88.0, 62.0, 47.0, 37.0, 23.0, 22.0, 11.0, 15.0, 6.0, 4.0, 4.0, 2.0, 5.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8515625, -1.78985595703125, -1.7281494140625, -1.66644287109375, -1.604736328125, -1.54302978515625, -1.4813232421875, -1.41961669921875, -1.35791015625, -1.29620361328125, -1.2344970703125, -1.17279052734375, -1.111083984375, -1.04937744140625, -0.9876708984375, -0.92596435546875, -0.8642578125, -0.80255126953125, -0.7408447265625, -0.67913818359375, -0.617431640625, -0.55572509765625, -0.4940185546875, -0.43231201171875, -0.37060546875, -0.30889892578125, -0.2471923828125, -0.18548583984375, -0.123779296875, -0.06207275390625, -0.0003662109375, 0.06134033203125, 0.123046875, 0.18475341796875, 0.2464599609375, 0.30816650390625, 0.369873046875, 0.43157958984375, 0.4932861328125, 0.55499267578125, 0.61669921875, 0.67840576171875, 0.7401123046875, 0.80181884765625, 0.863525390625, 0.92523193359375, 0.9869384765625, 1.04864501953125, 1.1103515625, 1.17205810546875, 1.2337646484375, 1.29547119140625, 1.357177734375, 1.41888427734375, 1.4805908203125, 1.54229736328125, 1.60400390625, 1.66571044921875, 1.7274169921875, 1.78912353515625, 1.850830078125, 1.91253662109375, 1.9742431640625, 2.03594970703125, 2.09765625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 12.0, 56.0, 229.0, 521.0, 123.0, 28.0, 14.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.99327087402344, -31.83414077758789, -30.675012588500977, -29.515884399414062, -28.356754302978516, -27.19762420654297, -26.038496017456055, -24.87936782836914, -23.720237731933594, -22.561107635498047, -21.401979446411133, -20.24285125732422, -19.083721160888672, -17.924591064453125, -16.76546287536621, -15.60633373260498, -14.44720458984375, -13.28807544708252, -12.128946304321289, -10.969817161560059, -9.810688018798828, -8.651558876037598, -7.492429733276367, -6.333300590515137, -5.174171447753906, -4.015042304992676, -2.8559131622314453, -1.6967840194702148, -0.5376548767089844, 0.6214742660522461, 1.7806034088134766, 2.939732551574707, 4.098865509033203, 5.257994651794434, 6.417123794555664, 7.5762529373168945, 8.735382080078125, 9.894511222839355, 11.053640365600586, 12.212769508361816, 13.371898651123047, 14.531027793884277, 15.690156936645508, 16.849285125732422, 18.00841522216797, 19.167545318603516, 20.32667350769043, 21.485801696777344, 22.64493179321289, 23.804061889648438, 24.96319007873535, 26.122318267822266, 27.281448364257812, 28.44057846069336, 29.599706649780273, 30.758834838867188, 31.917964935302734, 33.07709503173828, 34.23622131347656, 35.39535140991211, 36.554481506347656, 37.7136116027832, 38.87274169921875, 40.03186798095703, 41.19099807739258]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 10.0, 8.0, 13.0, 17.0, 42.0, 39.0, 85.0, 103.0, 144.0, 157.0, 128.0, 88.0, 61.0, 37.0, 24.0, 15.0, 6.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.332351684570312, -19.522924423217773, -18.713499069213867, -17.904071807861328, -17.094646453857422, -16.285219192504883, -15.47579288482666, -14.666366577148438, -13.856939315795898, -13.047513008117676, -12.238086700439453, -11.428659439086914, -10.619233131408691, -9.809806823730469, -9.000380516052246, -8.190954208374023, -7.381527900695801, -6.572101593017578, -5.762674808502197, -4.953248500823975, -4.143821716308594, -3.334395408630371, -2.5249691009521484, -1.7155423164367676, -0.9061160087585449, -0.09668952226638794, 0.712736964225769, 1.5221633911132812, 2.331589937210083, 3.1410164833068848, 3.9504427909851074, 4.759869575500488, 5.569295883178711, 6.378722190856934, 7.1881489753723145, 7.997575283050537, 8.807002067565918, 9.61642837524414, 10.425854682922363, 11.235280990600586, 12.044708251953125, 12.854134559631348, 13.66356086730957, 14.47298812866211, 15.282414436340332, 16.091840744018555, 16.901268005371094, 17.710693359375, 18.520118713378906, 19.329545974731445, 20.13897132873535, 20.94839859008789, 21.757823944091797, 22.567251205444336, 23.376678466796875, 24.18610382080078, 24.99553108215332, 25.80495834350586, 26.614383697509766, 27.423810958862305, 28.23323631286621, 29.04266357421875, 29.852088928222656, 30.661516189575195, 31.470943450927734]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 8.0, 7.0, 6.0, 11.0, 20.0, 24.0, 50.0, 186.0, 28551.0, 4164094.0, 1038.0, 165.0, 52.0, 27.0, 19.0, 11.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.4375, -34.865234375, -33.29296875, -31.720703125, -30.1484375, -28.576171875, -27.00390625, -25.431640625, -23.859375, -22.287109375, -20.71484375, -19.142578125, -17.5703125, -15.998046875, -14.42578125, -12.853515625, -11.28125, -9.708984375, -8.13671875, -6.564453125, -4.9921875, -3.419921875, -1.84765625, -0.275390625, 1.296875, 2.869140625, 4.44140625, 6.013671875, 7.5859375, 9.158203125, 10.73046875, 12.302734375, 13.875, 15.447265625, 17.01953125, 18.591796875, 20.1640625, 21.736328125, 23.30859375, 24.880859375, 26.453125, 28.025390625, 29.59765625, 31.169921875, 32.7421875, 34.314453125, 35.88671875, 37.458984375, 39.03125, 40.603515625, 42.17578125, 43.748046875, 45.3203125, 46.892578125, 48.46484375, 50.037109375, 51.609375, 53.181640625, 54.75390625, 56.326171875, 57.8984375, 59.470703125, 61.04296875, 62.615234375, 64.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 11.0, 5.0, 7.0, 18.0, 27.0, 69.0, 84.0, 130.0, 160.0, 157.0, 112.0, 64.0, 44.0, 32.0, 16.0, 6.0, 8.0, 5.0, 9.0, 4.0, 1.0, 6.0, 3.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14990234375, -0.14412879943847656, -0.13835525512695312, -0.1325817108154297, -0.12680816650390625, -0.12103462219238281, -0.11526107788085938, -0.10948753356933594, -0.1037139892578125, -0.09794044494628906, -0.09216690063476562, -0.08639335632324219, -0.08061981201171875, -0.07484626770019531, -0.06907272338867188, -0.06329917907714844, -0.057525634765625, -0.05175209045410156, -0.045978546142578125, -0.04020500183105469, -0.03443145751953125, -0.028657913208007812, -0.022884368896484375, -0.017110824584960938, -0.0113372802734375, -0.0055637359619140625, 0.000209808349609375, 0.0059833526611328125, 0.01175689697265625, 0.017530441284179688, 0.023303985595703125, 0.029077529907226562, 0.03485107421875, 0.04062461853027344, 0.046398162841796875, 0.05217170715332031, 0.05794525146484375, 0.06371879577636719, 0.06949234008789062, 0.07526588439941406, 0.0810394287109375, 0.08681297302246094, 0.09258651733398438, 0.09836006164550781, 0.10413360595703125, 0.10990715026855469, 0.11568069458007812, 0.12145423889160156, 0.127227783203125, 0.13300132751464844, 0.13877487182617188, 0.1445484161376953, 0.15032196044921875, 0.1560955047607422, 0.16186904907226562, 0.16764259338378906, 0.1734161376953125, 0.17918968200683594, 0.18496322631835938, 0.1907367706298828, 0.19651031494140625, 0.2022838592529297, 0.20805740356445312, 0.21383094787597656, 0.2196044921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 3.0, 6.0, 13.0, 21.0, 41.0, 44.0, 71.0, 93.0, 134.0, 204.0, 423.0, 1695.0, 344979.0, 3843791.0, 2301.0, 311.0, 97.0, 31.0, 11.0, 7.0, 3.0, 4.0, 2.0], "bins": [-19.671875, -19.308074951171875, -18.94427490234375, -18.580474853515625, -18.2166748046875, -17.852874755859375, -17.48907470703125, -17.125274658203125, -16.761474609375, -16.397674560546875, -16.03387451171875, -15.670074462890625, -15.3062744140625, -14.942474365234375, -14.57867431640625, -14.214874267578125, -13.85107421875, -13.487274169921875, -13.12347412109375, -12.759674072265625, -12.3958740234375, -12.032073974609375, -11.66827392578125, -11.304473876953125, -10.940673828125, -10.576873779296875, -10.21307373046875, -9.849273681640625, -9.4854736328125, -9.121673583984375, -8.75787353515625, -8.394073486328125, -8.0302734375, -7.666473388671875, -7.30267333984375, -6.938873291015625, -6.5750732421875, -6.211273193359375, -5.84747314453125, -5.483673095703125, -5.119873046875, -4.756072998046875, -4.39227294921875, -4.028472900390625, -3.6646728515625, -3.300872802734375, -2.93707275390625, -2.573272705078125, -2.20947265625, -1.845672607421875, -1.48187255859375, -1.118072509765625, -0.7542724609375, -0.390472412109375, -0.02667236328125, 0.337127685546875, 0.700927734375, 1.064727783203125, 1.42852783203125, 1.792327880859375, 2.1561279296875, 2.519927978515625, 2.88372802734375, 3.247528076171875, 3.611328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 10.0, 8.0, 18.0, 30.0, 23.0, 62.0, 113.0, 230.0, 454.0, 981.0, 1178.0, 410.0, 180.0, 107.0, 60.0, 47.0, 32.0, 25.0, 26.0, 9.0, 16.0, 9.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326904296875, -0.3175849914550781, -0.30826568603515625, -0.2989463806152344, -0.2896270751953125, -0.2803077697753906, -0.27098846435546875, -0.2616691589355469, -0.252349853515625, -0.24303054809570312, -0.23371124267578125, -0.22439193725585938, -0.2150726318359375, -0.20575332641601562, -0.19643402099609375, -0.18711471557617188, -0.17779541015625, -0.16847610473632812, -0.15915679931640625, -0.14983749389648438, -0.1405181884765625, -0.13119888305664062, -0.12187957763671875, -0.11256027221679688, -0.103240966796875, -0.09392166137695312, -0.08460235595703125, -0.07528305053710938, -0.0659637451171875, -0.056644439697265625, -0.04732513427734375, -0.038005828857421875, -0.0286865234375, -0.019367218017578125, -0.01004791259765625, -0.000728607177734375, 0.0085906982421875, 0.017910003662109375, 0.02722930908203125, 0.036548614501953125, 0.045867919921875, 0.055187225341796875, 0.06450653076171875, 0.07382583618164062, 0.0831451416015625, 0.09246444702148438, 0.10178375244140625, 0.11110305786132812, 0.12042236328125, 0.12974166870117188, 0.13906097412109375, 0.14838027954101562, 0.1576995849609375, 0.16701889038085938, 0.17633819580078125, 0.18565750122070312, 0.194976806640625, 0.20429611206054688, 0.21361541748046875, 0.22293472290039062, 0.2322540283203125, 0.24157333374023438, 0.25089263916015625, 0.2602119445800781, 0.26953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 77.0, 904.0, 24.0, 2.0, 2.0, 2.0], "bins": [-90.9687728881836, -89.4393539428711, -87.90994262695312, -86.38052368164062, -84.85110473632812, -83.32168579101562, -81.79227447509766, -80.26285552978516, -78.73343658447266, -77.20401763916016, -75.67460632324219, -74.14518737792969, -72.61576843261719, -71.08634948730469, -69.55693817138672, -68.02751922607422, -66.49810791015625, -64.96868896484375, -63.439273834228516, -61.90985870361328, -60.38043975830078, -58.85102462768555, -57.32160949707031, -55.79219055175781, -54.26277160644531, -52.73335647583008, -51.20393753051758, -49.674522399902344, -48.145103454589844, -46.61568832397461, -45.086273193359375, -43.556854248046875, -42.02743911743164, -40.498023986816406, -38.968605041503906, -37.43918991088867, -35.90977096557617, -34.38035583496094, -32.85093688964844, -31.321521759033203, -29.792102813720703, -28.262685775756836, -26.73326873779297, -25.203853607177734, -23.674434661865234, -22.14501953125, -20.615602493286133, -19.086185455322266, -17.55677032470703, -16.027353286743164, -14.497936248779297, -12.968520164489746, -11.439103126525879, -9.909686088562012, -8.380270004272461, -6.850852966308594, -5.32143497467041, -3.792018175125122, -2.262601375579834, -0.733184814453125, 0.7962322235107422, 2.3256492614746094, 3.85506534576416, 5.384482383728027, 6.9138994216918945]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 15.0, 37.0, 63.0, 87.0, 146.0, 158.0, 138.0, 130.0, 92.0, 48.0, 26.0, 21.0, 12.0, 10.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.495293617248535, -6.3571600914001465, -6.219026565551758, -6.080893039703369, -5.9427595138549805, -5.804625988006592, -5.666492462158203, -5.5283589363098145, -5.390225410461426, -5.252091884613037, -5.113958358764648, -4.97582483291626, -4.837691307067871, -4.699557781219482, -4.561424255371094, -4.423290729522705, -4.285157203674316, -4.147023677825928, -4.008890151977539, -3.8707566261291504, -3.7326231002807617, -3.594489574432373, -3.4563560485839844, -3.3182225227355957, -3.1800894737243652, -3.0419559478759766, -2.903822422027588, -2.765688896179199, -2.6275553703308105, -2.489421844482422, -2.351288318634033, -2.2131547927856445, -2.075021266937256, -1.9368877410888672, -1.7987542152404785, -1.6606206893920898, -1.5224871635437012, -1.3843536376953125, -1.2462202310562134, -1.1080867052078247, -0.969953179359436, -0.8318196535110474, -0.6936861276626587, -0.5555526614189148, -0.4174191355705261, -0.27928560972213745, -0.14115214347839355, -0.003018617630004883, 0.1351149082183838, 0.27324843406677246, 0.41138193011283875, 0.549515426158905, 0.6876489520072937, 0.8257824778556824, 0.9639159440994263, 1.102049469947815, 1.2401829957962036, 1.3783165216445923, 1.516450047492981, 1.65458345413208, 1.7927169799804688, 1.9308505058288574, 2.068984031677246, 2.2071175575256348, 2.3452510833740234]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 8.0, 9.0, 13.0, 10.0, 17.0, 19.0, 46.0, 69.0, 119.0, 191.0, 361.0, 617.0, 1194.0, 2630.0, 7836.0, 37440.0, 735960.0, 232241.0, 20652.0, 5110.0, 1890.0, 919.0, 500.0, 282.0, 155.0, 100.0, 58.0, 40.0, 24.0, 11.0, 12.0, 13.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.41058349609375, -2.3172607421875, -2.22393798828125, -2.130615234375, -2.03729248046875, -1.9439697265625, -1.85064697265625, -1.75732421875, -1.66400146484375, -1.5706787109375, -1.47735595703125, -1.384033203125, -1.29071044921875, -1.1973876953125, -1.10406494140625, -1.0107421875, -0.91741943359375, -0.8240966796875, -0.73077392578125, -0.637451171875, -0.54412841796875, -0.4508056640625, -0.35748291015625, -0.26416015625, -0.17083740234375, -0.0775146484375, 0.01580810546875, 0.109130859375, 0.20245361328125, 0.2957763671875, 0.38909912109375, 0.482421875, 0.57574462890625, 0.6690673828125, 0.76239013671875, 0.855712890625, 0.94903564453125, 1.0423583984375, 1.13568115234375, 1.22900390625, 1.32232666015625, 1.4156494140625, 1.50897216796875, 1.602294921875, 1.69561767578125, 1.7889404296875, 1.88226318359375, 1.9755859375, 2.06890869140625, 2.1622314453125, 2.25555419921875, 2.348876953125, 2.44219970703125, 2.5355224609375, 2.62884521484375, 2.72216796875, 2.81549072265625, 2.9088134765625, 3.00213623046875, 3.095458984375, 3.18878173828125, 3.2821044921875, 3.37542724609375, 3.46875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 8.0, 5.0, 8.0, 2.0, 17.0, 29.0, 55.0, 70.0, 104.0, 125.0, 171.0, 135.0, 79.0, 54.0, 39.0, 26.0, 21.0, 8.0, 7.0, 3.0, 9.0, 2.0, 3.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1435546875, -0.13812637329101562, -0.13269805908203125, -0.12726974487304688, -0.1218414306640625, -0.11641311645507812, -0.11098480224609375, -0.10555648803710938, -0.100128173828125, -0.09469985961914062, -0.08927154541015625, -0.08384323120117188, -0.0784149169921875, -0.07298660278320312, -0.06755828857421875, -0.062129974365234375, -0.05670166015625, -0.051273345947265625, -0.04584503173828125, -0.040416717529296875, -0.0349884033203125, -0.029560089111328125, -0.02413177490234375, -0.018703460693359375, -0.013275146484375, -0.007846832275390625, -0.00241851806640625, 0.003009796142578125, 0.0084381103515625, 0.013866424560546875, 0.01929473876953125, 0.024723052978515625, 0.0301513671875, 0.035579681396484375, 0.04100799560546875, 0.046436309814453125, 0.0518646240234375, 0.057292938232421875, 0.06272125244140625, 0.06814956665039062, 0.073577880859375, 0.07900619506835938, 0.08443450927734375, 0.08986282348632812, 0.0952911376953125, 0.10071945190429688, 0.10614776611328125, 0.11157608032226562, 0.11700439453125, 0.12243270874023438, 0.12786102294921875, 0.13328933715820312, 0.1387176513671875, 0.14414596557617188, 0.14957427978515625, 0.15500259399414062, 0.160430908203125, 0.16585922241210938, 0.17128753662109375, 0.17671585083007812, 0.1821441650390625, 0.18757247924804688, 0.19300079345703125, 0.19842910766601562, 0.203857421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 14.0, 24.0, 24.0, 30.0, 63.0, 68.0, 126.0, 280.0, 523.0, 1170.0, 4048.0, 27953.0, 696143.0, 297384.0, 15604.0, 2968.0, 1011.0, 494.0, 226.0, 122.0, 94.0, 62.0, 35.0, 22.0, 15.0, 8.0, 1.0, 5.0, 4.0, 4.0, 1.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.818359375, -2.735137939453125, -2.65191650390625, -2.568695068359375, -2.4854736328125, -2.402252197265625, -2.31903076171875, -2.235809326171875, -2.152587890625, -2.069366455078125, -1.98614501953125, -1.902923583984375, -1.8197021484375, -1.736480712890625, -1.65325927734375, -1.570037841796875, -1.48681640625, -1.403594970703125, -1.32037353515625, -1.237152099609375, -1.1539306640625, -1.070709228515625, -0.98748779296875, -0.904266357421875, -0.821044921875, -0.737823486328125, -0.65460205078125, -0.571380615234375, -0.4881591796875, -0.404937744140625, -0.32171630859375, -0.238494873046875, -0.1552734375, -0.072052001953125, 0.01116943359375, 0.094390869140625, 0.1776123046875, 0.260833740234375, 0.34405517578125, 0.427276611328125, 0.510498046875, 0.593719482421875, 0.67694091796875, 0.760162353515625, 0.8433837890625, 0.926605224609375, 1.00982666015625, 1.093048095703125, 1.17626953125, 1.259490966796875, 1.34271240234375, 1.425933837890625, 1.5091552734375, 1.592376708984375, 1.67559814453125, 1.758819580078125, 1.842041015625, 1.925262451171875, 2.00848388671875, 2.091705322265625, 2.1749267578125, 2.258148193359375, 2.34136962890625, 2.424591064453125, 2.5078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 8.0, 11.0, 8.0, 12.0, 17.0, 21.0, 16.0, 12.0, 20.0, 31.0, 38.0, 31.0, 33.0, 44.0, 29.0, 42.0, 48.0, 53.0, 48.0, 47.0, 37.0, 34.0, 37.0, 51.0, 43.0, 31.0, 28.0, 26.0, 19.0, 18.0, 17.0, 18.0, 15.0, 8.0, 7.0, 9.0, 3.0, 6.0, 5.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5439453125, -0.5257949829101562, -0.5076446533203125, -0.48949432373046875, -0.471343994140625, -0.45319366455078125, -0.4350433349609375, -0.41689300537109375, -0.39874267578125, -0.38059234619140625, -0.3624420166015625, -0.34429168701171875, -0.326141357421875, -0.30799102783203125, -0.2898406982421875, -0.27169036865234375, -0.2535400390625, -0.23538970947265625, -0.2172393798828125, -0.19908905029296875, -0.180938720703125, -0.16278839111328125, -0.1446380615234375, -0.12648773193359375, -0.10833740234375, -0.09018707275390625, -0.0720367431640625, -0.05388641357421875, -0.035736083984375, -0.01758575439453125, 0.0005645751953125, 0.01871490478515625, 0.036865234375, 0.05501556396484375, 0.0731658935546875, 0.09131622314453125, 0.109466552734375, 0.12761688232421875, 0.1457672119140625, 0.16391754150390625, 0.18206787109375, 0.20021820068359375, 0.2183685302734375, 0.23651885986328125, 0.254669189453125, 0.27281951904296875, 0.2909698486328125, 0.30912017822265625, 0.3272705078125, 0.34542083740234375, 0.3635711669921875, 0.38172149658203125, 0.399871826171875, 0.41802215576171875, 0.4361724853515625, 0.45432281494140625, 0.47247314453125, 0.49062347412109375, 0.5087738037109375, 0.5269241333007812, 0.545074462890625, 0.5632247924804688, 0.5813751220703125, 0.5995254516601562, 0.61767578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 7.0, 6.0, 13.0, 17.0, 21.0, 40.0, 44.0, 67.0, 134.0, 251.0, 532.0, 1226.0, 4391.0, 36072.0, 970455.0, 29235.0, 3875.0, 1122.0, 445.0, 217.0, 121.0, 84.0, 43.0, 24.0, 13.0, 14.0, 16.0, 9.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.76629638671875, -5.5989990234375, -5.43170166015625, -5.264404296875, -5.09710693359375, -4.9298095703125, -4.76251220703125, -4.59521484375, -4.42791748046875, -4.2606201171875, -4.09332275390625, -3.926025390625, -3.75872802734375, -3.5914306640625, -3.42413330078125, -3.2568359375, -3.08953857421875, -2.9222412109375, -2.75494384765625, -2.587646484375, -2.42034912109375, -2.2530517578125, -2.08575439453125, -1.91845703125, -1.75115966796875, -1.5838623046875, -1.41656494140625, -1.249267578125, -1.08197021484375, -0.9146728515625, -0.74737548828125, -0.580078125, -0.41278076171875, -0.2454833984375, -0.07818603515625, 0.089111328125, 0.25640869140625, 0.4237060546875, 0.59100341796875, 0.75830078125, 0.92559814453125, 1.0928955078125, 1.26019287109375, 1.427490234375, 1.59478759765625, 1.7620849609375, 1.92938232421875, 2.0966796875, 2.26397705078125, 2.4312744140625, 2.59857177734375, 2.765869140625, 2.93316650390625, 3.1004638671875, 3.26776123046875, 3.43505859375, 3.60235595703125, 3.7696533203125, 3.93695068359375, 4.104248046875, 4.27154541015625, 4.4388427734375, 4.60614013671875, 4.7734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 9.0, 4.0, 15.0, 22.0, 39.0, 66.0, 125.0, 333.0, 203.0, 58.0, 36.0, 26.0, 12.0, 8.0, 12.0, 8.0, 9.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001201629638671875, -0.001156628131866455, -0.0011116266250610352, -0.0010666251182556152, -0.0010216236114501953, -0.0009766221046447754, -0.0009316205978393555, -0.0008866190910339355, -0.0008416175842285156, -0.0007966160774230957, -0.0007516145706176758, -0.0007066130638122559, -0.0006616115570068359, -0.000616610050201416, -0.0005716085433959961, -0.0005266070365905762, -0.00048160552978515625, -0.00043660402297973633, -0.0003916025161743164, -0.0003466010093688965, -0.00030159950256347656, -0.00025659799575805664, -0.00021159648895263672, -0.0001665949821472168, -0.00012159347534179688, -7.659196853637695e-05, -3.159046173095703e-05, 1.341104507446289e-05, 5.841255187988281e-05, 0.00010341405868530273, 0.00014841556549072266, 0.00019341707229614258, 0.0002384185791015625, 0.0002834200859069824, 0.00032842159271240234, 0.00037342309951782227, 0.0004184246063232422, 0.0004634261131286621, 0.000508427619934082, 0.000553429126739502, 0.0005984306335449219, 0.0006434321403503418, 0.0006884336471557617, 0.0007334351539611816, 0.0007784366607666016, 0.0008234381675720215, 0.0008684396743774414, 0.0009134411811828613, 0.0009584426879882812, 0.0010034441947937012, 0.001048445701599121, 0.001093447208404541, 0.001138448715209961, 0.0011834502220153809, 0.0012284517288208008, 0.0012734532356262207, 0.0013184547424316406, 0.0013634562492370605, 0.0014084577560424805, 0.0014534592628479004, 0.0014984607696533203, 0.0015434622764587402, 0.0015884637832641602, 0.00163346529006958, 0.001678466796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 15.0, 20.0, 33.0, 58.0, 126.0, 411.0, 1554.0, 8365.0, 104816.0, 886108.0, 40767.0, 4648.0, 1045.0, 296.0, 125.0, 56.0, 27.0, 18.0, 14.0, 6.0, 9.0, 4.0, 6.0, 4.0, 1.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.45977783203125, -4.3218994140625, -4.18402099609375, -4.046142578125, -3.90826416015625, -3.7703857421875, -3.63250732421875, -3.49462890625, -3.35675048828125, -3.2188720703125, -3.08099365234375, -2.943115234375, -2.80523681640625, -2.6673583984375, -2.52947998046875, -2.3916015625, -2.25372314453125, -2.1158447265625, -1.97796630859375, -1.840087890625, -1.70220947265625, -1.5643310546875, -1.42645263671875, -1.28857421875, -1.15069580078125, -1.0128173828125, -0.87493896484375, -0.737060546875, -0.59918212890625, -0.4613037109375, -0.32342529296875, -0.185546875, -0.04766845703125, 0.0902099609375, 0.22808837890625, 0.365966796875, 0.50384521484375, 0.6417236328125, 0.77960205078125, 0.91748046875, 1.05535888671875, 1.1932373046875, 1.33111572265625, 1.468994140625, 1.60687255859375, 1.7447509765625, 1.88262939453125, 2.0205078125, 2.15838623046875, 2.2962646484375, 2.43414306640625, 2.572021484375, 2.70989990234375, 2.8477783203125, 2.98565673828125, 3.12353515625, 3.26141357421875, 3.3992919921875, 3.53717041015625, 3.675048828125, 3.81292724609375, 3.9508056640625, 4.08868408203125, 4.2265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 4.0, 9.0, 15.0, 6.0, 12.0, 14.0, 27.0, 35.0, 29.0, 45.0, 62.0, 84.0, 107.0, 102.0, 90.0, 76.0, 47.0, 57.0, 24.0, 38.0, 23.0, 12.0, 14.0, 20.0, 8.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.054534912109375, -1.00946044921875, -0.964385986328125, -0.9193115234375, -0.874237060546875, -0.82916259765625, -0.784088134765625, -0.739013671875, -0.693939208984375, -0.64886474609375, -0.603790283203125, -0.5587158203125, -0.513641357421875, -0.46856689453125, -0.423492431640625, -0.37841796875, -0.333343505859375, -0.28826904296875, -0.243194580078125, -0.1981201171875, -0.153045654296875, -0.10797119140625, -0.062896728515625, -0.017822265625, 0.027252197265625, 0.07232666015625, 0.117401123046875, 0.1624755859375, 0.207550048828125, 0.25262451171875, 0.297698974609375, 0.3427734375, 0.387847900390625, 0.43292236328125, 0.477996826171875, 0.5230712890625, 0.568145751953125, 0.61322021484375, 0.658294677734375, 0.703369140625, 0.748443603515625, 0.79351806640625, 0.838592529296875, 0.8836669921875, 0.928741455078125, 0.97381591796875, 1.018890380859375, 1.06396484375, 1.109039306640625, 1.15411376953125, 1.199188232421875, 1.2442626953125, 1.289337158203125, 1.33441162109375, 1.379486083984375, 1.424560546875, 1.469635009765625, 1.51470947265625, 1.559783935546875, 1.6048583984375, 1.649932861328125, 1.69500732421875, 1.740081787109375, 1.78515625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 17.0, 29.0, 56.0, 110.0, 220.0, 236.0, 165.0, 74.0, 31.0, 18.0, 14.0, 2.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.573041915893555, -8.245044708251953, -7.917048454284668, -7.589051246643066, -7.261054515838623, -6.93305778503418, -6.605061054229736, -6.277064323425293, -5.949067115783691, -5.621070384979248, -5.293073654174805, -4.965076446533203, -4.63707971572876, -4.309082984924316, -3.981086254119873, -3.6530892848968506, -3.3250927925109863, -2.997096061706543, -2.6690990924835205, -2.341102361679077, -2.0131053924560547, -1.6851086616516113, -1.357111930847168, -1.0291149616241455, -0.7011182308197021, -0.3731214106082916, -0.045124590396881104, 0.28287220001220703, 0.6108690500259399, 0.9388659000396729, 1.2668626308441162, 1.5948596000671387, 1.922856330871582, 2.2508530616760254, 2.578850030899048, 2.906846761703491, 3.2348437309265137, 3.562840461730957, 3.8908371925354004, 4.218833923339844, 4.546831130981445, 4.874827861785889, 5.202824592590332, 5.530821800231934, 5.858818531036377, 6.18681526184082, 6.514811992645264, 6.842808723449707, 7.17080545425415, 7.498802185058594, 7.826798915863037, 8.15479564666748, 8.482792854309082, 8.810789108276367, 9.138786315917969, 9.46678352355957, 9.794779777526855, 10.122776985168457, 10.450773239135742, 10.778770446777344, 11.106766700744629, 11.43476390838623, 11.762760162353516, 12.090757369995117, 12.418754577636719]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 7.0, 15.0, 21.0, 26.0, 29.0, 44.0, 61.0, 65.0, 76.0, 81.0, 78.0, 79.0, 72.0, 70.0, 62.0, 58.0, 48.0, 35.0, 24.0, 13.0, 8.0, 3.0, 5.0, 1.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.116640090942383, -5.852290630340576, -5.5879411697387695, -5.323591709136963, -5.059242248535156, -4.79489278793335, -4.530543327331543, -4.266193866729736, -4.00184440612793, -3.737494945526123, -3.4731454849243164, -3.2087960243225098, -2.944446563720703, -2.6800971031188965, -2.41574764251709, -2.151398181915283, -1.8870487213134766, -1.62269926071167, -1.3583498001098633, -1.0940003395080566, -0.82965087890625, -0.5653014183044434, -0.3009519577026367, -0.03660249710083008, 0.22774696350097656, 0.4920964241027832, 0.7564458847045898, 1.0207953453063965, 1.2851448059082031, 1.5494942665100098, 1.8138437271118164, 2.078193187713623, 2.3425416946411133, 2.60689115524292, 2.8712406158447266, 3.135590076446533, 3.39993953704834, 3.6642889976501465, 3.928638458251953, 4.19298791885376, 4.457337379455566, 4.721686840057373, 4.98603630065918, 5.250385761260986, 5.514735221862793, 5.7790846824646, 6.043434143066406, 6.307783603668213, 6.5721330642700195, 6.836482524871826, 7.100831985473633, 7.3651814460754395, 7.629530906677246, 7.893880367279053, 8.15822982788086, 8.422578811645508, 8.686928749084473, 8.951278686523438, 9.215627670288086, 9.479976654052734, 9.7443265914917, 10.008676528930664, 10.273025512695312, 10.537374496459961, 10.801724433898926]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 1.0, 5.0, 4.0, 6.0, 8.0, 10.0, 13.0, 4.0, 14.0, 17.0, 14.0, 37.0, 73.0, 239.0, 1520.0, 852695.0, 3337756.0, 1456.0, 206.0, 44.0, 33.0, 21.0, 14.0, 17.0, 11.0, 15.0, 10.0, 5.0, 5.0, 5.0, 0.0, 10.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-22.59375, -22.0146484375, -21.435546875, -20.8564453125, -20.27734375, -19.6982421875, -19.119140625, -18.5400390625, -17.9609375, -17.3818359375, -16.802734375, -16.2236328125, -15.64453125, -15.0654296875, -14.486328125, -13.9072265625, -13.328125, -12.7490234375, -12.169921875, -11.5908203125, -11.01171875, -10.4326171875, -9.853515625, -9.2744140625, -8.6953125, -8.1162109375, -7.537109375, -6.9580078125, -6.37890625, -5.7998046875, -5.220703125, -4.6416015625, -4.0625, -3.4833984375, -2.904296875, -2.3251953125, -1.74609375, -1.1669921875, -0.587890625, -0.0087890625, 0.5703125, 1.1494140625, 1.728515625, 2.3076171875, 2.88671875, 3.4658203125, 4.044921875, 4.6240234375, 5.203125, 5.7822265625, 6.361328125, 6.9404296875, 7.51953125, 8.0986328125, 8.677734375, 9.2568359375, 9.8359375, 10.4150390625, 10.994140625, 11.5732421875, 12.15234375, 12.7314453125, 13.310546875, 13.8896484375, 14.46875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 4.0, 10.0, 8.0, 10.0, 22.0, 23.0, 29.0, 45.0, 51.0, 53.0, 67.0, 90.0, 91.0, 94.0, 88.0, 85.0, 63.0, 33.0, 26.0, 36.0, 16.0, 13.0, 14.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.166259765625, -0.161956787109375, -0.15765380859375, -0.153350830078125, -0.1490478515625, -0.144744873046875, -0.14044189453125, -0.136138916015625, -0.1318359375, -0.127532958984375, -0.12322998046875, -0.118927001953125, -0.1146240234375, -0.110321044921875, -0.10601806640625, -0.101715087890625, -0.097412109375, -0.093109130859375, -0.08880615234375, -0.084503173828125, -0.0802001953125, -0.075897216796875, -0.07159423828125, -0.067291259765625, -0.06298828125, -0.058685302734375, -0.05438232421875, -0.050079345703125, -0.0457763671875, -0.041473388671875, -0.03717041015625, -0.032867431640625, -0.028564453125, -0.024261474609375, -0.01995849609375, -0.015655517578125, -0.0113525390625, -0.007049560546875, -0.00274658203125, 0.001556396484375, 0.005859375, 0.010162353515625, 0.01446533203125, 0.018768310546875, 0.0230712890625, 0.027374267578125, 0.03167724609375, 0.035980224609375, 0.040283203125, 0.044586181640625, 0.04888916015625, 0.053192138671875, 0.0574951171875, 0.061798095703125, 0.06610107421875, 0.070404052734375, 0.07470703125, 0.079010009765625, 0.08331298828125, 0.087615966796875, 0.0919189453125, 0.096221923828125, 0.10052490234375, 0.104827880859375, 0.109130859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [7.0, 18.0, 106.0, 1297.0, 4191839.0, 915.0, 95.0, 19.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.11328125, -3.95623779296875, -2.7991943359375, -1.64215087890625, -0.485107421875, 0.67193603515625, 1.8289794921875, 2.98602294921875, 4.14306640625, 5.30010986328125, 6.4571533203125, 7.61419677734375, 8.771240234375, 9.92828369140625, 11.0853271484375, 12.24237060546875, 13.3994140625, 14.55645751953125, 15.7135009765625, 16.87054443359375, 18.027587890625, 19.18463134765625, 20.3416748046875, 21.49871826171875, 22.65576171875, 23.81280517578125, 24.9698486328125, 26.12689208984375, 27.283935546875, 28.44097900390625, 29.5980224609375, 30.75506591796875, 31.912109375, 33.06915283203125, 34.2261962890625, 35.38323974609375, 36.540283203125, 37.69732666015625, 38.8543701171875, 40.01141357421875, 41.16845703125, 42.32550048828125, 43.4825439453125, 44.63958740234375, 45.796630859375, 46.95367431640625, 48.1107177734375, 49.26776123046875, 50.4248046875, 51.58184814453125, 52.7388916015625, 53.89593505859375, 55.052978515625, 56.21002197265625, 57.3670654296875, 58.52410888671875, 59.68115234375, 60.83819580078125, 61.9952392578125, 63.15228271484375, 64.309326171875, 65.46636962890625, 66.6234130859375, 67.78045654296875, 68.9375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 13.0, 13.0, 16.0, 22.0, 82.0, 192.0, 1426.0, 1871.0, 295.0, 76.0, 33.0, 18.0, 13.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.3010673522949219, -0.27376556396484375, -0.24646377563476562, -0.2191619873046875, -0.19186019897460938, -0.16455841064453125, -0.13725662231445312, -0.109954833984375, -0.08265304565429688, -0.05535125732421875, -0.028049468994140625, -0.0007476806640625, 0.026554107666015625, 0.05385589599609375, 0.08115768432617188, 0.10845947265625, 0.13576126098632812, 0.16306304931640625, 0.19036483764648438, 0.2176666259765625, 0.24496841430664062, 0.27227020263671875, 0.2995719909667969, 0.326873779296875, 0.3541755676269531, 0.38147735595703125, 0.4087791442871094, 0.4360809326171875, 0.4633827209472656, 0.49068450927734375, 0.5179862976074219, 0.5452880859375, 0.5725898742675781, 0.5998916625976562, 0.6271934509277344, 0.6544952392578125, 0.6817970275878906, 0.7090988159179688, 0.7364006042480469, 0.763702392578125, 0.7910041809082031, 0.8183059692382812, 0.8456077575683594, 0.8729095458984375, 0.9002113342285156, 0.9275131225585938, 0.9548149108886719, 0.98211669921875, 1.0094184875488281, 1.0367202758789062, 1.0640220642089844, 1.0913238525390625, 1.1186256408691406, 1.1459274291992188, 1.1732292175292969, 1.200531005859375, 1.2278327941894531, 1.2551345825195312, 1.2824363708496094, 1.3097381591796875, 1.3370399475097656, 1.3643417358398438, 1.3916435241699219, 1.4189453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 25.0, 987.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.354900360107422, -25.362552642822266, -22.370203018188477, -19.377853393554688, -16.38550567626953, -13.393157005310059, -10.400808334350586, -7.408458709716797, -4.416110992431641, -1.423762321472168, 1.5685863494873047, 4.560935020446777, 7.55328369140625, 10.545632362365723, 13.537981033325195, 16.530330657958984, 19.52267837524414, 22.515026092529297, 25.507375717163086, 28.499725341796875, 31.49207305908203, 34.48442077636719, 37.476768493652344, 40.469120025634766, 43.46146774291992, 46.45381546020508, 49.4461669921875, 52.438514709472656, 55.43086242675781, 58.42321014404297, 61.415557861328125, 64.40791320800781, 67.40025329589844, 70.3926010131836, 73.38494873046875, 76.3772964477539, 79.36964416503906, 82.36199951171875, 85.3543472290039, 88.34669494628906, 91.33904266357422, 94.33139038085938, 97.32373809814453, 100.31608581542969, 103.30844116210938, 106.30078887939453, 109.29313659667969, 112.28548431396484, 115.27783203125, 118.27017974853516, 121.26252746582031, 124.25487518310547, 127.24722290039062, 130.2395782470703, 133.23191833496094, 136.22427368164062, 139.21661376953125, 142.20896911621094, 145.20130920410156, 148.19366455078125, 151.18600463867188, 154.17835998535156, 157.1707000732422, 160.16305541992188, 163.15541076660156]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 13.0, 30.0, 70.0, 133.0, 201.0, 213.0, 162.0, 103.0, 49.0, 21.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.317737102508545, -6.781598091125488, -6.245459079742432, -5.709320068359375, -5.173181056976318, -4.637042045593262, -4.100903034210205, -3.5647640228271484, -3.028625011444092, -2.492486000061035, -1.9563469886779785, -1.4202079772949219, -0.8840689659118652, -0.3479299545288086, 0.18820905685424805, 0.7243480682373047, 1.2604870796203613, 1.796626091003418, 2.3327651023864746, 2.8689041137695312, 3.405043125152588, 3.9411821365356445, 4.477321147918701, 5.013460159301758, 5.5495991706848145, 6.085738182067871, 6.621877193450928, 7.158016204833984, 7.694155216217041, 8.230294227600098, 8.766433715820312, 9.302572250366211, 9.83871078491211, 10.374849319458008, 10.910988807678223, 11.447128295898438, 11.983266830444336, 12.519405364990234, 13.05554485321045, 13.591684341430664, 14.127822875976562, 14.663961410522461, 15.200100898742676, 15.73624038696289, 16.27237892150879, 16.808517456054688, 17.34465789794922, 17.880796432495117, 18.416934967041016, 18.953073501586914, 19.489212036132812, 20.025352478027344, 20.561491012573242, 21.09762954711914, 21.633769989013672, 22.16990852355957, 22.70604705810547, 23.242185592651367, 23.778324127197266, 24.314464569091797, 24.850603103637695, 25.386741638183594, 25.922882080078125, 26.459020614624023, 26.995159149169922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 7.0, 5.0, 12.0, 6.0, 20.0, 25.0, 19.0, 23.0, 34.0, 35.0, 40.0, 49.0, 63.0, 47.0, 232.0, 1033691.0, 13796.0, 62.0, 61.0, 56.0, 41.0, 33.0, 36.0, 28.0, 17.0, 18.0, 21.0, 16.0, 8.0, 10.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.15625, -26.1025390625, -25.048828125, -23.9951171875, -22.94140625, -21.8876953125, -20.833984375, -19.7802734375, -18.7265625, -17.6728515625, -16.619140625, -15.5654296875, -14.51171875, -13.4580078125, -12.404296875, -11.3505859375, -10.296875, -9.2431640625, -8.189453125, -7.1357421875, -6.08203125, -5.0283203125, -3.974609375, -2.9208984375, -1.8671875, -0.8134765625, 0.240234375, 1.2939453125, 2.34765625, 3.4013671875, 4.455078125, 5.5087890625, 6.5625, 7.6162109375, 8.669921875, 9.7236328125, 10.77734375, 11.8310546875, 12.884765625, 13.9384765625, 14.9921875, 16.0458984375, 17.099609375, 18.1533203125, 19.20703125, 20.2607421875, 21.314453125, 22.3681640625, 23.421875, 24.4755859375, 25.529296875, 26.5830078125, 27.63671875, 28.6904296875, 29.744140625, 30.7978515625, 31.8515625, 32.9052734375, 33.958984375, 35.0126953125, 36.06640625, 37.1201171875, 38.173828125, 39.2275390625, 40.28125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 21.0, 199.0, 650.0, 139.0, 10.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.2534675598144531, -0.15073394775390625, -0.048000335693359375, 0.0547332763671875, 0.15746688842773438, 0.26020050048828125, 0.3629341125488281, 0.465667724609375, 0.5684013366699219, 0.6711349487304688, 0.7738685607910156, 0.8766021728515625, 0.9793357849121094, 1.0820693969726562, 1.1848030090332031, 1.28753662109375, 1.3902702331542969, 1.4930038452148438, 1.5957374572753906, 1.6984710693359375, 1.8012046813964844, 1.9039382934570312, 2.006671905517578, 2.109405517578125, 2.212139129638672, 2.3148727416992188, 2.4176063537597656, 2.5203399658203125, 2.6230735778808594, 2.7258071899414062, 2.828540802001953, 2.9312744140625, 3.034008026123047, 3.1367416381835938, 3.2394752502441406, 3.3422088623046875, 3.4449424743652344, 3.5476760864257812, 3.650409698486328, 3.753143310546875, 3.855876922607422, 3.9586105346679688, 4.061344146728516, 4.1640777587890625, 4.266811370849609, 4.369544982910156, 4.472278594970703, 4.57501220703125, 4.677745819091797, 4.780479431152344, 4.883213043212891, 4.9859466552734375, 5.088680267333984, 5.191413879394531, 5.294147491455078, 5.396881103515625, 5.499614715576172, 5.602348327636719, 5.705081939697266, 5.8078155517578125, 5.910549163818359, 6.013282775878906, 6.116016387939453, 6.21875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 7.0, 9.0, 9.0, 14.0, 19.0, 23.0, 28.0, 43.0, 51.0, 81.0, 116.0, 144.0, 234.0, 409.0, 679.0, 1189.0, 2437.0, 5390.0, 14163.0, 43584.0, 205735.0, 608361.0, 117077.0, 29538.0, 10362.0, 4252.0, 1990.0, 978.0, 546.0, 346.0, 193.0, 147.0, 104.0, 72.0, 60.0, 29.0, 26.0, 33.0, 20.0, 19.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.15625, -4.996826171875, -4.83740234375, -4.677978515625, -4.5185546875, -4.359130859375, -4.19970703125, -4.040283203125, -3.880859375, -3.721435546875, -3.56201171875, -3.402587890625, -3.2431640625, -3.083740234375, -2.92431640625, -2.764892578125, -2.60546875, -2.446044921875, -2.28662109375, -2.127197265625, -1.9677734375, -1.808349609375, -1.64892578125, -1.489501953125, -1.330078125, -1.170654296875, -1.01123046875, -0.851806640625, -0.6923828125, -0.532958984375, -0.37353515625, -0.214111328125, -0.0546875, 0.104736328125, 0.26416015625, 0.423583984375, 0.5830078125, 0.742431640625, 0.90185546875, 1.061279296875, 1.220703125, 1.380126953125, 1.53955078125, 1.698974609375, 1.8583984375, 2.017822265625, 2.17724609375, 2.336669921875, 2.49609375, 2.655517578125, 2.81494140625, 2.974365234375, 3.1337890625, 3.293212890625, 3.45263671875, 3.612060546875, 3.771484375, 3.930908203125, 4.09033203125, 4.249755859375, 4.4091796875, 4.568603515625, 4.72802734375, 4.887451171875, 5.046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 4.0, 7.0, 9.0, 7.0, 14.0, 13.0, 20.0, 26.0, 22.0, 42.0, 27.0, 47.0, 64.0, 80.0, 66.0, 79.0, 52.0, 74.0, 58.0, 62.0, 45.0, 36.0, 32.0, 31.0, 9.0, 14.0, 14.0, 12.0, 9.0, 13.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.1221923828125, -4.974853515625, -4.8275146484375, -4.68017578125, -4.5328369140625, -4.385498046875, -4.2381591796875, -4.0908203125, -3.9434814453125, -3.796142578125, -3.6488037109375, -3.50146484375, -3.3541259765625, -3.206787109375, -3.0594482421875, -2.912109375, -2.7647705078125, -2.617431640625, -2.4700927734375, -2.32275390625, -2.1754150390625, -2.028076171875, -1.8807373046875, -1.7333984375, -1.5860595703125, -1.438720703125, -1.2913818359375, -1.14404296875, -0.9967041015625, -0.849365234375, -0.7020263671875, -0.5546875, -0.4073486328125, -0.260009765625, -0.1126708984375, 0.03466796875, 0.1820068359375, 0.329345703125, 0.4766845703125, 0.6240234375, 0.7713623046875, 0.918701171875, 1.0660400390625, 1.21337890625, 1.3607177734375, 1.508056640625, 1.6553955078125, 1.802734375, 1.9500732421875, 2.097412109375, 2.2447509765625, 2.39208984375, 2.5394287109375, 2.686767578125, 2.8341064453125, 2.9814453125, 3.1287841796875, 3.276123046875, 3.4234619140625, 3.57080078125, 3.7181396484375, 3.865478515625, 4.0128173828125, 4.16015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 2.0, 9.0, 4.0, 11.0, 15.0, 17.0, 22.0, 35.0, 64.0, 104.0, 176.0, 398.0, 840.0, 2356.0, 8967.0, 58366.0, 809017.0, 147444.0, 15055.0, 3388.0, 1152.0, 477.0, 248.0, 133.0, 84.0, 39.0, 33.0, 26.0, 22.0, 7.0, 12.0, 5.0, 7.0, 4.0, 3.0, 0.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.98046875, -6.7528076171875, -6.525146484375, -6.2974853515625, -6.06982421875, -5.8421630859375, -5.614501953125, -5.3868408203125, -5.1591796875, -4.9315185546875, -4.703857421875, -4.4761962890625, -4.24853515625, -4.0208740234375, -3.793212890625, -3.5655517578125, -3.337890625, -3.1102294921875, -2.882568359375, -2.6549072265625, -2.42724609375, -2.1995849609375, -1.971923828125, -1.7442626953125, -1.5166015625, -1.2889404296875, -1.061279296875, -0.8336181640625, -0.60595703125, -0.3782958984375, -0.150634765625, 0.0770263671875, 0.3046875, 0.5323486328125, 0.760009765625, 0.9876708984375, 1.21533203125, 1.4429931640625, 1.670654296875, 1.8983154296875, 2.1259765625, 2.3536376953125, 2.581298828125, 2.8089599609375, 3.03662109375, 3.2642822265625, 3.491943359375, 3.7196044921875, 3.947265625, 4.1749267578125, 4.402587890625, 4.6302490234375, 4.85791015625, 5.0855712890625, 5.313232421875, 5.5408935546875, 5.7685546875, 5.9962158203125, 6.223876953125, 6.4515380859375, 6.67919921875, 6.9068603515625, 7.134521484375, 7.3621826171875, 7.58984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 2.0, 6.0, 5.0, 9.0, 12.0, 26.0, 28.0, 47.0, 79.0, 148.0, 172.0, 163.0, 118.0, 67.0, 32.0, 32.0, 16.0, 10.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009374618530273438, -0.0009087696671485901, -0.0008800774812698364, -0.0008513852953910828, -0.0008226931095123291, -0.0007940009236335754, -0.0007653087377548218, -0.0007366165518760681, -0.0007079243659973145, -0.0006792321801185608, -0.0006505399942398071, -0.0006218478083610535, -0.0005931556224822998, -0.0005644634366035461, -0.0005357712507247925, -0.0005070790648460388, -0.00047838687896728516, -0.0004496946930885315, -0.00042100250720977783, -0.00039231032133102417, -0.0003636181354522705, -0.00033492594957351685, -0.0003062337636947632, -0.0002775415778160095, -0.00024884939193725586, -0.0002201572060585022, -0.00019146502017974854, -0.00016277283430099487, -0.0001340806484222412, -0.00010538846254348755, -7.669627666473389e-05, -4.8004090785980225e-05, -1.9311904907226562e-05, 9.3802809715271e-06, 3.807246685028076e-05, 6.676465272903442e-05, 9.545683860778809e-05, 0.00012414902448654175, 0.0001528412103652954, 0.00018153339624404907, 0.00021022558212280273, 0.0002389177680015564, 0.00026760995388031006, 0.0002963021397590637, 0.0003249943256378174, 0.00035368651151657104, 0.0003823786973953247, 0.00041107088327407837, 0.00043976306915283203, 0.0004684552550315857, 0.0004971474409103394, 0.000525839626789093, 0.0005545318126678467, 0.0005832239985466003, 0.000611916184425354, 0.0006406083703041077, 0.0006693005561828613, 0.000697992742061615, 0.0007266849279403687, 0.0007553771138191223, 0.000784069299697876, 0.0008127614855766296, 0.0008414536714553833, 0.000870145857334137, 0.0008988380432128906]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 5.0, 9.0, 22.0, 18.0, 29.0, 47.0, 87.0, 121.0, 261.0, 550.0, 1578.0, 5852.0, 53876.0, 938453.0, 40440.0, 4943.0, 1290.0, 510.0, 179.0, 109.0, 64.0, 33.0, 36.0, 14.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3046875, -12.85302734375, -12.4013671875, -11.94970703125, -11.498046875, -11.04638671875, -10.5947265625, -10.14306640625, -9.69140625, -9.23974609375, -8.7880859375, -8.33642578125, -7.884765625, -7.43310546875, -6.9814453125, -6.52978515625, -6.078125, -5.62646484375, -5.1748046875, -4.72314453125, -4.271484375, -3.81982421875, -3.3681640625, -2.91650390625, -2.46484375, -2.01318359375, -1.5615234375, -1.10986328125, -0.658203125, -0.20654296875, 0.2451171875, 0.69677734375, 1.1484375, 1.60009765625, 2.0517578125, 2.50341796875, 2.955078125, 3.40673828125, 3.8583984375, 4.31005859375, 4.76171875, 5.21337890625, 5.6650390625, 6.11669921875, 6.568359375, 7.02001953125, 7.4716796875, 7.92333984375, 8.375, 8.82666015625, 9.2783203125, 9.72998046875, 10.181640625, 10.63330078125, 11.0849609375, 11.53662109375, 11.98828125, 12.43994140625, 12.8916015625, 13.34326171875, 13.794921875, 14.24658203125, 14.6982421875, 15.14990234375, 15.6015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 6.0, 6.0, 15.0, 25.0, 46.0, 100.0, 219.0, 247.0, 157.0, 82.0, 26.0, 11.0, 14.0, 15.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6484375, -9.4091796875, -9.169921875, -8.9306640625, -8.69140625, -8.4521484375, -8.212890625, -7.9736328125, -7.734375, -7.4951171875, -7.255859375, -7.0166015625, -6.77734375, -6.5380859375, -6.298828125, -6.0595703125, -5.8203125, -5.5810546875, -5.341796875, -5.1025390625, -4.86328125, -4.6240234375, -4.384765625, -4.1455078125, -3.90625, -3.6669921875, -3.427734375, -3.1884765625, -2.94921875, -2.7099609375, -2.470703125, -2.2314453125, -1.9921875, -1.7529296875, -1.513671875, -1.2744140625, -1.03515625, -0.7958984375, -0.556640625, -0.3173828125, -0.078125, 0.1611328125, 0.400390625, 0.6396484375, 0.87890625, 1.1181640625, 1.357421875, 1.5966796875, 1.8359375, 2.0751953125, 2.314453125, 2.5537109375, 2.79296875, 3.0322265625, 3.271484375, 3.5107421875, 3.75, 3.9892578125, 4.228515625, 4.4677734375, 4.70703125, 4.9462890625, 5.185546875, 5.4248046875, 5.6640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 20.0, 435.0, 555.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.96212768554688, -70.01885986328125, -60.075584411621094, -50.1323127746582, -40.18904113769531, -30.245769500732422, -20.30249786376953, -10.359222412109375, -0.41595458984375, 9.52731704711914, 19.47058868408203, 29.413860321044922, 39.35713195800781, 49.3004035949707, 59.243675231933594, 69.18695068359375, 79.13021850585938, 89.073486328125, 99.01676177978516, 108.96003723144531, 118.90330505371094, 128.84657287597656, 138.78985595703125, 148.73312377929688, 158.6763916015625, 168.61965942382812, 178.56292724609375, 188.50621032714844, 198.44947814941406, 208.3927459716797, 218.33602905273438, 228.279296875, 238.2225341796875, 248.16580200195312, 258.10906982421875, 268.0523376464844, 277.99560546875, 287.93890380859375, 297.8821716308594, 307.825439453125, 317.7687072753906, 327.71197509765625, 337.6552429199219, 347.5985107421875, 357.54180908203125, 367.4850769042969, 377.4283447265625, 387.3716125488281, 397.31488037109375, 407.2581481933594, 417.201416015625, 427.1446838378906, 437.08795166015625, 447.03125, 456.9745178222656, 466.91778564453125, 476.8610534667969, 486.8043212890625, 496.7475891113281, 506.69085693359375, 516.6341552734375, 526.577392578125, 536.5206909179688, 546.4639892578125, 556.4072265625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 10.0, 10.0, 28.0, 26.0, 30.0, 45.0, 81.0, 80.0, 91.0, 114.0, 104.0, 92.0, 75.0, 52.0, 55.0, 52.0, 25.0, 13.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.575244903564453, -22.17174530029297, -20.768245697021484, -19.36474609375, -17.961246490478516, -16.55774688720703, -15.15424919128418, -13.750749588012695, -12.347249984741211, -10.943750381469727, -9.540250778198242, -8.136752128601074, -6.73325252532959, -5.3297529220581055, -3.9262542724609375, -2.522754669189453, -1.1192550659179688, 0.2842442989349365, 1.6877436637878418, 3.091242790222168, 4.494742393493652, 5.898241996765137, 7.301740646362305, 8.705240249633789, 10.108739852905273, 11.512239456176758, 12.915739059448242, 14.31923770904541, 15.722737312316895, 17.126235961914062, 18.529735565185547, 19.93323516845703, 21.33673095703125, 22.740230560302734, 24.14373016357422, 25.547229766845703, 26.950729370117188, 28.354228973388672, 29.757726669311523, 31.161226272583008, 32.564727783203125, 33.96822738647461, 35.371726989746094, 36.77522659301758, 38.17872619628906, 39.58222579956055, 40.98572540283203, 42.38922119140625, 43.792720794677734, 45.19622039794922, 46.5997200012207, 48.00321960449219, 49.40671920776367, 50.810218811035156, 52.213714599609375, 53.617218017578125, 55.020713806152344, 56.42421340942383, 57.82771301269531, 59.2312126159668, 60.63471221923828, 62.038211822509766, 63.44171142578125, 64.84520721435547, 66.24871063232422]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 64.0, 1135.0, 4191979.0, 681.0, 205.0, 115.0, 52.0, 25.0, 17.0, 7.0, 9.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -11.6982421875, -6.583984375, -1.4697265625, 3.64453125, 8.7587890625, 13.873046875, 18.9873046875, 24.1015625, 29.2158203125, 34.330078125, 39.4443359375, 44.55859375, 49.6728515625, 54.787109375, 59.9013671875, 65.015625, 70.1298828125, 75.244140625, 80.3583984375, 85.47265625, 90.5869140625, 95.701171875, 100.8154296875, 105.9296875, 111.0439453125, 116.158203125, 121.2724609375, 126.38671875, 131.5009765625, 136.615234375, 141.7294921875, 146.84375, 151.9580078125, 157.072265625, 162.1865234375, 167.30078125, 172.4150390625, 177.529296875, 182.6435546875, 187.7578125, 192.8720703125, 197.986328125, 203.1005859375, 208.21484375, 213.3291015625, 218.443359375, 223.5576171875, 228.671875, 233.7861328125, 238.900390625, 244.0146484375, 249.12890625, 254.2431640625, 259.357421875, 264.4716796875, 269.5859375, 274.7001953125, 279.814453125, 284.9287109375, 290.04296875, 295.1572265625, 300.271484375, 305.3857421875, 310.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 13.0, 98.0, 334.0, 414.0, 134.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.396026611328125, -0.27056884765625, -0.145111083984375, -0.0196533203125, 0.105804443359375, 0.23126220703125, 0.356719970703125, 0.482177734375, 0.607635498046875, 0.73309326171875, 0.858551025390625, 0.9840087890625, 1.109466552734375, 1.23492431640625, 1.360382080078125, 1.48583984375, 1.611297607421875, 1.73675537109375, 1.862213134765625, 1.9876708984375, 2.113128662109375, 2.23858642578125, 2.364044189453125, 2.489501953125, 2.614959716796875, 2.74041748046875, 2.865875244140625, 2.9913330078125, 3.116790771484375, 3.24224853515625, 3.367706298828125, 3.4931640625, 3.618621826171875, 3.74407958984375, 3.869537353515625, 3.9949951171875, 4.120452880859375, 4.24591064453125, 4.371368408203125, 4.496826171875, 4.622283935546875, 4.74774169921875, 4.873199462890625, 4.9986572265625, 5.124114990234375, 5.24957275390625, 5.375030517578125, 5.50048828125, 5.625946044921875, 5.75140380859375, 5.876861572265625, 6.0023193359375, 6.127777099609375, 6.25323486328125, 6.378692626953125, 6.504150390625, 6.629608154296875, 6.75506591796875, 6.880523681640625, 7.0059814453125, 7.131439208984375, 7.25689697265625, 7.382354736328125, 7.5078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 26.0, 53.0, 128.0, 416.0, 4322.0, 4174386.0, 13628.0, 851.0, 291.0, 124.0, 40.0, 11.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -30.48291015625, -27.8720703125, -25.26123046875, -22.650390625, -20.03955078125, -17.4287109375, -14.81787109375, -12.20703125, -9.59619140625, -6.9853515625, -4.37451171875, -1.763671875, 0.84716796875, 3.4580078125, 6.06884765625, 8.6796875, 11.29052734375, 13.9013671875, 16.51220703125, 19.123046875, 21.73388671875, 24.3447265625, 26.95556640625, 29.56640625, 32.17724609375, 34.7880859375, 37.39892578125, 40.009765625, 42.62060546875, 45.2314453125, 47.84228515625, 50.453125, 53.06396484375, 55.6748046875, 58.28564453125, 60.896484375, 63.50732421875, 66.1181640625, 68.72900390625, 71.33984375, 73.95068359375, 76.5615234375, 79.17236328125, 81.783203125, 84.39404296875, 87.0048828125, 89.61572265625, 92.2265625, 94.83740234375, 97.4482421875, 100.05908203125, 102.669921875, 105.28076171875, 107.8916015625, 110.50244140625, 113.11328125, 115.72412109375, 118.3349609375, 120.94580078125, 123.556640625, 126.16748046875, 128.7783203125, 131.38916015625, 134.0]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 10.0, 21.0, 44.0, 99.0, 445.0, 3196.0, 198.0, 33.0, 9.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69140625, -4.44842529296875, -4.2054443359375, -3.96246337890625, -3.719482421875, -3.47650146484375, -3.2335205078125, -2.99053955078125, -2.74755859375, -2.50457763671875, -2.2615966796875, -2.01861572265625, -1.775634765625, -1.53265380859375, -1.2896728515625, -1.04669189453125, -0.8037109375, -0.56072998046875, -0.3177490234375, -0.07476806640625, 0.168212890625, 0.41119384765625, 0.6541748046875, 0.89715576171875, 1.14013671875, 1.38311767578125, 1.6260986328125, 1.86907958984375, 2.112060546875, 2.35504150390625, 2.5980224609375, 2.84100341796875, 3.083984375, 3.32696533203125, 3.5699462890625, 3.81292724609375, 4.055908203125, 4.29888916015625, 4.5418701171875, 4.78485107421875, 5.02783203125, 5.27081298828125, 5.5137939453125, 5.75677490234375, 5.999755859375, 6.24273681640625, 6.4857177734375, 6.72869873046875, 6.9716796875, 7.21466064453125, 7.4576416015625, 7.70062255859375, 7.943603515625, 8.18658447265625, 8.4295654296875, 8.67254638671875, 8.91552734375, 9.15850830078125, 9.4014892578125, 9.64447021484375, 9.887451171875, 10.13043212890625, 10.3734130859375, 10.61639404296875, 10.859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 14.0, 257.0, 710.0, 25.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-126.69851684570312, -122.35978698730469, -118.02105712890625, -113.68233489990234, -109.3436050415039, -105.00487518310547, -100.66615295410156, -96.32742309570312, -91.98869323730469, -87.64996337890625, -83.31123352050781, -78.9725112915039, -74.63378143310547, -70.29505157470703, -65.95632934570312, -61.61759948730469, -57.27886962890625, -52.94013977050781, -48.60141372680664, -44.26268768310547, -39.92395782470703, -35.585227966308594, -31.246501922607422, -26.907773971557617, -22.569046020507812, -18.230318069458008, -13.891590118408203, -9.552862167358398, -5.214134216308594, -0.8754062652587891, 3.4633216857910156, 7.80204963684082, 12.140792846679688, 16.479520797729492, 20.818248748779297, 25.1569766998291, 29.495704650878906, 33.834434509277344, 38.173160552978516, 42.51188659667969, 46.850616455078125, 51.18934631347656, 55.528072357177734, 59.866798400878906, 64.20552825927734, 68.54425811767578, 72.88298034667969, 77.22171020507812, 81.56044006347656, 85.899169921875, 90.23789978027344, 94.57662200927734, 98.91535186767578, 103.25408172607422, 107.59280395507812, 111.93153381347656, 116.270263671875, 120.60899353027344, 124.94772338867188, 129.2864532470703, 133.62518310546875, 137.96389770507812, 142.30262756347656, 146.641357421875, 150.98008728027344]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 13.0, 29.0, 26.0, 62.0, 84.0, 122.0, 124.0, 121.0, 130.0, 93.0, 71.0, 55.0, 35.0, 18.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.66246795654297, -46.25364303588867, -44.84481430053711, -43.43598937988281, -42.02716064453125, -40.61833572387695, -39.209510803222656, -37.800682067871094, -36.3918571472168, -34.9830322265625, -33.57420349121094, -32.16537857055664, -30.75655174255371, -29.34772491455078, -27.938899993896484, -26.530073165893555, -25.121246337890625, -23.712419509887695, -22.303592681884766, -20.89476776123047, -19.48594093322754, -18.07711410522461, -16.668289184570312, -15.259462356567383, -13.850635528564453, -12.441808700561523, -11.03298282623291, -9.624156951904297, -8.215330123901367, -6.806503772735596, -5.397677421569824, -3.988851547241211, -2.5800247192382812, -1.1711983680725098, 0.23762798309326172, 1.6464543342590332, 3.0552806854248047, 4.464107036590576, 5.872933387756348, 7.281759262084961, 8.69058609008789, 10.09941291809082, 11.508238792419434, 12.917064666748047, 14.325891494750977, 15.734718322753906, 17.143543243408203, 18.552370071411133, 19.961196899414062, 21.370023727416992, 22.778850555419922, 24.18767547607422, 25.59650230407715, 27.005329132080078, 28.414154052734375, 29.822980880737305, 31.231807708740234, 32.64063262939453, 34.049461364746094, 35.45828628540039, 36.86711120605469, 38.27593994140625, 39.68476486206055, 41.093589782714844, 42.502418518066406]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 12.0, 14.0, 15.0, 23.0, 36.0, 41.0, 58.0, 103.0, 208.0, 688.0, 5887.0, 732693.0, 303846.0, 3875.0, 531.0, 196.0, 86.0, 51.0, 46.0, 26.0, 33.0, 20.0, 10.0, 6.0, 10.0, 3.0, 3.0, 7.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.234375, -24.297119140625, -23.35986328125, -22.422607421875, -21.4853515625, -20.548095703125, -19.61083984375, -18.673583984375, -17.736328125, -16.799072265625, -15.86181640625, -14.924560546875, -13.9873046875, -13.050048828125, -12.11279296875, -11.175537109375, -10.23828125, -9.301025390625, -8.36376953125, -7.426513671875, -6.4892578125, -5.552001953125, -4.61474609375, -3.677490234375, -2.740234375, -1.802978515625, -0.86572265625, 0.071533203125, 1.0087890625, 1.946044921875, 2.88330078125, 3.820556640625, 4.7578125, 5.695068359375, 6.63232421875, 7.569580078125, 8.5068359375, 9.444091796875, 10.38134765625, 11.318603515625, 12.255859375, 13.193115234375, 14.13037109375, 15.067626953125, 16.0048828125, 16.942138671875, 17.87939453125, 18.816650390625, 19.75390625, 20.691162109375, 21.62841796875, 22.565673828125, 23.5029296875, 24.440185546875, 25.37744140625, 26.314697265625, 27.251953125, 28.189208984375, 29.12646484375, 30.063720703125, 31.0009765625, 31.938232421875, 32.87548828125, 33.812744140625, 34.75]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 33.0, 83.0, 191.0, 282.0, 205.0, 133.0, 51.0, 13.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.348663330078125, -2.19927978515625, -2.049896240234375, -1.9005126953125, -1.751129150390625, -1.60174560546875, -1.452362060546875, -1.302978515625, -1.153594970703125, -1.00421142578125, -0.854827880859375, -0.7054443359375, -0.556060791015625, -0.40667724609375, -0.257293701171875, -0.10791015625, 0.041473388671875, 0.19085693359375, 0.340240478515625, 0.4896240234375, 0.639007568359375, 0.78839111328125, 0.937774658203125, 1.087158203125, 1.236541748046875, 1.38592529296875, 1.535308837890625, 1.6846923828125, 1.834075927734375, 1.98345947265625, 2.132843017578125, 2.2822265625, 2.431610107421875, 2.58099365234375, 2.730377197265625, 2.8797607421875, 3.029144287109375, 3.17852783203125, 3.327911376953125, 3.477294921875, 3.626678466796875, 3.77606201171875, 3.925445556640625, 4.0748291015625, 4.224212646484375, 4.37359619140625, 4.522979736328125, 4.67236328125, 4.821746826171875, 4.97113037109375, 5.120513916015625, 5.2698974609375, 5.419281005859375, 5.56866455078125, 5.718048095703125, 5.867431640625, 6.016815185546875, 6.16619873046875, 6.315582275390625, 6.4649658203125, 6.614349365234375, 6.76373291015625, 6.913116455078125, 7.0625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 12.0, 17.0, 16.0, 41.0, 50.0, 103.0, 215.0, 514.0, 1677.0, 8825.0, 140447.0, 838393.0, 51208.0, 5003.0, 1159.0, 396.0, 176.0, 105.0, 53.0, 25.0, 22.0, 20.0, 14.0, 6.0, 11.0, 4.0, 3.0, 0.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.203125, -11.8138427734375, -11.424560546875, -11.0352783203125, -10.64599609375, -10.2567138671875, -9.867431640625, -9.4781494140625, -9.0888671875, -8.6995849609375, -8.310302734375, -7.9210205078125, -7.53173828125, -7.1424560546875, -6.753173828125, -6.3638916015625, -5.974609375, -5.5853271484375, -5.196044921875, -4.8067626953125, -4.41748046875, -4.0281982421875, -3.638916015625, -3.2496337890625, -2.8603515625, -2.4710693359375, -2.081787109375, -1.6925048828125, -1.30322265625, -0.9139404296875, -0.524658203125, -0.1353759765625, 0.25390625, 0.6431884765625, 1.032470703125, 1.4217529296875, 1.81103515625, 2.2003173828125, 2.589599609375, 2.9788818359375, 3.3681640625, 3.7574462890625, 4.146728515625, 4.5360107421875, 4.92529296875, 5.3145751953125, 5.703857421875, 6.0931396484375, 6.482421875, 6.8717041015625, 7.260986328125, 7.6502685546875, 8.03955078125, 8.4288330078125, 8.818115234375, 9.2073974609375, 9.5966796875, 9.9859619140625, 10.375244140625, 10.7645263671875, 11.15380859375, 11.5430908203125, 11.932373046875, 12.3216552734375, 12.7109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 8.0, 10.0, 10.0, 13.0, 14.0, 18.0, 28.0, 42.0, 36.0, 46.0, 55.0, 65.0, 81.0, 80.0, 63.0, 53.0, 51.0, 47.0, 55.0, 51.0, 40.0, 23.0, 27.0, 20.0, 11.0, 13.0, 11.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3984375, -5.20611572265625, -5.0137939453125, -4.82147216796875, -4.629150390625, -4.43682861328125, -4.2445068359375, -4.05218505859375, -3.85986328125, -3.66754150390625, -3.4752197265625, -3.28289794921875, -3.090576171875, -2.89825439453125, -2.7059326171875, -2.51361083984375, -2.3212890625, -2.12896728515625, -1.9366455078125, -1.74432373046875, -1.552001953125, -1.35968017578125, -1.1673583984375, -0.97503662109375, -0.78271484375, -0.59039306640625, -0.3980712890625, -0.20574951171875, -0.013427734375, 0.17889404296875, 0.3712158203125, 0.56353759765625, 0.755859375, 0.94818115234375, 1.1405029296875, 1.33282470703125, 1.525146484375, 1.71746826171875, 1.9097900390625, 2.10211181640625, 2.29443359375, 2.48675537109375, 2.6790771484375, 2.87139892578125, 3.063720703125, 3.25604248046875, 3.4483642578125, 3.64068603515625, 3.8330078125, 4.02532958984375, 4.2176513671875, 4.40997314453125, 4.602294921875, 4.79461669921875, 4.9869384765625, 5.17926025390625, 5.37158203125, 5.56390380859375, 5.7562255859375, 5.94854736328125, 6.140869140625, 6.33319091796875, 6.5255126953125, 6.71783447265625, 6.91015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 19.0, 16.0, 29.0, 48.0, 128.0, 310.0, 1058.0, 6425.0, 245905.0, 780795.0, 11520.0, 1561.0, 430.0, 164.0, 61.0, 35.0, 18.0, 7.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.3311767578125, -9.842041015625, -9.3529052734375, -8.86376953125, -8.3746337890625, -7.885498046875, -7.3963623046875, -6.9072265625, -6.4180908203125, -5.928955078125, -5.4398193359375, -4.95068359375, -4.4615478515625, -3.972412109375, -3.4832763671875, -2.994140625, -2.5050048828125, -2.015869140625, -1.5267333984375, -1.03759765625, -0.5484619140625, -0.059326171875, 0.4298095703125, 0.9189453125, 1.4080810546875, 1.897216796875, 2.3863525390625, 2.87548828125, 3.3646240234375, 3.853759765625, 4.3428955078125, 4.83203125, 5.3211669921875, 5.810302734375, 6.2994384765625, 6.78857421875, 7.2777099609375, 7.766845703125, 8.2559814453125, 8.7451171875, 9.2342529296875, 9.723388671875, 10.2125244140625, 10.70166015625, 11.1907958984375, 11.679931640625, 12.1690673828125, 12.658203125, 13.1473388671875, 13.636474609375, 14.1256103515625, 14.61474609375, 15.1038818359375, 15.593017578125, 16.0821533203125, 16.5712890625, 17.0604248046875, 17.549560546875, 18.0386962890625, 18.52783203125, 19.0169677734375, 19.506103515625, 19.9952392578125, 20.484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 11.0, 21.0, 29.0, 55.0, 102.0, 177.0, 231.0, 156.0, 100.0, 44.0, 24.0, 15.0, 7.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009379386901855469, -0.0008939877152442932, -0.0008500367403030396, -0.0008060857653617859, -0.0007621347904205322, -0.0007181838154792786, -0.0006742328405380249, -0.0006302818655967712, -0.0005863308906555176, -0.0005423799157142639, -0.0004984289407730103, -0.0004544779658317566, -0.00041052699089050293, -0.00036657601594924927, -0.0003226250410079956, -0.00027867406606674194, -0.00023472309112548828, -0.00019077211618423462, -0.00014682114124298096, -0.0001028701663017273, -5.891919136047363e-05, -1.496821641921997e-05, 2.898275852203369e-05, 7.293373346328735e-05, 0.00011688470840454102, 0.00016083568334579468, 0.00020478665828704834, 0.000248737633228302, 0.00029268860816955566, 0.0003366395831108093, 0.000380590558052063, 0.00042454153299331665, 0.0004684925079345703, 0.000512443482875824, 0.0005563944578170776, 0.0006003454327583313, 0.000644296407699585, 0.0006882473826408386, 0.0007321983575820923, 0.000776149332523346, 0.0008201003074645996, 0.0008640512824058533, 0.0009080022573471069, 0.0009519532322883606, 0.0009959042072296143, 0.001039855182170868, 0.0010838061571121216, 0.0011277571320533752, 0.001171708106994629, 0.0012156590819358826, 0.0012596100568771362, 0.00130356103181839, 0.0013475120067596436, 0.0013914629817008972, 0.0014354139566421509, 0.0014793649315834045, 0.0015233159065246582, 0.0015672668814659119, 0.0016112178564071655, 0.0016551688313484192, 0.0016991198062896729, 0.0017430707812309265, 0.0017870217561721802, 0.0018309727311134338, 0.0018749237060546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 9.0, 12.0, 25.0, 43.0, 77.0, 136.0, 288.0, 648.0, 2290.0, 12767.0, 222210.0, 764952.0, 38547.0, 4728.0, 1096.0, 348.0, 168.0, 83.0, 49.0, 27.0, 14.0, 12.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.1796875, -12.84375, -12.5078125, -12.171875, -11.8359375, -11.5, -11.1640625, -10.828125, -10.4921875, -10.15625, -9.8203125, -9.484375, -9.1484375, -8.8125, -8.4765625, -8.140625, -7.8046875, -7.46875, -7.1328125, -6.796875, -6.4609375, -6.125, -5.7890625, -5.453125, -5.1171875, -4.78125, -4.4453125, -4.109375, -3.7734375, -3.4375, -3.1015625, -2.765625, -2.4296875, -2.09375, -1.7578125, -1.421875, -1.0859375, -0.75, -0.4140625, -0.078125, 0.2578125, 0.59375, 0.9296875, 1.265625, 1.6015625, 1.9375, 2.2734375, 2.609375, 2.9453125, 3.28125, 3.6171875, 3.953125, 4.2890625, 4.625, 4.9609375, 5.296875, 5.6328125, 5.96875, 6.3046875, 6.640625, 6.9765625, 7.3125, 7.6484375, 7.984375, 8.3203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 9.0, 6.0, 7.0, 14.0, 19.0, 28.0, 42.0, 57.0, 85.0, 113.0, 125.0, 149.0, 119.0, 59.0, 55.0, 41.0, 24.0, 10.0, 7.0, 12.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.296875, -5.1453857421875, -4.993896484375, -4.8424072265625, -4.69091796875, -4.5394287109375, -4.387939453125, -4.2364501953125, -4.0849609375, -3.9334716796875, -3.781982421875, -3.6304931640625, -3.47900390625, -3.3275146484375, -3.176025390625, -3.0245361328125, -2.873046875, -2.7215576171875, -2.570068359375, -2.4185791015625, -2.26708984375, -2.1156005859375, -1.964111328125, -1.8126220703125, -1.6611328125, -1.5096435546875, -1.358154296875, -1.2066650390625, -1.05517578125, -0.9036865234375, -0.752197265625, -0.6007080078125, -0.44921875, -0.2977294921875, -0.146240234375, 0.0052490234375, 0.15673828125, 0.3082275390625, 0.459716796875, 0.6112060546875, 0.7626953125, 0.9141845703125, 1.065673828125, 1.2171630859375, 1.36865234375, 1.5201416015625, 1.671630859375, 1.8231201171875, 1.974609375, 2.1260986328125, 2.277587890625, 2.4290771484375, 2.58056640625, 2.7320556640625, 2.883544921875, 3.0350341796875, 3.1865234375, 3.3380126953125, 3.489501953125, 3.6409912109375, 3.79248046875, 3.9439697265625, 4.095458984375, 4.2469482421875, 4.3984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 11.0, 15.0, 29.0, 129.0, 494.0, 268.0, 59.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.02476501464844, -106.33174133300781, -102.63872528076172, -98.94570922851562, -95.252685546875, -91.55966186523438, -87.86664581298828, -84.17362976074219, -80.48060607910156, -76.78758239746094, -73.09456634521484, -69.40155029296875, -65.70852661132812, -62.015506744384766, -58.322486877441406, -54.62946701049805, -50.93644714355469, -47.24342727661133, -43.55040740966797, -39.85738754272461, -36.16436767578125, -32.47134780883789, -28.77832794189453, -25.085308074951172, -21.392288208007812, -17.699268341064453, -14.006248474121094, -10.313228607177734, -6.620208740234375, -2.9271888732910156, 0.7658309936523438, 4.458850860595703, 8.151878356933594, 11.844898223876953, 15.537918090820312, 19.230937957763672, 22.92395782470703, 26.61697769165039, 30.30999755859375, 34.00301742553711, 37.69603729248047, 41.38905715942383, 45.08207702636719, 48.77509689331055, 52.468116760253906, 56.161136627197266, 59.854156494140625, 63.547176361083984, 67.24019622802734, 70.93321228027344, 74.62623596191406, 78.31925964355469, 82.01227569580078, 85.70529174804688, 89.3983154296875, 93.09133911132812, 96.78435516357422, 100.47737121582031, 104.17039489746094, 107.86341857910156, 111.55643463134766, 115.24945068359375, 118.94247436523438, 122.635498046875, 126.3285140991211]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 11.0, 9.0, 21.0, 30.0, 25.0, 31.0, 43.0, 52.0, 45.0, 61.0, 58.0, 67.0, 56.0, 49.0, 60.0, 62.0, 67.0, 53.0, 33.0, 21.0, 33.0, 15.0, 25.0, 19.0, 9.0, 13.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.06242370605469, -35.8731575012207, -34.68389129638672, -33.494625091552734, -32.30535888671875, -31.1160945892334, -29.926830291748047, -28.737564086914062, -27.548297882080078, -26.359031677246094, -25.16976547241211, -23.980501174926758, -22.791234970092773, -21.60196876525879, -20.412704467773438, -19.223438262939453, -18.03417205810547, -16.844905853271484, -15.655640602111816, -14.466375350952148, -13.277109146118164, -12.08784294128418, -10.898577690124512, -9.709312438964844, -8.52004623413086, -7.330780506134033, -6.141514778137207, -4.952249050140381, -3.7629833221435547, -2.5737175941467285, -1.3844518661499023, -0.19518661499023438, 0.9940757751464844, 2.1833415031433105, 3.3726072311401367, 4.561872959136963, 5.751138687133789, 6.940404415130615, 8.129670143127441, 9.31893539428711, 10.508201599121094, 11.697467803955078, 12.886733055114746, 14.075998306274414, 15.265264511108398, 16.454530715942383, 17.643795013427734, 18.83306121826172, 20.022327423095703, 21.211593627929688, 22.400859832763672, 23.590124130249023, 24.779390335083008, 25.968656539916992, 27.157920837402344, 28.347187042236328, 29.536453247070312, 30.725719451904297, 31.91498565673828, 33.104251861572266, 34.29351806640625, 35.48278045654297, 36.67204666137695, 37.86131286621094, 39.05057907104492]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 8.0, 25.0, 57.0, 207.0, 805.0, 6051.0, 333684.0, 3840772.0, 10285.0, 1270.0, 383.0, 181.0, 121.0, 93.0, 71.0, 45.0, 38.0, 33.0, 32.0, 20.0, 15.0, 17.0, 11.0, 10.0, 10.0, 3.0, 6.0, 6.0, 7.0, 2.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -9.65966796875, -8.6005859375, -7.54150390625, -6.482421875, -5.42333984375, -4.3642578125, -3.30517578125, -2.24609375, -1.18701171875, -0.1279296875, 0.93115234375, 1.990234375, 3.04931640625, 4.1083984375, 5.16748046875, 6.2265625, 7.28564453125, 8.3447265625, 9.40380859375, 10.462890625, 11.52197265625, 12.5810546875, 13.64013671875, 14.69921875, 15.75830078125, 16.8173828125, 17.87646484375, 18.935546875, 19.99462890625, 21.0537109375, 22.11279296875, 23.171875, 24.23095703125, 25.2900390625, 26.34912109375, 27.408203125, 28.46728515625, 29.5263671875, 30.58544921875, 31.64453125, 32.70361328125, 33.7626953125, 34.82177734375, 35.880859375, 36.93994140625, 37.9990234375, 39.05810546875, 40.1171875, 41.17626953125, 42.2353515625, 43.29443359375, 44.353515625, 45.41259765625, 46.4716796875, 47.53076171875, 48.58984375, 49.64892578125, 50.7080078125, 51.76708984375, 52.826171875, 53.88525390625, 54.9443359375, 56.00341796875, 57.0625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 16.0, 49.0, 83.0, 209.0, 240.0, 215.0, 127.0, 47.0, 14.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.611328125, -1.460174560546875, -1.30902099609375, -1.157867431640625, -1.0067138671875, -0.855560302734375, -0.70440673828125, -0.553253173828125, -0.402099609375, -0.250946044921875, -0.09979248046875, 0.051361083984375, 0.2025146484375, 0.353668212890625, 0.50482177734375, 0.655975341796875, 0.80712890625, 0.958282470703125, 1.10943603515625, 1.260589599609375, 1.4117431640625, 1.562896728515625, 1.71405029296875, 1.865203857421875, 2.016357421875, 2.167510986328125, 2.31866455078125, 2.469818115234375, 2.6209716796875, 2.772125244140625, 2.92327880859375, 3.074432373046875, 3.2255859375, 3.376739501953125, 3.52789306640625, 3.679046630859375, 3.8302001953125, 3.981353759765625, 4.13250732421875, 4.283660888671875, 4.434814453125, 4.585968017578125, 4.73712158203125, 4.888275146484375, 5.0394287109375, 5.190582275390625, 5.34173583984375, 5.492889404296875, 5.64404296875, 5.795196533203125, 5.94635009765625, 6.097503662109375, 6.2486572265625, 6.399810791015625, 6.55096435546875, 6.702117919921875, 6.853271484375, 7.004425048828125, 7.15557861328125, 7.306732177734375, 7.4578857421875, 7.609039306640625, 7.76019287109375, 7.911346435546875, 8.0625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 15.0, 49.0, 99.0, 192.0, 778.0, 3892503.0, 298908.0, 1078.0, 332.0, 157.0, 96.0, 41.0, 17.0, 11.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.46875, -32.50244140625, -29.5361328125, -26.56982421875, -23.603515625, -20.63720703125, -17.6708984375, -14.70458984375, -11.73828125, -8.77197265625, -5.8056640625, -2.83935546875, 0.126953125, 3.09326171875, 6.0595703125, 9.02587890625, 11.9921875, 14.95849609375, 17.9248046875, 20.89111328125, 23.857421875, 26.82373046875, 29.7900390625, 32.75634765625, 35.72265625, 38.68896484375, 41.6552734375, 44.62158203125, 47.587890625, 50.55419921875, 53.5205078125, 56.48681640625, 59.453125, 62.41943359375, 65.3857421875, 68.35205078125, 71.318359375, 74.28466796875, 77.2509765625, 80.21728515625, 83.18359375, 86.14990234375, 89.1162109375, 92.08251953125, 95.048828125, 98.01513671875, 100.9814453125, 103.94775390625, 106.9140625, 109.88037109375, 112.8466796875, 115.81298828125, 118.779296875, 121.74560546875, 124.7119140625, 127.67822265625, 130.64453125, 133.61083984375, 136.5771484375, 139.54345703125, 142.509765625, 145.47607421875, 148.4423828125, 151.40869140625, 154.375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 14.0, 34.0, 77.0, 546.0, 3122.0, 229.0, 28.0, 11.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.16754150390625, -1.8702392578125, -1.57293701171875, -1.275634765625, -0.97833251953125, -0.6810302734375, -0.38372802734375, -0.08642578125, 0.21087646484375, 0.5081787109375, 0.80548095703125, 1.102783203125, 1.40008544921875, 1.6973876953125, 1.99468994140625, 2.2919921875, 2.58929443359375, 2.8865966796875, 3.18389892578125, 3.481201171875, 3.77850341796875, 4.0758056640625, 4.37310791015625, 4.67041015625, 4.96771240234375, 5.2650146484375, 5.56231689453125, 5.859619140625, 6.15692138671875, 6.4542236328125, 6.75152587890625, 7.048828125, 7.34613037109375, 7.6434326171875, 7.94073486328125, 8.238037109375, 8.53533935546875, 8.8326416015625, 9.12994384765625, 9.42724609375, 9.72454833984375, 10.0218505859375, 10.31915283203125, 10.616455078125, 10.91375732421875, 11.2110595703125, 11.50836181640625, 11.8056640625, 12.10296630859375, 12.4002685546875, 12.69757080078125, 12.994873046875, 13.29217529296875, 13.5894775390625, 13.88677978515625, 14.18408203125, 14.48138427734375, 14.7786865234375, 15.07598876953125, 15.373291015625, 15.67059326171875, 15.9678955078125, 16.26519775390625, 16.5625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 26.0, 337.0, 529.0, 74.0, 25.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.65919494628906, -71.03740692138672, -68.41561889648438, -65.79383087158203, -63.17204284667969, -60.550254821777344, -57.928462982177734, -55.30667495727539, -52.68488693237305, -50.0630989074707, -47.44131088256836, -44.819522857666016, -42.197731018066406, -39.57594299316406, -36.95415496826172, -34.332366943359375, -31.71057891845703, -29.088790893554688, -26.467002868652344, -23.845212936401367, -21.223424911499023, -18.60163688659668, -15.97984790802002, -13.35805892944336, -10.736270904541016, -8.114482879638672, -5.492693901062012, -2.8709053993225098, -0.2491168975830078, 2.372671127319336, 4.994460105895996, 7.616249084472656, 10.238037109375, 12.859825134277344, 15.481614112854004, 18.103403091430664, 20.725191116333008, 23.34697914123535, 25.968769073486328, 28.590557098388672, 31.212345123291016, 33.83413314819336, 36.4559211730957, 39.07770919799805, 41.699501037597656, 44.3212890625, 46.943077087402344, 49.56486511230469, 52.18665313720703, 54.808441162109375, 57.43022918701172, 60.05201721191406, 62.673805236816406, 65.29559326171875, 67.9173812866211, 70.53916931152344, 73.16096496582031, 75.78275299072266, 78.404541015625, 81.02632904052734, 83.64811706542969, 86.26990509033203, 88.89169311523438, 91.51348876953125, 94.13526916503906]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 11.0, 20.0, 38.0, 61.0, 70.0, 87.0, 86.0, 116.0, 120.0, 100.0, 82.0, 73.0, 38.0, 38.0, 19.0, 11.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.18561553955078, -31.13006591796875, -30.07451629638672, -29.018966674804688, -27.963417053222656, -26.907867431640625, -25.852319717407227, -24.796770095825195, -23.741220474243164, -22.685670852661133, -21.6301212310791, -20.57457160949707, -19.519023895263672, -18.46347427368164, -17.40792465209961, -16.352375030517578, -15.296825408935547, -14.241275787353516, -13.185726165771484, -12.13017749786377, -11.074627876281738, -10.019078254699707, -8.963529586791992, -7.907979965209961, -6.85243034362793, -5.796880722045898, -4.741331577301025, -3.6857821941375732, -2.630232810974121, -1.5746831893920898, -0.5191340446472168, 0.5364151000976562, 1.5919685363769531, 2.6475179195404053, 3.7030673027038574, 4.7586164474487305, 5.814166069030762, 6.869715690612793, 7.925264835357666, 8.980813980102539, 10.03636360168457, 11.091913223266602, 12.147462844848633, 13.203011512756348, 14.258561134338379, 15.31411075592041, 16.369659423828125, 17.425209045410156, 18.480758666992188, 19.53630828857422, 20.59185791015625, 21.64740753173828, 22.702957153320312, 23.758506774902344, 24.814054489135742, 25.869604110717773, 26.925153732299805, 27.980703353881836, 29.036252975463867, 30.0918025970459, 31.147350311279297, 32.20289993286133, 33.25844955444336, 34.31399917602539, 35.36954879760742]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 2.0, 6.0, 4.0, 10.0, 11.0, 15.0, 16.0, 29.0, 30.0, 33.0, 67.0, 73.0, 136.0, 273.0, 584.0, 1982.0, 13112.0, 281222.0, 715585.0, 30281.0, 3322.0, 875.0, 334.0, 178.0, 105.0, 69.0, 42.0, 30.0, 26.0, 20.0, 14.0, 13.0, 13.0, 8.0, 5.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2109375, -14.7066650390625, -14.202392578125, -13.6981201171875, -13.19384765625, -12.6895751953125, -12.185302734375, -11.6810302734375, -11.1767578125, -10.6724853515625, -10.168212890625, -9.6639404296875, -9.15966796875, -8.6553955078125, -8.151123046875, -7.6468505859375, -7.142578125, -6.6383056640625, -6.134033203125, -5.6297607421875, -5.12548828125, -4.6212158203125, -4.116943359375, -3.6126708984375, -3.1083984375, -2.6041259765625, -2.099853515625, -1.5955810546875, -1.09130859375, -0.5870361328125, -0.082763671875, 0.4215087890625, 0.92578125, 1.4300537109375, 1.934326171875, 2.4385986328125, 2.94287109375, 3.4471435546875, 3.951416015625, 4.4556884765625, 4.9599609375, 5.4642333984375, 5.968505859375, 6.4727783203125, 6.97705078125, 7.4813232421875, 7.985595703125, 8.4898681640625, 8.994140625, 9.4984130859375, 10.002685546875, 10.5069580078125, 11.01123046875, 11.5155029296875, 12.019775390625, 12.5240478515625, 13.0283203125, 13.5325927734375, 14.036865234375, 14.5411376953125, 15.04541015625, 15.5496826171875, 16.053955078125, 16.5582275390625, 17.0625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 13.0, 18.0, 37.0, 91.0, 131.0, 165.0, 184.0, 139.0, 110.0, 60.0, 32.0, 17.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.791015625, -2.638092041015625, -2.48516845703125, -2.332244873046875, -2.1793212890625, -2.026397705078125, -1.87347412109375, -1.720550537109375, -1.567626953125, -1.414703369140625, -1.26177978515625, -1.108856201171875, -0.9559326171875, -0.803009033203125, -0.65008544921875, -0.497161865234375, -0.34423828125, -0.191314697265625, -0.03839111328125, 0.114532470703125, 0.2674560546875, 0.420379638671875, 0.57330322265625, 0.726226806640625, 0.879150390625, 1.032073974609375, 1.18499755859375, 1.337921142578125, 1.4908447265625, 1.643768310546875, 1.79669189453125, 1.949615478515625, 2.1025390625, 2.255462646484375, 2.40838623046875, 2.561309814453125, 2.7142333984375, 2.867156982421875, 3.02008056640625, 3.173004150390625, 3.325927734375, 3.478851318359375, 3.63177490234375, 3.784698486328125, 3.9376220703125, 4.090545654296875, 4.24346923828125, 4.396392822265625, 4.54931640625, 4.702239990234375, 4.85516357421875, 5.008087158203125, 5.1610107421875, 5.313934326171875, 5.46685791015625, 5.619781494140625, 5.772705078125, 5.925628662109375, 6.07855224609375, 6.231475830078125, 6.3843994140625, 6.537322998046875, 6.69024658203125, 6.843170166015625, 6.99609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 15.0, 8.0, 15.0, 20.0, 45.0, 60.0, 99.0, 166.0, 297.0, 523.0, 1339.0, 4019.0, 18336.0, 153019.0, 718053.0, 130199.0, 16108.0, 3777.0, 1255.0, 540.0, 237.0, 133.0, 81.0, 48.0, 47.0, 32.0, 19.0, 17.0, 6.0, 12.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.2890625, -10.9794921875, -10.669921875, -10.3603515625, -10.05078125, -9.7412109375, -9.431640625, -9.1220703125, -8.8125, -8.5029296875, -8.193359375, -7.8837890625, -7.57421875, -7.2646484375, -6.955078125, -6.6455078125, -6.3359375, -6.0263671875, -5.716796875, -5.4072265625, -5.09765625, -4.7880859375, -4.478515625, -4.1689453125, -3.859375, -3.5498046875, -3.240234375, -2.9306640625, -2.62109375, -2.3115234375, -2.001953125, -1.6923828125, -1.3828125, -1.0732421875, -0.763671875, -0.4541015625, -0.14453125, 0.1650390625, 0.474609375, 0.7841796875, 1.09375, 1.4033203125, 1.712890625, 2.0224609375, 2.33203125, 2.6416015625, 2.951171875, 3.2607421875, 3.5703125, 3.8798828125, 4.189453125, 4.4990234375, 4.80859375, 5.1181640625, 5.427734375, 5.7373046875, 6.046875, 6.3564453125, 6.666015625, 6.9755859375, 7.28515625, 7.5947265625, 7.904296875, 8.2138671875, 8.5234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 2.0, 15.0, 13.0, 17.0, 18.0, 20.0, 22.0, 36.0, 38.0, 35.0, 47.0, 53.0, 52.0, 52.0, 56.0, 52.0, 55.0, 57.0, 52.0, 44.0, 48.0, 32.0, 22.0, 22.0, 28.0, 21.0, 16.0, 13.0, 11.0, 10.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.4453125, -8.20550537109375, -7.9656982421875, -7.72589111328125, -7.486083984375, -7.24627685546875, -7.0064697265625, -6.76666259765625, -6.52685546875, -6.28704833984375, -6.0472412109375, -5.80743408203125, -5.567626953125, -5.32781982421875, -5.0880126953125, -4.84820556640625, -4.6083984375, -4.36859130859375, -4.1287841796875, -3.88897705078125, -3.649169921875, -3.40936279296875, -3.1695556640625, -2.92974853515625, -2.68994140625, -2.45013427734375, -2.2103271484375, -1.97052001953125, -1.730712890625, -1.49090576171875, -1.2510986328125, -1.01129150390625, -0.771484375, -0.53167724609375, -0.2918701171875, -0.05206298828125, 0.187744140625, 0.42755126953125, 0.6673583984375, 0.90716552734375, 1.14697265625, 1.38677978515625, 1.6265869140625, 1.86639404296875, 2.106201171875, 2.34600830078125, 2.5858154296875, 2.82562255859375, 3.0654296875, 3.30523681640625, 3.5450439453125, 3.78485107421875, 4.024658203125, 4.26446533203125, 4.5042724609375, 4.74407958984375, 4.98388671875, 5.22369384765625, 5.4635009765625, 5.70330810546875, 5.943115234375, 6.18292236328125, 6.4227294921875, 6.66253662109375, 6.90234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 4.0, 6.0, 19.0, 11.0, 16.0, 19.0, 34.0, 54.0, 75.0, 101.0, 137.0, 255.0, 390.0, 646.0, 1218.0, 2415.0, 5270.0, 13062.0, 37882.0, 138114.0, 449137.0, 286606.0, 74020.0, 22794.0, 8468.0, 3691.0, 1788.0, 923.0, 493.0, 312.0, 193.0, 131.0, 82.0, 53.0, 36.0, 23.0, 25.0, 13.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.431640625, -2.3551025390625, -2.278564453125, -2.2020263671875, -2.12548828125, -2.0489501953125, -1.972412109375, -1.8958740234375, -1.8193359375, -1.7427978515625, -1.666259765625, -1.5897216796875, -1.51318359375, -1.4366455078125, -1.360107421875, -1.2835693359375, -1.20703125, -1.1304931640625, -1.053955078125, -0.9774169921875, -0.90087890625, -0.8243408203125, -0.747802734375, -0.6712646484375, -0.5947265625, -0.5181884765625, -0.441650390625, -0.3651123046875, -0.28857421875, -0.2120361328125, -0.135498046875, -0.0589599609375, 0.017578125, 0.0941162109375, 0.170654296875, 0.2471923828125, 0.32373046875, 0.4002685546875, 0.476806640625, 0.5533447265625, 0.6298828125, 0.7064208984375, 0.782958984375, 0.8594970703125, 0.93603515625, 1.0125732421875, 1.089111328125, 1.1656494140625, 1.2421875, 1.3187255859375, 1.395263671875, 1.4718017578125, 1.54833984375, 1.6248779296875, 1.701416015625, 1.7779541015625, 1.8544921875, 1.9310302734375, 2.007568359375, 2.0841064453125, 2.16064453125, 2.2371826171875, 2.313720703125, 2.3902587890625, 2.466796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 18.0, 13.0, 21.0, 21.0, 28.0, 35.0, 51.0, 74.0, 96.0, 119.0, 102.0, 76.0, 84.0, 58.0, 38.0, 31.0, 20.0, 19.0, 12.0, 6.0, 10.0, 8.0, 11.0, 2.0, 6.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0006403923034667969, -0.0006243288516998291, -0.0006082653999328613, -0.0005922019481658936, -0.0005761384963989258, -0.000560075044631958, -0.0005440115928649902, -0.0005279481410980225, -0.0005118846893310547, -0.0004958212375640869, -0.00047975778579711914, -0.00046369433403015137, -0.0004476308822631836, -0.0004315674304962158, -0.00041550397872924805, -0.0003994405269622803, -0.0003833770751953125, -0.0003673136234283447, -0.00035125017166137695, -0.0003351867198944092, -0.0003191232681274414, -0.00030305981636047363, -0.00028699636459350586, -0.0002709329128265381, -0.0002548694610595703, -0.00023880600929260254, -0.00022274255752563477, -0.000206679105758667, -0.00019061565399169922, -0.00017455220222473145, -0.00015848875045776367, -0.0001424252986907959, -0.00012636184692382812, -0.00011029839515686035, -9.423494338989258e-05, -7.81714916229248e-05, -6.210803985595703e-05, -4.604458808898926e-05, -2.9981136322021484e-05, -1.3917684555053711e-05, 2.1457672119140625e-06, 1.8209218978881836e-05, 3.427267074584961e-05, 5.033612251281738e-05, 6.639957427978516e-05, 8.246302604675293e-05, 9.85264778137207e-05, 0.00011458992958068848, 0.00013065338134765625, 0.00014671683311462402, 0.0001627802848815918, 0.00017884373664855957, 0.00019490718841552734, 0.00021097064018249512, 0.0002270340919494629, 0.00024309754371643066, 0.00025916099548339844, 0.0002752244472503662, 0.000291287899017334, 0.00030735135078430176, 0.00032341480255126953, 0.0003394782543182373, 0.0003555417060852051, 0.00037160515785217285, 0.0003876686096191406]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 14.0, 16.0, 15.0, 26.0, 22.0, 41.0, 62.0, 60.0, 108.0, 151.0, 251.0, 381.0, 599.0, 1079.0, 1858.0, 3705.0, 8146.0, 19544.0, 57647.0, 203841.0, 462054.0, 197657.0, 55782.0, 19127.0, 7964.0, 3738.0, 1902.0, 1033.0, 617.0, 360.0, 252.0, 160.0, 101.0, 69.0, 51.0, 36.0, 25.0, 17.0, 9.0, 7.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.21624755859375, -2.1356201171875, -2.05499267578125, -1.974365234375, -1.89373779296875, -1.8131103515625, -1.73248291015625, -1.65185546875, -1.57122802734375, -1.4906005859375, -1.40997314453125, -1.329345703125, -1.24871826171875, -1.1680908203125, -1.08746337890625, -1.0068359375, -0.92620849609375, -0.8455810546875, -0.76495361328125, -0.684326171875, -0.60369873046875, -0.5230712890625, -0.44244384765625, -0.36181640625, -0.28118896484375, -0.2005615234375, -0.11993408203125, -0.039306640625, 0.04132080078125, 0.1219482421875, 0.20257568359375, 0.283203125, 0.36383056640625, 0.4444580078125, 0.52508544921875, 0.605712890625, 0.68634033203125, 0.7669677734375, 0.84759521484375, 0.92822265625, 1.00885009765625, 1.0894775390625, 1.17010498046875, 1.250732421875, 1.33135986328125, 1.4119873046875, 1.49261474609375, 1.5732421875, 1.65386962890625, 1.7344970703125, 1.81512451171875, 1.895751953125, 1.97637939453125, 2.0570068359375, 2.13763427734375, 2.21826171875, 2.29888916015625, 2.3795166015625, 2.46014404296875, 2.540771484375, 2.62139892578125, 2.7020263671875, 2.78265380859375, 2.86328125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 5.0, 11.0, 18.0, 17.0, 23.0, 30.0, 51.0, 56.0, 83.0, 99.0, 111.0, 109.0, 86.0, 53.0, 57.0, 46.0, 34.0, 21.0, 17.0, 16.0, 9.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.08984375, -3.005584716796875, -2.92132568359375, -2.837066650390625, -2.7528076171875, -2.668548583984375, -2.58428955078125, -2.500030517578125, -2.415771484375, -2.331512451171875, -2.24725341796875, -2.162994384765625, -2.0787353515625, -1.994476318359375, -1.91021728515625, -1.825958251953125, -1.74169921875, -1.657440185546875, -1.57318115234375, -1.488922119140625, -1.4046630859375, -1.320404052734375, -1.23614501953125, -1.151885986328125, -1.067626953125, -0.983367919921875, -0.89910888671875, -0.814849853515625, -0.7305908203125, -0.646331787109375, -0.56207275390625, -0.477813720703125, -0.3935546875, -0.309295654296875, -0.22503662109375, -0.140777587890625, -0.0565185546875, 0.027740478515625, 0.11199951171875, 0.196258544921875, 0.280517578125, 0.364776611328125, 0.44903564453125, 0.533294677734375, 0.6175537109375, 0.701812744140625, 0.78607177734375, 0.870330810546875, 0.95458984375, 1.038848876953125, 1.12310791015625, 1.207366943359375, 1.2916259765625, 1.375885009765625, 1.46014404296875, 1.544403076171875, 1.628662109375, 1.712921142578125, 1.79718017578125, 1.881439208984375, 1.9656982421875, 2.049957275390625, 2.13421630859375, 2.218475341796875, 2.302734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 17.0, 38.0, 90.0, 219.0, 343.0, 198.0, 66.0, 18.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.83872985839844, -52.29728317260742, -49.755836486816406, -47.214385986328125, -44.67293930053711, -42.131492614746094, -39.59004211425781, -37.0485954284668, -34.50714874267578, -31.965702056884766, -29.424253463745117, -26.88280487060547, -24.341358184814453, -21.799911499023438, -19.25846290588379, -16.71701431274414, -14.175567626953125, -11.634119987487793, -9.092672348022461, -6.551224708557129, -4.009777069091797, -1.4683294296264648, 1.0731182098388672, 3.6145668029785156, 6.156013488769531, 8.697461128234863, 11.238908767700195, 13.780356407165527, 16.32180404663086, 18.863250732421875, 21.404699325561523, 23.946147918701172, 26.487586975097656, 29.029033660888672, 31.57048225402832, 34.11193084716797, 36.653377532958984, 39.19482421875, 41.73627471923828, 44.2777214050293, 46.81916809082031, 49.36061477661133, 51.902061462402344, 54.443511962890625, 56.98495864868164, 59.526405334472656, 62.06785583496094, 64.60929870605469, 67.15074920654297, 69.69219970703125, 72.233642578125, 74.77509307861328, 77.31654357910156, 79.85798645019531, 82.3994369506836, 84.94088745117188, 87.48233032226562, 90.0237808227539, 92.56522369384766, 95.10667419433594, 97.64811706542969, 100.18956756591797, 102.73101806640625, 105.2724609375, 107.81391143798828]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 11.0, 15.0, 18.0, 17.0, 29.0, 22.0, 22.0, 31.0, 29.0, 43.0, 42.0, 32.0, 40.0, 56.0, 42.0, 49.0, 60.0, 45.0, 47.0, 38.0, 52.0, 38.0, 28.0, 37.0, 19.0, 22.0, 14.0, 15.0, 15.0, 12.0, 6.0, 11.0, 6.0, 6.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.94635772705078, -34.75006866455078, -33.55377960205078, -32.35749053955078, -31.161203384399414, -29.964914321899414, -28.768627166748047, -27.572338104248047, -26.376049041748047, -25.179759979248047, -23.983470916748047, -22.78718376159668, -21.59089469909668, -20.39460563659668, -19.198318481445312, -18.002029418945312, -16.805740356445312, -15.609451293945312, -14.413163185119629, -13.216875076293945, -12.020586013793945, -10.824296951293945, -9.628008842468262, -8.431720733642578, -7.235431671142578, -6.039143085479736, -4.8428544998168945, -3.6465659141540527, -2.450277328491211, -1.2539887428283691, -0.057700157165527344, 1.1385879516601562, 2.3348731994628906, 3.5311617851257324, 4.727450370788574, 5.923738956451416, 7.120027542114258, 8.316316604614258, 9.512604713439941, 10.708892822265625, 11.905181884765625, 13.101470947265625, 14.297759056091309, 15.494047164916992, 16.690336227416992, 17.886625289916992, 19.08291244506836, 20.27920150756836, 21.47549057006836, 22.67177963256836, 23.86806869506836, 25.064355850219727, 26.260644912719727, 27.456933975219727, 28.653221130371094, 29.849510192871094, 31.045799255371094, 32.242088317871094, 33.438377380371094, 34.634666442871094, 35.830955505371094, 37.02724075317383, 38.22352981567383, 39.41981887817383, 40.61610794067383]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 10.0, 12.0, 37.0, 71.0, 139.0, 334.0, 1088.0, 4989.0, 73808.0, 4073417.0, 34890.0, 3718.0, 943.0, 358.0, 162.0, 82.0, 58.0, 38.0, 30.0, 23.0, 16.0, 14.0, 9.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.503173828125, -11.74072265625, -10.978271484375, -10.2158203125, -9.453369140625, -8.69091796875, -7.928466796875, -7.166015625, -6.403564453125, -5.64111328125, -4.878662109375, -4.1162109375, -3.353759765625, -2.59130859375, -1.828857421875, -1.06640625, -0.303955078125, 0.45849609375, 1.220947265625, 1.9833984375, 2.745849609375, 3.50830078125, 4.270751953125, 5.033203125, 5.795654296875, 6.55810546875, 7.320556640625, 8.0830078125, 8.845458984375, 9.60791015625, 10.370361328125, 11.1328125, 11.895263671875, 12.65771484375, 13.420166015625, 14.1826171875, 14.945068359375, 15.70751953125, 16.469970703125, 17.232421875, 17.994873046875, 18.75732421875, 19.519775390625, 20.2822265625, 21.044677734375, 21.80712890625, 22.569580078125, 23.33203125, 24.094482421875, 24.85693359375, 25.619384765625, 26.3818359375, 27.144287109375, 27.90673828125, 28.669189453125, 29.431640625, 30.194091796875, 30.95654296875, 31.718994140625, 32.4814453125, 33.243896484375, 34.00634765625, 34.768798828125, 35.53125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 10.0, 9.0, 29.0, 59.0, 90.0, 122.0, 133.0, 156.0, 144.0, 110.0, 60.0, 41.0, 20.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.131866455078125, -1.99224853515625, -1.852630615234375, -1.7130126953125, -1.573394775390625, -1.43377685546875, -1.294158935546875, -1.154541015625, -1.014923095703125, -0.87530517578125, -0.735687255859375, -0.5960693359375, -0.456451416015625, -0.31683349609375, -0.177215576171875, -0.03759765625, 0.102020263671875, 0.24163818359375, 0.381256103515625, 0.5208740234375, 0.660491943359375, 0.80010986328125, 0.939727783203125, 1.079345703125, 1.218963623046875, 1.35858154296875, 1.498199462890625, 1.6378173828125, 1.777435302734375, 1.91705322265625, 2.056671142578125, 2.1962890625, 2.335906982421875, 2.47552490234375, 2.615142822265625, 2.7547607421875, 2.894378662109375, 3.03399658203125, 3.173614501953125, 3.313232421875, 3.452850341796875, 3.59246826171875, 3.732086181640625, 3.8717041015625, 4.011322021484375, 4.15093994140625, 4.290557861328125, 4.43017578125, 4.569793701171875, 4.70941162109375, 4.849029541015625, 4.9886474609375, 5.128265380859375, 5.26788330078125, 5.407501220703125, 5.547119140625, 5.686737060546875, 5.82635498046875, 5.965972900390625, 6.1055908203125, 6.245208740234375, 6.38482666015625, 6.524444580078125, 6.6640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 20.0, 43.0, 59.0, 90.0, 194.0, 902.0, 3775329.0, 416668.0, 690.0, 149.0, 63.0, 40.0, 16.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.5, -93.32763671875, -91.1552734375, -88.98291015625, -86.810546875, -84.63818359375, -82.4658203125, -80.29345703125, -78.12109375, -75.94873046875, -73.7763671875, -71.60400390625, -69.431640625, -67.25927734375, -65.0869140625, -62.91455078125, -60.7421875, -58.56982421875, -56.3974609375, -54.22509765625, -52.052734375, -49.88037109375, -47.7080078125, -45.53564453125, -43.36328125, -41.19091796875, -39.0185546875, -36.84619140625, -34.673828125, -32.50146484375, -30.3291015625, -28.15673828125, -25.984375, -23.81201171875, -21.6396484375, -19.46728515625, -17.294921875, -15.12255859375, -12.9501953125, -10.77783203125, -8.60546875, -6.43310546875, -4.2607421875, -2.08837890625, 0.083984375, 2.25634765625, 4.4287109375, 6.60107421875, 8.7734375, 10.94580078125, 13.1181640625, 15.29052734375, 17.462890625, 19.63525390625, 21.8076171875, 23.97998046875, 26.15234375, 28.32470703125, 30.4970703125, 32.66943359375, 34.841796875, 37.01416015625, 39.1865234375, 41.35888671875, 43.53125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 11.0, 40.0, 305.0, 3435.0, 246.0, 32.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.5625, -17.16748046875, -16.7724609375, -16.37744140625, -15.982421875, -15.58740234375, -15.1923828125, -14.79736328125, -14.40234375, -14.00732421875, -13.6123046875, -13.21728515625, -12.822265625, -12.42724609375, -12.0322265625, -11.63720703125, -11.2421875, -10.84716796875, -10.4521484375, -10.05712890625, -9.662109375, -9.26708984375, -8.8720703125, -8.47705078125, -8.08203125, -7.68701171875, -7.2919921875, -6.89697265625, -6.501953125, -6.10693359375, -5.7119140625, -5.31689453125, -4.921875, -4.52685546875, -4.1318359375, -3.73681640625, -3.341796875, -2.94677734375, -2.5517578125, -2.15673828125, -1.76171875, -1.36669921875, -0.9716796875, -0.57666015625, -0.181640625, 0.21337890625, 0.6083984375, 1.00341796875, 1.3984375, 1.79345703125, 2.1884765625, 2.58349609375, 2.978515625, 3.37353515625, 3.7685546875, 4.16357421875, 4.55859375, 4.95361328125, 5.3486328125, 5.74365234375, 6.138671875, 6.53369140625, 6.9287109375, 7.32373046875, 7.71875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 45.0, 664.0, 274.0, 18.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-90.30525207519531, -87.55488586425781, -84.80451202392578, -82.05414581298828, -79.30377197265625, -76.55340576171875, -73.80303192138672, -71.05266571044922, -68.30229187011719, -65.55192565917969, -62.801551818847656, -60.05118179321289, -57.300811767578125, -54.55044174194336, -51.800071716308594, -49.049705505371094, -46.29933547973633, -43.54896545410156, -40.7985954284668, -38.04822540283203, -35.297855377197266, -32.5474853515625, -29.797117233276367, -27.0467472076416, -24.296377182006836, -21.54600715637207, -18.795637130737305, -16.045269012451172, -13.29489803314209, -10.544528007507324, -7.794158935546875, -5.043788909912109, -2.2934188842773438, 0.4569509029388428, 3.2073206901550293, 5.957690238952637, 8.708060264587402, 11.458430290222168, 14.208799362182617, 16.959169387817383, 19.70953941345215, 22.459909439086914, 25.21027946472168, 27.960647583007812, 30.711017608642578, 33.461387634277344, 36.21175765991211, 38.962127685546875, 41.71249771118164, 44.462867736816406, 47.21323776245117, 49.96360778808594, 52.7139778137207, 55.46434783935547, 58.21471405029297, 60.965087890625, 63.7154541015625, 66.4658203125, 69.21619415283203, 71.96656036376953, 74.71693420410156, 77.46730041503906, 80.2176742553711, 82.9680404663086, 85.71841430664062]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 13.0, 26.0, 29.0, 43.0, 51.0, 76.0, 75.0, 84.0, 80.0, 82.0, 100.0, 69.0, 63.0, 66.0, 35.0, 32.0, 24.0, 14.0, 14.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.09068775177002, -13.561224937438965, -13.03176212310791, -12.502299308776855, -11.9728364944458, -11.443373680114746, -10.913909912109375, -10.38444709777832, -9.854984283447266, -9.325521469116211, -8.796058654785156, -8.266595840454102, -7.737133026123047, -7.207670211791992, -6.678206920623779, -6.148744106292725, -5.619281768798828, -5.089818954467773, -4.560356140136719, -4.030893325805664, -3.5014302730560303, -2.9719674587249756, -2.442504405975342, -1.913041591644287, -1.3835787773132324, -0.854115903377533, -0.3246530294418335, 0.20480990409851074, 0.7342727184295654, 1.2637355327606201, 1.793198585510254, 2.3226613998413086, 2.852123260498047, 3.3815860748291016, 3.9110488891601562, 4.440511703491211, 4.969974517822266, 5.49943733215332, 6.028900623321533, 6.558363437652588, 7.087826251983643, 7.617289066314697, 8.14675235748291, 8.676215171813965, 9.20567798614502, 9.735140800476074, 10.264603614807129, 10.794066429138184, 11.323529243469238, 11.852992057800293, 12.382454872131348, 12.911917686462402, 13.441380500793457, 13.970843315124512, 14.500307083129883, 15.029769897460938, 15.559232711791992, 16.088695526123047, 16.6181583404541, 17.147621154785156, 17.67708396911621, 18.206546783447266, 18.73600959777832, 19.265472412109375, 19.79493522644043]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 13.0, 10.0, 14.0, 16.0, 21.0, 33.0, 39.0, 40.0, 63.0, 139.0, 243.0, 749.0, 3339.0, 37980.0, 816001.0, 179778.0, 7897.0, 1342.0, 370.0, 146.0, 91.0, 60.0, 28.0, 39.0, 18.0, 19.0, 15.0, 11.0, 9.0, 15.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.09375, -16.5712890625, -16.048828125, -15.5263671875, -15.00390625, -14.4814453125, -13.958984375, -13.4365234375, -12.9140625, -12.3916015625, -11.869140625, -11.3466796875, -10.82421875, -10.3017578125, -9.779296875, -9.2568359375, -8.734375, -8.2119140625, -7.689453125, -7.1669921875, -6.64453125, -6.1220703125, -5.599609375, -5.0771484375, -4.5546875, -4.0322265625, -3.509765625, -2.9873046875, -2.46484375, -1.9423828125, -1.419921875, -0.8974609375, -0.375, 0.1474609375, 0.669921875, 1.1923828125, 1.71484375, 2.2373046875, 2.759765625, 3.2822265625, 3.8046875, 4.3271484375, 4.849609375, 5.3720703125, 5.89453125, 6.4169921875, 6.939453125, 7.4619140625, 7.984375, 8.5068359375, 9.029296875, 9.5517578125, 10.07421875, 10.5966796875, 11.119140625, 11.6416015625, 12.1640625, 12.6865234375, 13.208984375, 13.7314453125, 14.25390625, 14.7763671875, 15.298828125, 15.8212890625, 16.34375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 13.0, 30.0, 60.0, 83.0, 115.0, 171.0, 171.0, 138.0, 104.0, 66.0, 28.0, 16.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.893218994140625, -1.73760986328125, -1.582000732421875, -1.4263916015625, -1.270782470703125, -1.11517333984375, -0.959564208984375, -0.803955078125, -0.648345947265625, -0.49273681640625, -0.337127685546875, -0.1815185546875, -0.025909423828125, 0.12969970703125, 0.285308837890625, 0.44091796875, 0.596527099609375, 0.75213623046875, 0.907745361328125, 1.0633544921875, 1.218963623046875, 1.37457275390625, 1.530181884765625, 1.685791015625, 1.841400146484375, 1.99700927734375, 2.152618408203125, 2.3082275390625, 2.463836669921875, 2.61944580078125, 2.775054931640625, 2.9306640625, 3.086273193359375, 3.24188232421875, 3.397491455078125, 3.5531005859375, 3.708709716796875, 3.86431884765625, 4.019927978515625, 4.175537109375, 4.331146240234375, 4.48675537109375, 4.642364501953125, 4.7979736328125, 4.953582763671875, 5.10919189453125, 5.264801025390625, 5.42041015625, 5.576019287109375, 5.73162841796875, 5.887237548828125, 6.0428466796875, 6.198455810546875, 6.35406494140625, 6.509674072265625, 6.665283203125, 6.820892333984375, 6.97650146484375, 7.132110595703125, 7.2877197265625, 7.443328857421875, 7.59893798828125, 7.754547119140625, 7.91015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 5.0, 13.0, 13.0, 18.0, 39.0, 42.0, 86.0, 129.0, 252.0, 484.0, 1001.0, 2598.0, 9258.0, 58784.0, 610711.0, 325477.0, 30255.0, 5793.0, 1930.0, 768.0, 376.0, 185.0, 111.0, 61.0, 56.0, 28.0, 25.0, 9.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.5, -8.1578369140625, -7.815673828125, -7.4735107421875, -7.13134765625, -6.7891845703125, -6.447021484375, -6.1048583984375, -5.7626953125, -5.4205322265625, -5.078369140625, -4.7362060546875, -4.39404296875, -4.0518798828125, -3.709716796875, -3.3675537109375, -3.025390625, -2.6832275390625, -2.341064453125, -1.9989013671875, -1.65673828125, -1.3145751953125, -0.972412109375, -0.6302490234375, -0.2880859375, 0.0540771484375, 0.396240234375, 0.7384033203125, 1.08056640625, 1.4227294921875, 1.764892578125, 2.1070556640625, 2.44921875, 2.7913818359375, 3.133544921875, 3.4757080078125, 3.81787109375, 4.1600341796875, 4.502197265625, 4.8443603515625, 5.1865234375, 5.5286865234375, 5.870849609375, 6.2130126953125, 6.55517578125, 6.8973388671875, 7.239501953125, 7.5816650390625, 7.923828125, 8.2659912109375, 8.608154296875, 8.9503173828125, 9.29248046875, 9.6346435546875, 9.976806640625, 10.3189697265625, 10.6611328125, 11.0032958984375, 11.345458984375, 11.6876220703125, 12.02978515625, 12.3719482421875, 12.714111328125, 13.0562744140625, 13.3984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 11.0, 14.0, 16.0, 20.0, 27.0, 34.0, 42.0, 63.0, 53.0, 74.0, 67.0, 78.0, 77.0, 56.0, 91.0, 53.0, 45.0, 38.0, 33.0, 32.0, 20.0, 11.0, 11.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.6925048828125, -8.330322265625, -7.9681396484375, -7.60595703125, -7.2437744140625, -6.881591796875, -6.5194091796875, -6.1572265625, -5.7950439453125, -5.432861328125, -5.0706787109375, -4.70849609375, -4.3463134765625, -3.984130859375, -3.6219482421875, -3.259765625, -2.8975830078125, -2.535400390625, -2.1732177734375, -1.81103515625, -1.4488525390625, -1.086669921875, -0.7244873046875, -0.3623046875, -0.0001220703125, 0.362060546875, 0.7242431640625, 1.08642578125, 1.4486083984375, 1.810791015625, 2.1729736328125, 2.53515625, 2.8973388671875, 3.259521484375, 3.6217041015625, 3.98388671875, 4.3460693359375, 4.708251953125, 5.0704345703125, 5.4326171875, 5.7947998046875, 6.156982421875, 6.5191650390625, 6.88134765625, 7.2435302734375, 7.605712890625, 7.9678955078125, 8.330078125, 8.6922607421875, 9.054443359375, 9.4166259765625, 9.77880859375, 10.1409912109375, 10.503173828125, 10.8653564453125, 11.2275390625, 11.5897216796875, 11.951904296875, 12.3140869140625, 12.67626953125, 13.0384521484375, 13.400634765625, 13.7628173828125, 14.125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 8.0, 7.0, 11.0, 18.0, 25.0, 22.0, 46.0, 68.0, 88.0, 142.0, 250.0, 431.0, 814.0, 1550.0, 3511.0, 8641.0, 28148.0, 136954.0, 551360.0, 248070.0, 46475.0, 12729.0, 4773.0, 2061.0, 1027.0, 529.0, 291.0, 167.0, 110.0, 73.0, 40.0, 27.0, 22.0, 13.0, 10.0, 8.0, 8.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.541015625, -2.452392578125, -2.36376953125, -2.275146484375, -2.1865234375, -2.097900390625, -2.00927734375, -1.920654296875, -1.83203125, -1.743408203125, -1.65478515625, -1.566162109375, -1.4775390625, -1.388916015625, -1.30029296875, -1.211669921875, -1.123046875, -1.034423828125, -0.94580078125, -0.857177734375, -0.7685546875, -0.679931640625, -0.59130859375, -0.502685546875, -0.4140625, -0.325439453125, -0.23681640625, -0.148193359375, -0.0595703125, 0.029052734375, 0.11767578125, 0.206298828125, 0.294921875, 0.383544921875, 0.47216796875, 0.560791015625, 0.6494140625, 0.738037109375, 0.82666015625, 0.915283203125, 1.00390625, 1.092529296875, 1.18115234375, 1.269775390625, 1.3583984375, 1.447021484375, 1.53564453125, 1.624267578125, 1.712890625, 1.801513671875, 1.89013671875, 1.978759765625, 2.0673828125, 2.156005859375, 2.24462890625, 2.333251953125, 2.421875, 2.510498046875, 2.59912109375, 2.687744140625, 2.7763671875, 2.864990234375, 2.95361328125, 3.042236328125, 3.130859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 3.0, 14.0, 6.0, 19.0, 37.0, 55.0, 79.0, 96.0, 138.0, 149.0, 137.0, 74.0, 53.0, 48.0, 21.0, 19.0, 15.0, 6.0, 4.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005502700805664062, -0.0005293413996696472, -0.0005084127187728882, -0.00048748403787612915, -0.0004665553569793701, -0.0004456266760826111, -0.00042469799518585205, -0.000403769314289093, -0.000382840633392334, -0.00036191195249557495, -0.0003409832715988159, -0.0003200545907020569, -0.00029912590980529785, -0.0002781972289085388, -0.0002572685480117798, -0.00023633986711502075, -0.00021541118621826172, -0.00019448250532150269, -0.00017355382442474365, -0.00015262514352798462, -0.00013169646263122559, -0.00011076778173446655, -8.983910083770752e-05, -6.891041994094849e-05, -4.798173904418945e-05, -2.705305814743042e-05, -6.124377250671387e-06, 1.4804303646087646e-05, 3.573298454284668e-05, 5.666166543960571e-05, 7.759034633636475e-05, 9.851902723312378e-05, 0.00011944770812988281, 0.00014037638902664185, 0.00016130506992340088, 0.0001822337508201599, 0.00020316243171691895, 0.00022409111261367798, 0.000245019793510437, 0.00026594847440719604, 0.0002868771553039551, 0.0003078058362007141, 0.00032873451709747314, 0.0003496631979942322, 0.0003705918788909912, 0.00039152055978775024, 0.0004124492406845093, 0.0004333779215812683, 0.00045430660247802734, 0.0004752352833747864, 0.0004961639642715454, 0.0005170926451683044, 0.0005380213260650635, 0.0005589500069618225, 0.0005798786878585815, 0.0006008073687553406, 0.0006217360496520996, 0.0006426647305488586, 0.0006635934114456177, 0.0006845220923423767, 0.0007054507732391357, 0.0007263794541358948, 0.0007473081350326538, 0.0007682368159294128, 0.0007891654968261719]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 16.0, 9.0, 14.0, 38.0, 37.0, 59.0, 89.0, 151.0, 227.0, 394.0, 790.0, 1793.0, 4025.0, 10756.0, 37573.0, 193637.0, 583466.0, 165171.0, 33415.0, 9697.0, 3733.0, 1649.0, 792.0, 405.0, 212.0, 137.0, 80.0, 53.0, 44.0, 22.0, 13.0, 12.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.94921875, -3.843780517578125, -3.73834228515625, -3.632904052734375, -3.5274658203125, -3.422027587890625, -3.31658935546875, -3.211151123046875, -3.105712890625, -3.000274658203125, -2.89483642578125, -2.789398193359375, -2.6839599609375, -2.578521728515625, -2.47308349609375, -2.367645263671875, -2.26220703125, -2.156768798828125, -2.05133056640625, -1.945892333984375, -1.8404541015625, -1.735015869140625, -1.62957763671875, -1.524139404296875, -1.418701171875, -1.313262939453125, -1.20782470703125, -1.102386474609375, -0.9969482421875, -0.891510009765625, -0.78607177734375, -0.680633544921875, -0.5751953125, -0.469757080078125, -0.36431884765625, -0.258880615234375, -0.1534423828125, -0.048004150390625, 0.05743408203125, 0.162872314453125, 0.268310546875, 0.373748779296875, 0.47918701171875, 0.584625244140625, 0.6900634765625, 0.795501708984375, 0.90093994140625, 1.006378173828125, 1.11181640625, 1.217254638671875, 1.32269287109375, 1.428131103515625, 1.5335693359375, 1.639007568359375, 1.74444580078125, 1.849884033203125, 1.955322265625, 2.060760498046875, 2.16619873046875, 2.271636962890625, 2.3770751953125, 2.482513427734375, 2.58795166015625, 2.693389892578125, 2.798828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 7.0, 7.0, 9.0, 9.0, 9.0, 14.0, 27.0, 29.0, 49.0, 57.0, 61.0, 94.0, 102.0, 90.0, 100.0, 66.0, 58.0, 48.0, 45.0, 33.0, 23.0, 12.0, 14.0, 6.0, 5.0, 10.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.505859375, -3.409088134765625, -3.31231689453125, -3.215545654296875, -3.1187744140625, -3.022003173828125, -2.92523193359375, -2.828460693359375, -2.731689453125, -2.634918212890625, -2.53814697265625, -2.441375732421875, -2.3446044921875, -2.247833251953125, -2.15106201171875, -2.054290771484375, -1.95751953125, -1.860748291015625, -1.76397705078125, -1.667205810546875, -1.5704345703125, -1.473663330078125, -1.37689208984375, -1.280120849609375, -1.183349609375, -1.086578369140625, -0.98980712890625, -0.893035888671875, -0.7962646484375, -0.699493408203125, -0.60272216796875, -0.505950927734375, -0.4091796875, -0.312408447265625, -0.21563720703125, -0.118865966796875, -0.0220947265625, 0.074676513671875, 0.17144775390625, 0.268218994140625, 0.364990234375, 0.461761474609375, 0.55853271484375, 0.655303955078125, 0.7520751953125, 0.848846435546875, 0.94561767578125, 1.042388916015625, 1.13916015625, 1.235931396484375, 1.33270263671875, 1.429473876953125, 1.5262451171875, 1.623016357421875, 1.71978759765625, 1.816558837890625, 1.913330078125, 2.010101318359375, 2.10687255859375, 2.203643798828125, 2.3004150390625, 2.397186279296875, 2.49395751953125, 2.590728759765625, 2.6875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 10.0, 24.0, 64.0, 170.0, 320.0, 258.0, 95.0, 33.0, 15.0, 6.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.86557006835938, -127.0228271484375, -124.18009185791016, -121.33734893798828, -118.49461364746094, -115.65187072753906, -112.80912780761719, -109.96639251708984, -107.12364959716797, -104.2809066772461, -101.43817138671875, -98.59542846679688, -95.75269317626953, -92.90995025634766, -90.06721496582031, -87.22447204589844, -84.38172912597656, -81.53898620605469, -78.69625091552734, -75.85350799560547, -73.01077270507812, -70.16802978515625, -67.32528686523438, -64.48255157470703, -61.63981628417969, -58.79707717895508, -55.95433807373047, -53.111595153808594, -50.268856048583984, -47.426116943359375, -44.583377838134766, -41.740638732910156, -38.89789581298828, -36.05515670776367, -33.21241760253906, -30.36967658996582, -27.526935577392578, -24.68419647216797, -21.84145736694336, -18.998716354370117, -16.155977249145508, -13.313237190246582, -10.470497131347656, -7.627758026123047, -4.785017967224121, -1.9422779083251953, 0.9004611968994141, 3.7432022094726562, 6.585941314697266, 9.428681373596191, 12.271421432495117, 15.114160537719727, 17.95690155029297, 20.799640655517578, 23.642379760742188, 26.48512077331543, 29.32785987854004, 32.17060089111328, 35.01333999633789, 37.8560791015625, 40.69881820678711, 43.54155731201172, 46.384300231933594, 49.2270393371582, 52.06977844238281]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 9.0, 11.0, 8.0, 8.0, 24.0, 18.0, 16.0, 20.0, 28.0, 32.0, 32.0, 44.0, 30.0, 52.0, 47.0, 50.0, 43.0, 58.0, 43.0, 53.0, 44.0, 42.0, 33.0, 31.0, 35.0, 25.0, 24.0, 22.0, 17.0, 25.0, 13.0, 10.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.41595458984375, -37.097164154052734, -35.778377532958984, -34.45958709716797, -33.14080047607422, -31.822010040283203, -30.50322151184082, -29.184432983398438, -27.865644454956055, -26.546855926513672, -25.22806739807129, -23.909278869628906, -22.59048843383789, -21.27170181274414, -19.952911376953125, -18.634122848510742, -17.31533432006836, -15.996545791625977, -14.677757263183594, -13.358967781066895, -12.040179252624512, -10.721390724182129, -9.40260124206543, -8.083812713623047, -6.765024185180664, -5.446235656738281, -4.12744665145874, -2.8086578845977783, -1.4898691177368164, -0.1710805892944336, 1.1477084159851074, 2.4664974212646484, 3.7852859497070312, 5.104074478149414, 6.422863483428955, 7.741652488708496, 9.060441017150879, 10.379229545593262, 11.698019027709961, 13.016807556152344, 14.335596084594727, 15.65438461303711, 16.973173141479492, 18.291961669921875, 19.61075210571289, 20.92953872680664, 22.248329162597656, 23.56711769104004, 24.885906219482422, 26.204694747924805, 27.523483276367188, 28.84227180480957, 30.161060333251953, 31.47985076904297, 32.79863739013672, 34.117427825927734, 35.43621826171875, 36.755008697509766, 38.073795318603516, 39.39258575439453, 40.71137237548828, 42.0301628112793, 43.34894943237305, 44.66773986816406, 45.98652648925781]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 14.0, 24.0, 56.0, 117.0, 331.0, 972.0, 3887.0, 30998.0, 3951819.0, 192401.0, 10114.0, 2068.0, 730.0, 281.0, 157.0, 90.0, 59.0, 50.0, 29.0, 21.0, 8.0, 15.0, 7.0, 7.0, 6.0, 6.0, 6.0, 6.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.356201171875, -9.60302734375, -8.849853515625, -8.0966796875, -7.343505859375, -6.59033203125, -5.837158203125, -5.083984375, -4.330810546875, -3.57763671875, -2.824462890625, -2.0712890625, -1.318115234375, -0.56494140625, 0.188232421875, 0.94140625, 1.694580078125, 2.44775390625, 3.200927734375, 3.9541015625, 4.707275390625, 5.46044921875, 6.213623046875, 6.966796875, 7.719970703125, 8.47314453125, 9.226318359375, 9.9794921875, 10.732666015625, 11.48583984375, 12.239013671875, 12.9921875, 13.745361328125, 14.49853515625, 15.251708984375, 16.0048828125, 16.758056640625, 17.51123046875, 18.264404296875, 19.017578125, 19.770751953125, 20.52392578125, 21.277099609375, 22.0302734375, 22.783447265625, 23.53662109375, 24.289794921875, 25.04296875, 25.796142578125, 26.54931640625, 27.302490234375, 28.0556640625, 28.808837890625, 29.56201171875, 30.315185546875, 31.068359375, 31.821533203125, 32.57470703125, 33.327880859375, 34.0810546875, 34.834228515625, 35.58740234375, 36.340576171875, 37.09375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 12.0, 37.0, 55.0, 79.0, 96.0, 112.0, 131.0, 136.0, 89.0, 80.0, 67.0, 45.0, 29.0, 9.0, 9.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8024444580078125, -1.680084228515625, -1.5577239990234375, -1.43536376953125, -1.3130035400390625, -1.190643310546875, -1.0682830810546875, -0.9459228515625, -0.8235626220703125, -0.701202392578125, -0.5788421630859375, -0.45648193359375, -0.3341217041015625, -0.211761474609375, -0.0894012451171875, 0.032958984375, 0.1553192138671875, 0.277679443359375, 0.4000396728515625, 0.52239990234375, 0.6447601318359375, 0.767120361328125, 0.8894805908203125, 1.0118408203125, 1.1342010498046875, 1.256561279296875, 1.3789215087890625, 1.50128173828125, 1.6236419677734375, 1.746002197265625, 1.8683624267578125, 1.99072265625, 2.1130828857421875, 2.235443115234375, 2.3578033447265625, 2.48016357421875, 2.6025238037109375, 2.724884033203125, 2.8472442626953125, 2.9696044921875, 3.0919647216796875, 3.214324951171875, 3.3366851806640625, 3.45904541015625, 3.5814056396484375, 3.703765869140625, 3.8261260986328125, 3.948486328125, 4.0708465576171875, 4.193206787109375, 4.3155670166015625, 4.43792724609375, 4.5602874755859375, 4.682647705078125, 4.8050079345703125, 4.9273681640625, 5.0497283935546875, 5.172088623046875, 5.2944488525390625, 5.41680908203125, 5.5391693115234375, 5.661529541015625, 5.7838897705078125, 5.90625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 8.0, 4.0, 15.0, 21.0, 36.0, 53.0, 114.0, 178.0, 369.0, 807.0, 2795.0, 14211.0, 4014427.0, 150443.0, 7219.0, 2030.0, 730.0, 377.0, 182.0, 104.0, 53.0, 36.0, 26.0, 12.0, 15.0, 12.0, 3.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.46875, -27.4443359375, -26.419921875, -25.3955078125, -24.37109375, -23.3466796875, -22.322265625, -21.2978515625, -20.2734375, -19.2490234375, -18.224609375, -17.2001953125, -16.17578125, -15.1513671875, -14.126953125, -13.1025390625, -12.078125, -11.0537109375, -10.029296875, -9.0048828125, -7.98046875, -6.9560546875, -5.931640625, -4.9072265625, -3.8828125, -2.8583984375, -1.833984375, -0.8095703125, 0.21484375, 1.2392578125, 2.263671875, 3.2880859375, 4.3125, 5.3369140625, 6.361328125, 7.3857421875, 8.41015625, 9.4345703125, 10.458984375, 11.4833984375, 12.5078125, 13.5322265625, 14.556640625, 15.5810546875, 16.60546875, 17.6298828125, 18.654296875, 19.6787109375, 20.703125, 21.7275390625, 22.751953125, 23.7763671875, 24.80078125, 25.8251953125, 26.849609375, 27.8740234375, 28.8984375, 29.9228515625, 30.947265625, 31.9716796875, 32.99609375, 34.0205078125, 35.044921875, 36.0693359375, 37.09375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 5.0, 15.0, 71.0, 344.0, 3083.0, 425.0, 65.0, 25.0, 13.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76171875, -7.31964111328125, -6.8775634765625, -6.43548583984375, -5.993408203125, -5.55133056640625, -5.1092529296875, -4.66717529296875, -4.22509765625, -3.78302001953125, -3.3409423828125, -2.89886474609375, -2.456787109375, -2.01470947265625, -1.5726318359375, -1.13055419921875, -0.6884765625, -0.24639892578125, 0.1956787109375, 0.63775634765625, 1.079833984375, 1.52191162109375, 1.9639892578125, 2.40606689453125, 2.84814453125, 3.29022216796875, 3.7322998046875, 4.17437744140625, 4.616455078125, 5.05853271484375, 5.5006103515625, 5.94268798828125, 6.384765625, 6.82684326171875, 7.2689208984375, 7.71099853515625, 8.153076171875, 8.59515380859375, 9.0372314453125, 9.47930908203125, 9.92138671875, 10.36346435546875, 10.8055419921875, 11.24761962890625, 11.689697265625, 12.13177490234375, 12.5738525390625, 13.01593017578125, 13.4580078125, 13.90008544921875, 14.3421630859375, 14.78424072265625, 15.226318359375, 15.66839599609375, 16.1104736328125, 16.55255126953125, 16.99462890625, 17.43670654296875, 17.8787841796875, 18.32086181640625, 18.762939453125, 19.20501708984375, 19.6470947265625, 20.08917236328125, 20.53125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 30.0, 245.0, 559.0, 140.0, 18.0, 9.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.19833374023438, -172.62811279296875, -169.05789184570312, -165.48765563964844, -161.9174346923828, -158.3472137451172, -154.77699279785156, -151.20677185058594, -147.63653564453125, -144.06631469726562, -140.49609375, -136.9258575439453, -133.3556365966797, -129.78541564941406, -126.21519470214844, -122.64497375488281, -119.07475280761719, -115.50453186035156, -111.9343032836914, -108.36408233642578, -104.79385375976562, -101.2236328125, -97.65341186523438, -94.08319091796875, -90.5129623413086, -86.94274139404297, -83.37251281738281, -79.80229187011719, -76.23207092285156, -72.6618423461914, -69.09162139892578, -65.52139282226562, -61.95117950439453, -58.38095474243164, -54.81072998046875, -51.240509033203125, -47.670284271240234, -44.100059509277344, -40.52983856201172, -36.95961380004883, -33.38938903808594, -29.819164276123047, -26.24894142150879, -22.67871856689453, -19.10849380493164, -15.53826904296875, -11.968046188354492, -8.397823333740234, -4.827598571777344, -1.2573747634887695, 2.3128490447998047, 5.883072853088379, 9.453296661376953, 13.023521423339844, 16.5937442779541, 20.16396713256836, 23.73419189453125, 27.30441665649414, 30.8746395111084, 34.444862365722656, 38.01508712768555, 41.58531188964844, 45.15553283691406, 48.72575759887695, 52.295982360839844]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 24.0, 41.0, 82.0, 108.0, 154.0, 139.0, 141.0, 115.0, 84.0, 62.0, 24.0, 20.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.93634796142578, -56.12519073486328, -54.31403732299805, -52.50288009643555, -50.69172668457031, -48.88056945800781, -47.06941223144531, -45.25825500488281, -43.44710159301758, -41.63594436645508, -39.824790954589844, -38.013633728027344, -36.202476501464844, -34.39132308959961, -32.58016586303711, -30.769010543823242, -28.957855224609375, -27.146699905395508, -25.33554458618164, -23.52438735961914, -21.713232040405273, -19.902076721191406, -18.090919494628906, -16.27976417541504, -14.468608856201172, -12.657453536987305, -10.846297264099121, -9.035140991210938, -7.22398567199707, -5.412830352783203, -3.6016740798950195, -1.790517807006836, 0.020641326904296875, 1.8317971229553223, 3.6429529190063477, 5.454108715057373, 7.265264511108398, 9.076419830322266, 10.88757610321045, 12.698732376098633, 14.5098876953125, 16.321043014526367, 18.132198333740234, 19.943355560302734, 21.7545108795166, 23.56566619873047, 25.37682342529297, 27.187978744506836, 28.999134063720703, 30.81028938293457, 32.62144470214844, 34.43260192871094, 36.24375915527344, 38.05491256713867, 39.86606979370117, 41.677223205566406, 43.488380432128906, 45.299537658691406, 47.11069107055664, 48.92184829711914, 50.733001708984375, 52.544158935546875, 54.355316162109375, 56.166473388671875, 57.97762680053711]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 19.0, 22.0, 40.0, 83.0, 113.0, 192.0, 381.0, 871.0, 2569.0, 17615.0, 439551.0, 560303.0, 22035.0, 2875.0, 897.0, 429.0, 215.0, 115.0, 78.0, 47.0, 29.0, 20.0, 12.0, 8.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.33349609375, -15.7294921875, -15.12548828125, -14.521484375, -13.91748046875, -13.3134765625, -12.70947265625, -12.10546875, -11.50146484375, -10.8974609375, -10.29345703125, -9.689453125, -9.08544921875, -8.4814453125, -7.87744140625, -7.2734375, -6.66943359375, -6.0654296875, -5.46142578125, -4.857421875, -4.25341796875, -3.6494140625, -3.04541015625, -2.44140625, -1.83740234375, -1.2333984375, -0.62939453125, -0.025390625, 0.57861328125, 1.1826171875, 1.78662109375, 2.390625, 2.99462890625, 3.5986328125, 4.20263671875, 4.806640625, 5.41064453125, 6.0146484375, 6.61865234375, 7.22265625, 7.82666015625, 8.4306640625, 9.03466796875, 9.638671875, 10.24267578125, 10.8466796875, 11.45068359375, 12.0546875, 12.65869140625, 13.2626953125, 13.86669921875, 14.470703125, 15.07470703125, 15.6787109375, 16.28271484375, 16.88671875, 17.49072265625, 18.0947265625, 18.69873046875, 19.302734375, 19.90673828125, 20.5107421875, 21.11474609375, 21.71875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 14.0, 18.0, 44.0, 77.0, 101.0, 134.0, 142.0, 139.0, 99.0, 96.0, 60.0, 37.0, 18.0, 12.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.26171875, -3.1187744140625, -2.975830078125, -2.8328857421875, -2.68994140625, -2.5469970703125, -2.404052734375, -2.2611083984375, -2.1181640625, -1.9752197265625, -1.832275390625, -1.6893310546875, -1.54638671875, -1.4034423828125, -1.260498046875, -1.1175537109375, -0.974609375, -0.8316650390625, -0.688720703125, -0.5457763671875, -0.40283203125, -0.2598876953125, -0.116943359375, 0.0260009765625, 0.1689453125, 0.3118896484375, 0.454833984375, 0.5977783203125, 0.74072265625, 0.8836669921875, 1.026611328125, 1.1695556640625, 1.3125, 1.4554443359375, 1.598388671875, 1.7413330078125, 1.88427734375, 2.0272216796875, 2.170166015625, 2.3131103515625, 2.4560546875, 2.5989990234375, 2.741943359375, 2.8848876953125, 3.02783203125, 3.1707763671875, 3.313720703125, 3.4566650390625, 3.599609375, 3.7425537109375, 3.885498046875, 4.0284423828125, 4.17138671875, 4.3143310546875, 4.457275390625, 4.6002197265625, 4.7431640625, 4.8861083984375, 5.029052734375, 5.1719970703125, 5.31494140625, 5.4578857421875, 5.600830078125, 5.7437744140625, 5.88671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 5.0, 11.0, 15.0, 16.0, 17.0, 23.0, 37.0, 44.0, 65.0, 97.0, 148.0, 231.0, 330.0, 618.0, 1020.0, 1912.0, 3683.0, 7432.0, 15860.0, 38191.0, 101044.0, 265718.0, 351778.0, 158269.0, 57713.0, 23192.0, 10188.0, 4936.0, 2475.0, 1403.0, 762.0, 485.0, 268.0, 203.0, 99.0, 77.0, 56.0, 41.0, 20.0, 20.0, 12.0, 14.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-4.765625, -4.63031005859375, -4.4949951171875, -4.35968017578125, -4.224365234375, -4.08905029296875, -3.9537353515625, -3.81842041015625, -3.68310546875, -3.54779052734375, -3.4124755859375, -3.27716064453125, -3.141845703125, -3.00653076171875, -2.8712158203125, -2.73590087890625, -2.6005859375, -2.46527099609375, -2.3299560546875, -2.19464111328125, -2.059326171875, -1.92401123046875, -1.7886962890625, -1.65338134765625, -1.51806640625, -1.38275146484375, -1.2474365234375, -1.11212158203125, -0.976806640625, -0.84149169921875, -0.7061767578125, -0.57086181640625, -0.435546875, -0.30023193359375, -0.1649169921875, -0.02960205078125, 0.105712890625, 0.24102783203125, 0.3763427734375, 0.51165771484375, 0.64697265625, 0.78228759765625, 0.9176025390625, 1.05291748046875, 1.188232421875, 1.32354736328125, 1.4588623046875, 1.59417724609375, 1.7294921875, 1.86480712890625, 2.0001220703125, 2.13543701171875, 2.270751953125, 2.40606689453125, 2.5413818359375, 2.67669677734375, 2.81201171875, 2.94732666015625, 3.0826416015625, 3.21795654296875, 3.353271484375, 3.48858642578125, 3.6239013671875, 3.75921630859375, 3.89453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 4.0, 6.0, 8.0, 8.0, 13.0, 10.0, 17.0, 14.0, 14.0, 21.0, 33.0, 19.0, 25.0, 48.0, 30.0, 40.0, 37.0, 51.0, 51.0, 48.0, 34.0, 47.0, 38.0, 45.0, 35.0, 18.0, 30.0, 36.0, 29.0, 27.0, 18.0, 20.0, 26.0, 18.0, 14.0, 13.0, 11.0, 7.0, 3.0, 9.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.60150146484375, -5.4100341796875, -5.21856689453125, -5.027099609375, -4.83563232421875, -4.6441650390625, -4.45269775390625, -4.26123046875, -4.06976318359375, -3.8782958984375, -3.68682861328125, -3.495361328125, -3.30389404296875, -3.1124267578125, -2.92095947265625, -2.7294921875, -2.53802490234375, -2.3465576171875, -2.15509033203125, -1.963623046875, -1.77215576171875, -1.5806884765625, -1.38922119140625, -1.19775390625, -1.00628662109375, -0.8148193359375, -0.62335205078125, -0.431884765625, -0.24041748046875, -0.0489501953125, 0.14251708984375, 0.333984375, 0.52545166015625, 0.7169189453125, 0.90838623046875, 1.099853515625, 1.29132080078125, 1.4827880859375, 1.67425537109375, 1.86572265625, 2.05718994140625, 2.2486572265625, 2.44012451171875, 2.631591796875, 2.82305908203125, 3.0145263671875, 3.20599365234375, 3.3974609375, 3.58892822265625, 3.7803955078125, 3.97186279296875, 4.163330078125, 4.35479736328125, 4.5462646484375, 4.73773193359375, 4.92919921875, 5.12066650390625, 5.3121337890625, 5.50360107421875, 5.695068359375, 5.88653564453125, 6.0780029296875, 6.26947021484375, 6.4609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 5.0, 12.0, 17.0, 26.0, 31.0, 45.0, 75.0, 139.0, 233.0, 431.0, 822.0, 1794.0, 3917.0, 11253.0, 45677.0, 290369.0, 562922.0, 99355.0, 20272.0, 6249.0, 2400.0, 1104.0, 580.0, 362.0, 189.0, 88.0, 61.0, 39.0, 24.0, 20.0, 8.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.31640625, -3.222259521484375, -3.12811279296875, -3.033966064453125, -2.9398193359375, -2.845672607421875, -2.75152587890625, -2.657379150390625, -2.563232421875, -2.469085693359375, -2.37493896484375, -2.280792236328125, -2.1866455078125, -2.092498779296875, -1.99835205078125, -1.904205322265625, -1.81005859375, -1.715911865234375, -1.62176513671875, -1.527618408203125, -1.4334716796875, -1.339324951171875, -1.24517822265625, -1.151031494140625, -1.056884765625, -0.962738037109375, -0.86859130859375, -0.774444580078125, -0.6802978515625, -0.586151123046875, -0.49200439453125, -0.397857666015625, -0.3037109375, -0.209564208984375, -0.11541748046875, -0.021270751953125, 0.0728759765625, 0.167022705078125, 0.26116943359375, 0.355316162109375, 0.449462890625, 0.543609619140625, 0.63775634765625, 0.731903076171875, 0.8260498046875, 0.920196533203125, 1.01434326171875, 1.108489990234375, 1.20263671875, 1.296783447265625, 1.39093017578125, 1.485076904296875, 1.5792236328125, 1.673370361328125, 1.76751708984375, 1.861663818359375, 1.955810546875, 2.049957275390625, 2.14410400390625, 2.238250732421875, 2.3323974609375, 2.426544189453125, 2.52069091796875, 2.614837646484375, 2.708984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 2.0, 6.0, 9.0, 13.0, 16.0, 19.0, 31.0, 41.0, 62.0, 81.0, 123.0, 121.0, 121.0, 98.0, 79.0, 46.0, 25.0, 23.0, 20.0, 12.0, 11.0, 8.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005178451538085938, -0.0005037076771259308, -0.0004895702004432678, -0.00047543272376060486, -0.0004612952470779419, -0.00044715777039527893, -0.00043302029371261597, -0.000418882817029953, -0.00040474534034729004, -0.0003906078636646271, -0.0003764703869819641, -0.00036233291029930115, -0.0003481954336166382, -0.0003340579569339752, -0.00031992048025131226, -0.0003057830035686493, -0.00029164552688598633, -0.00027750805020332336, -0.0002633705735206604, -0.00024923309683799744, -0.00023509562015533447, -0.0002209581434726715, -0.00020682066679000854, -0.00019268319010734558, -0.00017854571342468262, -0.00016440823674201965, -0.0001502707600593567, -0.00013613328337669373, -0.00012199580669403076, -0.0001078583300113678, -9.372085332870483e-05, -7.958337664604187e-05, -6.54458999633789e-05, -5.130842328071594e-05, -3.717094659805298e-05, -2.3033469915390015e-05, -8.89599323272705e-06, 5.241483449935913e-06, 1.9378960132598877e-05, 3.351643681526184e-05, 4.7653913497924805e-05, 6.179139018058777e-05, 7.592886686325073e-05, 9.00663435459137e-05, 0.00010420382022857666, 0.00011834129691123962, 0.0001324787735939026, 0.00014661625027656555, 0.00016075372695922852, 0.00017489120364189148, 0.00018902868032455444, 0.0002031661570072174, 0.00021730363368988037, 0.00023144111037254333, 0.0002455785870552063, 0.00025971606373786926, 0.0002738535404205322, 0.0002879910171031952, 0.00030212849378585815, 0.0003162659704685211, 0.0003304034471511841, 0.00034454092383384705, 0.00035867840051651, 0.000372815877199173, 0.00038695335388183594]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 22.0, 14.0, 30.0, 41.0, 75.0, 111.0, 200.0, 381.0, 690.0, 1603.0, 3939.0, 11508.0, 42534.0, 279798.0, 590687.0, 86966.0, 19421.0, 6048.0, 2278.0, 1017.0, 500.0, 272.0, 150.0, 100.0, 57.0, 42.0, 19.0, 11.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.837890625, -3.71875, -3.599609375, -3.48046875, -3.361328125, -3.2421875, -3.123046875, -3.00390625, -2.884765625, -2.765625, -2.646484375, -2.52734375, -2.408203125, -2.2890625, -2.169921875, -2.05078125, -1.931640625, -1.8125, -1.693359375, -1.57421875, -1.455078125, -1.3359375, -1.216796875, -1.09765625, -0.978515625, -0.859375, -0.740234375, -0.62109375, -0.501953125, -0.3828125, -0.263671875, -0.14453125, -0.025390625, 0.09375, 0.212890625, 0.33203125, 0.451171875, 0.5703125, 0.689453125, 0.80859375, 0.927734375, 1.046875, 1.166015625, 1.28515625, 1.404296875, 1.5234375, 1.642578125, 1.76171875, 1.880859375, 2.0, 2.119140625, 2.23828125, 2.357421875, 2.4765625, 2.595703125, 2.71484375, 2.833984375, 2.953125, 3.072265625, 3.19140625, 3.310546875, 3.4296875, 3.548828125, 3.66796875, 3.787109375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 11.0, 10.0, 15.0, 8.0, 21.0, 21.0, 60.0, 57.0, 125.0, 118.0, 110.0, 112.0, 88.0, 66.0, 39.0, 34.0, 23.0, 13.0, 10.0, 10.0, 10.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.42578125, -3.3292236328125, -3.232666015625, -3.1361083984375, -3.03955078125, -2.9429931640625, -2.846435546875, -2.7498779296875, -2.6533203125, -2.5567626953125, -2.460205078125, -2.3636474609375, -2.26708984375, -2.1705322265625, -2.073974609375, -1.9774169921875, -1.880859375, -1.7843017578125, -1.687744140625, -1.5911865234375, -1.49462890625, -1.3980712890625, -1.301513671875, -1.2049560546875, -1.1083984375, -1.0118408203125, -0.915283203125, -0.8187255859375, -0.72216796875, -0.6256103515625, -0.529052734375, -0.4324951171875, -0.3359375, -0.2393798828125, -0.142822265625, -0.0462646484375, 0.05029296875, 0.1468505859375, 0.243408203125, 0.3399658203125, 0.4365234375, 0.5330810546875, 0.629638671875, 0.7261962890625, 0.82275390625, 0.9193115234375, 1.015869140625, 1.1124267578125, 1.208984375, 1.3055419921875, 1.402099609375, 1.4986572265625, 1.59521484375, 1.6917724609375, 1.788330078125, 1.8848876953125, 1.9814453125, 2.0780029296875, 2.174560546875, 2.2711181640625, 2.36767578125, 2.4642333984375, 2.560791015625, 2.6573486328125, 2.75390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 3.0, 3.0, 7.0, 11.0, 15.0, 23.0, 35.0, 66.0, 103.0, 137.0, 147.0, 154.0, 107.0, 69.0, 51.0, 23.0, 20.0, 10.0, 7.0, 7.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.71232604980469, -37.42655944824219, -36.14078903198242, -34.85502243041992, -33.569252014160156, -32.283485412597656, -30.997718811035156, -29.711950302124023, -28.42618179321289, -27.140413284301758, -25.854644775390625, -24.568878173828125, -23.283109664916992, -21.99734115600586, -20.71157455444336, -19.425806045532227, -18.140037536621094, -16.85426902770996, -15.568501472473145, -14.282733917236328, -12.996965408325195, -11.711196899414062, -10.425429344177246, -9.13966178894043, -7.853893280029297, -6.568125247955322, -5.282357215881348, -3.996589183807373, -2.7108211517333984, -1.4250531196594238, -0.13928508758544922, 1.1464824676513672, 2.4322509765625, 3.7180190086364746, 5.003787040710449, 6.289555072784424, 7.575323104858398, 8.861091613769531, 10.146859169006348, 11.432626724243164, 12.718395233154297, 14.00416374206543, 15.289931297302246, 16.575698852539062, 17.861467361450195, 19.147235870361328, 20.433002471923828, 21.71877098083496, 23.004539489746094, 24.290307998657227, 25.57607650756836, 26.86184310913086, 28.147611618041992, 29.433380126953125, 30.719146728515625, 32.004913330078125, 33.29068374633789, 34.57645034790039, 35.862220764160156, 37.147987365722656, 38.433753967285156, 39.71952438354492, 41.00529098510742, 42.29106140136719, 43.57682800292969]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 10.0, 22.0, 20.0, 20.0, 22.0, 32.0, 36.0, 34.0, 49.0, 44.0, 35.0, 39.0, 43.0, 53.0, 59.0, 57.0, 39.0, 54.0, 48.0, 45.0, 28.0, 37.0, 29.0, 17.0, 31.0, 16.0, 18.0, 10.0, 10.0, 11.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.0434684753418, -41.76372528076172, -40.48398208618164, -39.20423889160156, -37.924495697021484, -36.644752502441406, -35.36500930786133, -34.08526611328125, -32.80552673339844, -31.52578353881836, -30.24604034423828, -28.966297149658203, -27.686553955078125, -26.406810760498047, -25.1270694732666, -23.847326278686523, -22.567581176757812, -21.287837982177734, -20.008094787597656, -18.728351593017578, -17.4486083984375, -16.168865203857422, -14.889123916625977, -13.609380722045898, -12.32963752746582, -11.049894332885742, -9.770151138305664, -8.490408897399902, -7.210665702819824, -5.930922508239746, -4.651179790496826, -3.3714370727539062, -2.0916976928710938, -0.8119547367095947, 0.4677882194519043, 1.7475311756134033, 3.0272741317749023, 4.3070173263549805, 5.5867600440979, 6.86650276184082, 8.146245956420898, 9.425989151000977, 10.705732345581055, 11.985474586486816, 13.265217781066895, 14.544960975646973, 15.824703216552734, 17.104446411132812, 18.38418960571289, 19.66393280029297, 20.943675994873047, 22.223419189453125, 23.503162384033203, 24.78290557861328, 26.062646865844727, 27.342390060424805, 28.622133255004883, 29.90187644958496, 31.18161964416504, 32.461360931396484, 33.74110412597656, 35.02084732055664, 36.30059051513672, 37.5803337097168, 38.860076904296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 11.0, 29.0, 51.0, 109.0, 180.0, 488.0, 1609.0, 13578.0, 4074731.0, 97839.0, 4040.0, 882.0, 350.0, 165.0, 87.0, 54.0, 22.0, 20.0, 9.0, 11.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.455078125, -17.73828125, -17.021484375, -16.3046875, -15.587890625, -14.87109375, -14.154296875, -13.4375, -12.720703125, -12.00390625, -11.287109375, -10.5703125, -9.853515625, -9.13671875, -8.419921875, -7.703125, -6.986328125, -6.26953125, -5.552734375, -4.8359375, -4.119140625, -3.40234375, -2.685546875, -1.96875, -1.251953125, -0.53515625, 0.181640625, 0.8984375, 1.615234375, 2.33203125, 3.048828125, 3.765625, 4.482421875, 5.19921875, 5.916015625, 6.6328125, 7.349609375, 8.06640625, 8.783203125, 9.5, 10.216796875, 10.93359375, 11.650390625, 12.3671875, 13.083984375, 13.80078125, 14.517578125, 15.234375, 15.951171875, 16.66796875, 17.384765625, 18.1015625, 18.818359375, 19.53515625, 20.251953125, 20.96875, 21.685546875, 22.40234375, 23.119140625, 23.8359375, 24.552734375, 25.26953125, 25.986328125, 26.703125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 9.0, 20.0, 45.0, 77.0, 78.0, 120.0, 135.0, 128.0, 124.0, 82.0, 70.0, 51.0, 26.0, 16.0, 11.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.365234375, -3.219940185546875, -3.07464599609375, -2.929351806640625, -2.7840576171875, -2.638763427734375, -2.49346923828125, -2.348175048828125, -2.202880859375, -2.057586669921875, -1.91229248046875, -1.766998291015625, -1.6217041015625, -1.476409912109375, -1.33111572265625, -1.185821533203125, -1.04052734375, -0.895233154296875, -0.74993896484375, -0.604644775390625, -0.4593505859375, -0.314056396484375, -0.16876220703125, -0.023468017578125, 0.121826171875, 0.267120361328125, 0.41241455078125, 0.557708740234375, 0.7030029296875, 0.848297119140625, 0.99359130859375, 1.138885498046875, 1.2841796875, 1.429473876953125, 1.57476806640625, 1.720062255859375, 1.8653564453125, 2.010650634765625, 2.15594482421875, 2.301239013671875, 2.446533203125, 2.591827392578125, 2.73712158203125, 2.882415771484375, 3.0277099609375, 3.173004150390625, 3.31829833984375, 3.463592529296875, 3.60888671875, 3.754180908203125, 3.89947509765625, 4.044769287109375, 4.1900634765625, 4.335357666015625, 4.48065185546875, 4.625946044921875, 4.771240234375, 4.916534423828125, 5.06182861328125, 5.207122802734375, 5.3524169921875, 5.497711181640625, 5.64300537109375, 5.788299560546875, 5.93359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 5.0, 10.0, 11.0, 18.0, 15.0, 44.0, 40.0, 42.0, 80.0, 95.0, 133.0, 231.0, 389.0, 857.0, 2441.0, 10169.0, 85270.0, 3954745.0, 122852.0, 12324.0, 2644.0, 881.0, 392.0, 195.0, 115.0, 71.0, 49.0, 38.0, 34.0, 18.0, 11.0, 15.0, 16.0, 3.0, 5.0, 9.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.24072265625, -10.8955078125, -10.55029296875, -10.205078125, -9.85986328125, -9.5146484375, -9.16943359375, -8.82421875, -8.47900390625, -8.1337890625, -7.78857421875, -7.443359375, -7.09814453125, -6.7529296875, -6.40771484375, -6.0625, -5.71728515625, -5.3720703125, -5.02685546875, -4.681640625, -4.33642578125, -3.9912109375, -3.64599609375, -3.30078125, -2.95556640625, -2.6103515625, -2.26513671875, -1.919921875, -1.57470703125, -1.2294921875, -0.88427734375, -0.5390625, -0.19384765625, 0.1513671875, 0.49658203125, 0.841796875, 1.18701171875, 1.5322265625, 1.87744140625, 2.22265625, 2.56787109375, 2.9130859375, 3.25830078125, 3.603515625, 3.94873046875, 4.2939453125, 4.63916015625, 4.984375, 5.32958984375, 5.6748046875, 6.02001953125, 6.365234375, 6.71044921875, 7.0556640625, 7.40087890625, 7.74609375, 8.09130859375, 8.4365234375, 8.78173828125, 9.126953125, 9.47216796875, 9.8173828125, 10.16259765625, 10.5078125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 10.0, 2.0, 5.0, 11.0, 17.0, 19.0, 32.0, 54.0, 93.0, 257.0, 1048.0, 1963.0, 329.0, 118.0, 45.0, 26.0, 15.0, 11.0, 13.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.06640625, -4.9589691162109375, -4.851531982421875, -4.7440948486328125, -4.63665771484375, -4.5292205810546875, -4.421783447265625, -4.3143463134765625, -4.2069091796875, -4.0994720458984375, -3.992034912109375, -3.8845977783203125, -3.77716064453125, -3.6697235107421875, -3.562286376953125, -3.4548492431640625, -3.347412109375, -3.2399749755859375, -3.132537841796875, -3.0251007080078125, -2.91766357421875, -2.8102264404296875, -2.702789306640625, -2.5953521728515625, -2.4879150390625, -2.3804779052734375, -2.273040771484375, -2.1656036376953125, -2.05816650390625, -1.9507293701171875, -1.843292236328125, -1.7358551025390625, -1.62841796875, -1.5209808349609375, -1.413543701171875, -1.3061065673828125, -1.19866943359375, -1.0912322998046875, -0.983795166015625, -0.8763580322265625, -0.7689208984375, -0.6614837646484375, -0.554046630859375, -0.4466094970703125, -0.33917236328125, -0.2317352294921875, -0.124298095703125, -0.0168609619140625, 0.090576171875, 0.1980133056640625, 0.305450439453125, 0.4128875732421875, 0.52032470703125, 0.6277618408203125, 0.735198974609375, 0.8426361083984375, 0.9500732421875, 1.0575103759765625, 1.164947509765625, 1.2723846435546875, 1.37982177734375, 1.4872589111328125, 1.594696044921875, 1.7021331787109375, 1.8095703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 7.0, 13.0, 23.0, 42.0, 86.0, 157.0, 222.0, 182.0, 136.0, 77.0, 31.0, 13.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.342247009277344, -31.711666107177734, -31.081087112426758, -30.45050621032715, -29.81992530822754, -29.189346313476562, -28.558765411376953, -27.928184509277344, -27.297603607177734, -26.667022705078125, -26.03644371032715, -25.40586280822754, -24.77528190612793, -24.144702911376953, -23.514122009277344, -22.883541107177734, -22.252962112426758, -21.62238121032715, -20.991802215576172, -20.361221313476562, -19.730640411376953, -19.100059509277344, -18.469480514526367, -17.838899612426758, -17.20832061767578, -16.577739715576172, -15.947159767150879, -15.316579818725586, -14.685998916625977, -14.055418968200684, -13.42483901977539, -12.794258117675781, -12.163675308227539, -11.533095359802246, -10.902514457702637, -10.271934509277344, -9.641353607177734, -9.010773658752441, -8.380193710327148, -7.749613285064697, -7.119032859802246, -6.488452434539795, -5.857872009277344, -5.227292060852051, -4.5967116355896, -3.9661312103271484, -3.3355510234832764, -2.7049708366394043, -2.074390411376953, -1.4438101053237915, -0.8132297992706299, -0.18264949321746826, 0.44793081283569336, 1.0785112380981445, 1.7090914249420166, 2.3396716117858887, 2.97025203704834, 3.600832462310791, 4.231412887573242, 4.861992835998535, 5.492573261260986, 6.1231536865234375, 6.7537336349487305, 7.384314060211182, 8.014894485473633]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 12.0, 11.0, 25.0, 27.0, 41.0, 42.0, 54.0, 59.0, 84.0, 61.0, 63.0, 80.0, 68.0, 76.0, 60.0, 50.0, 48.0, 33.0, 22.0, 25.0, 21.0, 11.0, 9.0, 7.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.256521224975586, -16.842187881469727, -16.427854537963867, -16.013521194458008, -15.599188804626465, -15.184855461120605, -14.770522117614746, -14.356189727783203, -13.941856384277344, -13.527523040771484, -13.113189697265625, -12.698857307434082, -12.284523963928223, -11.870190620422363, -11.455857276916504, -11.041524887084961, -10.627191543579102, -10.212858200073242, -9.798524856567383, -9.38419246673584, -8.96985912322998, -8.555525779724121, -8.141192436218262, -7.7268595695495605, -7.312525749206543, -6.898192405700684, -6.483859539031982, -6.069526195526123, -5.655193328857422, -5.2408599853515625, -4.826526641845703, -4.412193775177002, -3.997860908508301, -3.5835278034210205, -3.1691946983337402, -2.754861354827881, -2.3405284881591797, -1.9261951446533203, -1.51186203956604, -1.0975289344787598, -0.6831958293914795, -0.26886269450187683, 0.14547044038772583, 0.5598036050796509, 0.9741367101669312, 1.388469934463501, 1.8028030395507812, 2.2171361446380615, 2.631469249725342, 3.045802354812622, 3.4601354598999023, 3.8744688034057617, 4.288801670074463, 4.703135013580322, 5.117467880249023, 5.531801223754883, 5.946134567260742, 6.360467910766602, 6.774800777435303, 7.189134120941162, 7.603466987609863, 8.017800331115723, 8.432133674621582, 8.846466064453125, 9.260799407958984]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 6.0, 4.0, 20.0, 13.0, 19.0, 27.0, 22.0, 42.0, 51.0, 62.0, 103.0, 174.0, 232.0, 369.0, 655.0, 1457.0, 4292.0, 18348.0, 115597.0, 634862.0, 229895.0, 31545.0, 6590.0, 2005.0, 866.0, 416.0, 278.0, 179.0, 114.0, 85.0, 49.0, 47.0, 29.0, 24.0, 14.0, 19.0, 9.0, 5.0, 6.0, 9.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.3203125, -10.9627685546875, -10.605224609375, -10.2476806640625, -9.89013671875, -9.5325927734375, -9.175048828125, -8.8175048828125, -8.4599609375, -8.1024169921875, -7.744873046875, -7.3873291015625, -7.02978515625, -6.6722412109375, -6.314697265625, -5.9571533203125, -5.599609375, -5.2420654296875, -4.884521484375, -4.5269775390625, -4.16943359375, -3.8118896484375, -3.454345703125, -3.0968017578125, -2.7392578125, -2.3817138671875, -2.024169921875, -1.6666259765625, -1.30908203125, -0.9515380859375, -0.593994140625, -0.2364501953125, 0.12109375, 0.4786376953125, 0.836181640625, 1.1937255859375, 1.55126953125, 1.9088134765625, 2.266357421875, 2.6239013671875, 2.9814453125, 3.3389892578125, 3.696533203125, 4.0540771484375, 4.41162109375, 4.7691650390625, 5.126708984375, 5.4842529296875, 5.841796875, 6.1993408203125, 6.556884765625, 6.9144287109375, 7.27197265625, 7.6295166015625, 7.987060546875, 8.3446044921875, 8.7021484375, 9.0596923828125, 9.417236328125, 9.7747802734375, 10.13232421875, 10.4898681640625, 10.847412109375, 11.2049560546875, 11.5625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 17.0, 40.0, 61.0, 88.0, 130.0, 158.0, 138.0, 121.0, 90.0, 56.0, 47.0, 26.0, 17.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.276336669921875, -3.12103271484375, -2.965728759765625, -2.8104248046875, -2.655120849609375, -2.49981689453125, -2.344512939453125, -2.189208984375, -2.033905029296875, -1.87860107421875, -1.723297119140625, -1.5679931640625, -1.412689208984375, -1.25738525390625, -1.102081298828125, -0.94677734375, -0.791473388671875, -0.63616943359375, -0.480865478515625, -0.3255615234375, -0.170257568359375, -0.01495361328125, 0.140350341796875, 0.295654296875, 0.450958251953125, 0.60626220703125, 0.761566162109375, 0.9168701171875, 1.072174072265625, 1.22747802734375, 1.382781982421875, 1.5380859375, 1.693389892578125, 1.84869384765625, 2.003997802734375, 2.1593017578125, 2.314605712890625, 2.46990966796875, 2.625213623046875, 2.780517578125, 2.935821533203125, 3.09112548828125, 3.246429443359375, 3.4017333984375, 3.557037353515625, 3.71234130859375, 3.867645263671875, 4.02294921875, 4.178253173828125, 4.33355712890625, 4.488861083984375, 4.6441650390625, 4.799468994140625, 4.95477294921875, 5.110076904296875, 5.265380859375, 5.420684814453125, 5.57598876953125, 5.731292724609375, 5.8865966796875, 6.041900634765625, 6.19720458984375, 6.352508544921875, 6.5078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 2.0, 4.0, 6.0, 7.0, 17.0, 17.0, 23.0, 45.0, 46.0, 66.0, 86.0, 143.0, 200.0, 280.0, 442.0, 717.0, 1115.0, 1893.0, 3290.0, 6071.0, 11856.0, 25737.0, 60596.0, 155753.0, 332106.0, 261168.0, 105737.0, 42208.0, 18545.0, 8990.0, 4674.0, 2563.0, 1425.0, 927.0, 556.0, 367.0, 279.0, 168.0, 114.0, 76.0, 70.0, 47.0, 35.0, 24.0, 24.0, 15.0, 10.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.47265625, -4.3441162109375, -4.215576171875, -4.0870361328125, -3.95849609375, -3.8299560546875, -3.701416015625, -3.5728759765625, -3.4443359375, -3.3157958984375, -3.187255859375, -3.0587158203125, -2.93017578125, -2.8016357421875, -2.673095703125, -2.5445556640625, -2.416015625, -2.2874755859375, -2.158935546875, -2.0303955078125, -1.90185546875, -1.7733154296875, -1.644775390625, -1.5162353515625, -1.3876953125, -1.2591552734375, -1.130615234375, -1.0020751953125, -0.87353515625, -0.7449951171875, -0.616455078125, -0.4879150390625, -0.359375, -0.2308349609375, -0.102294921875, 0.0262451171875, 0.15478515625, 0.2833251953125, 0.411865234375, 0.5404052734375, 0.6689453125, 0.7974853515625, 0.926025390625, 1.0545654296875, 1.18310546875, 1.3116455078125, 1.440185546875, 1.5687255859375, 1.697265625, 1.8258056640625, 1.954345703125, 2.0828857421875, 2.21142578125, 2.3399658203125, 2.468505859375, 2.5970458984375, 2.7255859375, 2.8541259765625, 2.982666015625, 3.1112060546875, 3.23974609375, 3.3682861328125, 3.496826171875, 3.6253662109375, 3.75390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 13.0, 13.0, 14.0, 22.0, 23.0, 28.0, 29.0, 34.0, 28.0, 37.0, 36.0, 34.0, 33.0, 43.0, 43.0, 47.0, 46.0, 39.0, 48.0, 46.0, 30.0, 50.0, 32.0, 36.0, 24.0, 23.0, 17.0, 15.0, 14.0, 7.0, 18.0, 19.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-7.19140625, -6.97174072265625, -6.7520751953125, -6.53240966796875, -6.312744140625, -6.09307861328125, -5.8734130859375, -5.65374755859375, -5.43408203125, -5.21441650390625, -4.9947509765625, -4.77508544921875, -4.555419921875, -4.33575439453125, -4.1160888671875, -3.89642333984375, -3.6767578125, -3.45709228515625, -3.2374267578125, -3.01776123046875, -2.798095703125, -2.57843017578125, -2.3587646484375, -2.13909912109375, -1.91943359375, -1.69976806640625, -1.4801025390625, -1.26043701171875, -1.040771484375, -0.82110595703125, -0.6014404296875, -0.38177490234375, -0.162109375, 0.05755615234375, 0.2772216796875, 0.49688720703125, 0.716552734375, 0.93621826171875, 1.1558837890625, 1.37554931640625, 1.59521484375, 1.81488037109375, 2.0345458984375, 2.25421142578125, 2.473876953125, 2.69354248046875, 2.9132080078125, 3.13287353515625, 3.3525390625, 3.57220458984375, 3.7918701171875, 4.01153564453125, 4.231201171875, 4.45086669921875, 4.6705322265625, 4.89019775390625, 5.10986328125, 5.32952880859375, 5.5491943359375, 5.76885986328125, 5.988525390625, 6.20819091796875, 6.4278564453125, 6.64752197265625, 6.8671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 17.0, 24.0, 34.0, 54.0, 131.0, 207.0, 444.0, 962.0, 2418.0, 7353.0, 30529.0, 212532.0, 677494.0, 91678.0, 16917.0, 4689.0, 1663.0, 670.0, 350.0, 150.0, 100.0, 44.0, 23.0, 17.0, 13.0, 9.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.359375, -4.20538330078125, -4.0513916015625, -3.89739990234375, -3.743408203125, -3.58941650390625, -3.4354248046875, -3.28143310546875, -3.12744140625, -2.97344970703125, -2.8194580078125, -2.66546630859375, -2.511474609375, -2.35748291015625, -2.2034912109375, -2.04949951171875, -1.8955078125, -1.74151611328125, -1.5875244140625, -1.43353271484375, -1.279541015625, -1.12554931640625, -0.9715576171875, -0.81756591796875, -0.66357421875, -0.50958251953125, -0.3555908203125, -0.20159912109375, -0.047607421875, 0.10638427734375, 0.2603759765625, 0.41436767578125, 0.568359375, 0.72235107421875, 0.8763427734375, 1.03033447265625, 1.184326171875, 1.33831787109375, 1.4923095703125, 1.64630126953125, 1.80029296875, 1.95428466796875, 2.1082763671875, 2.26226806640625, 2.416259765625, 2.57025146484375, 2.7242431640625, 2.87823486328125, 3.0322265625, 3.18621826171875, 3.3402099609375, 3.49420166015625, 3.648193359375, 3.80218505859375, 3.9561767578125, 4.11016845703125, 4.26416015625, 4.41815185546875, 4.5721435546875, 4.72613525390625, 4.880126953125, 5.03411865234375, 5.1881103515625, 5.34210205078125, 5.49609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 10.0, 15.0, 16.0, 14.0, 33.0, 38.0, 54.0, 67.0, 101.0, 173.0, 133.0, 99.0, 62.0, 52.0, 22.0, 26.0, 19.0, 15.0, 8.0, 6.0, 5.0, 4.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007023811340332031, -0.0006795227527618408, -0.0006566643714904785, -0.0006338059902191162, -0.0006109476089477539, -0.0005880892276763916, -0.0005652308464050293, -0.000542372465133667, -0.0005195140838623047, -0.0004966557025909424, -0.0004737973213195801, -0.0004509389400482178, -0.00042808055877685547, -0.00040522217750549316, -0.00038236379623413086, -0.00035950541496276855, -0.00033664703369140625, -0.00031378865242004395, -0.00029093027114868164, -0.00026807188987731934, -0.00024521350860595703, -0.00022235512733459473, -0.00019949674606323242, -0.00017663836479187012, -0.0001537799835205078, -0.0001309216022491455, -0.0001080632209777832, -8.52048397064209e-05, -6.23464584350586e-05, -3.948807716369629e-05, -1.6629695892333984e-05, 6.22868537902832e-06, 2.9087066650390625e-05, 5.194544792175293e-05, 7.480382919311523e-05, 9.766221046447754e-05, 0.00012052059173583984, 0.00014337897300720215, 0.00016623735427856445, 0.00018909573554992676, 0.00021195411682128906, 0.00023481249809265137, 0.00025767087936401367, 0.000280529260635376, 0.0003033876419067383, 0.0003262460231781006, 0.0003491044044494629, 0.0003719627857208252, 0.0003948211669921875, 0.0004176795482635498, 0.0004405379295349121, 0.0004633963108062744, 0.0004862546920776367, 0.000509113073348999, 0.0005319714546203613, 0.0005548298358917236, 0.0005776882171630859, 0.0006005465984344482, 0.0006234049797058105, 0.0006462633609771729, 0.0006691217422485352, 0.0006919801235198975, 0.0007148385047912598, 0.0007376968860626221, 0.0007605552673339844]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 9.0, 25.0, 35.0, 57.0, 143.0, 330.0, 882.0, 2776.0, 12634.0, 89078.0, 809033.0, 113807.0, 15031.0, 3215.0, 868.0, 334.0, 138.0, 72.0, 47.0, 23.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.898681640625, -8.64111328125, -8.383544921875, -8.1259765625, -7.868408203125, -7.61083984375, -7.353271484375, -7.095703125, -6.838134765625, -6.58056640625, -6.322998046875, -6.0654296875, -5.807861328125, -5.55029296875, -5.292724609375, -5.03515625, -4.777587890625, -4.52001953125, -4.262451171875, -4.0048828125, -3.747314453125, -3.48974609375, -3.232177734375, -2.974609375, -2.717041015625, -2.45947265625, -2.201904296875, -1.9443359375, -1.686767578125, -1.42919921875, -1.171630859375, -0.9140625, -0.656494140625, -0.39892578125, -0.141357421875, 0.1162109375, 0.373779296875, 0.63134765625, 0.888916015625, 1.146484375, 1.404052734375, 1.66162109375, 1.919189453125, 2.1767578125, 2.434326171875, 2.69189453125, 2.949462890625, 3.20703125, 3.464599609375, 3.72216796875, 3.979736328125, 4.2373046875, 4.494873046875, 4.75244140625, 5.010009765625, 5.267578125, 5.525146484375, 5.78271484375, 6.040283203125, 6.2978515625, 6.555419921875, 6.81298828125, 7.070556640625, 7.328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 9.0, 7.0, 11.0, 11.0, 9.0, 11.0, 22.0, 27.0, 27.0, 36.0, 54.0, 75.0, 97.0, 109.0, 97.0, 73.0, 66.0, 42.0, 36.0, 29.0, 28.0, 17.0, 17.0, 8.0, 10.0, 11.0, 6.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.94140625, -3.83074951171875, -3.7200927734375, -3.60943603515625, -3.498779296875, -3.38812255859375, -3.2774658203125, -3.16680908203125, -3.05615234375, -2.94549560546875, -2.8348388671875, -2.72418212890625, -2.613525390625, -2.50286865234375, -2.3922119140625, -2.28155517578125, -2.1708984375, -2.06024169921875, -1.9495849609375, -1.83892822265625, -1.728271484375, -1.61761474609375, -1.5069580078125, -1.39630126953125, -1.28564453125, -1.17498779296875, -1.0643310546875, -0.95367431640625, -0.843017578125, -0.73236083984375, -0.6217041015625, -0.51104736328125, -0.400390625, -0.28973388671875, -0.1790771484375, -0.06842041015625, 0.042236328125, 0.15289306640625, 0.2635498046875, 0.37420654296875, 0.48486328125, 0.59552001953125, 0.7061767578125, 0.81683349609375, 0.927490234375, 1.03814697265625, 1.1488037109375, 1.25946044921875, 1.3701171875, 1.48077392578125, 1.5914306640625, 1.70208740234375, 1.812744140625, 1.92340087890625, 2.0340576171875, 2.14471435546875, 2.25537109375, 2.36602783203125, 2.4766845703125, 2.58734130859375, 2.697998046875, 2.80865478515625, 2.9193115234375, 3.02996826171875, 3.140625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 11.0, 7.0, 34.0, 65.0, 152.0, 305.0, 238.0, 124.0, 39.0, 10.0, 11.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.027982711791992, -25.73267936706543, -22.437376022338867, -19.142072677612305, -15.846769332885742, -12.55146598815918, -9.256162643432617, -5.960859298706055, -2.665555953979492, 0.6297473907470703, 3.925050735473633, 7.220354080200195, 10.515657424926758, 13.81096076965332, 17.106264114379883, 20.401567459106445, 23.696870803833008, 26.99217414855957, 30.287477493286133, 33.58277893066406, 36.878082275390625, 40.17338562011719, 43.46868896484375, 46.76399230957031, 50.059295654296875, 53.35459899902344, 56.64990234375, 59.94520568847656, 63.240509033203125, 66.53581237792969, 69.83111572265625, 73.12641906738281, 76.42172241210938, 79.71702575683594, 83.0123291015625, 86.30763244628906, 89.60293579101562, 92.89823913574219, 96.19354248046875, 99.48884582519531, 102.78414916992188, 106.07945251464844, 109.374755859375, 112.67005920410156, 115.96536254882812, 119.26066589355469, 122.55596923828125, 125.85127258300781, 129.14657592773438, 132.44187927246094, 135.7371826171875, 139.03248596191406, 142.32778930664062, 145.6230926513672, 148.91839599609375, 152.2136993408203, 155.50900268554688, 158.80430603027344, 162.099609375, 165.39491271972656, 168.69021606445312, 171.9855194091797, 175.28082275390625, 178.5761260986328, 181.87142944335938]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 8.0, 2.0, 5.0, 5.0, 11.0, 11.0, 15.0, 16.0, 26.0, 29.0, 28.0, 26.0, 24.0, 36.0, 49.0, 33.0, 29.0, 45.0, 23.0, 43.0, 45.0, 45.0, 44.0, 40.0, 46.0, 40.0, 44.0, 35.0, 29.0, 25.0, 20.0, 26.0, 22.0, 11.0, 8.0, 15.0, 12.0, 7.0, 5.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.568180084228516, -46.148834228515625, -44.7294921875, -43.31014633178711, -41.89080047607422, -40.471458435058594, -39.0521125793457, -37.63276672363281, -36.21342468261719, -34.7940788269043, -33.37473678588867, -31.95539093017578, -30.53604507446289, -29.116701126098633, -27.697357177734375, -26.278011322021484, -24.858665466308594, -23.439321517944336, -22.019975662231445, -20.600631713867188, -19.181285858154297, -17.76194190979004, -16.34259796142578, -14.923253059387207, -13.503908157348633, -12.084563255310059, -10.665218353271484, -9.245874404907227, -7.826529502868652, -6.407184600830078, -4.98784065246582, -3.568495750427246, -2.1491546630859375, -0.7298099994659424, 0.6895346641540527, 2.1088790893554688, 3.528223991394043, 4.947568893432617, 6.366912841796875, 7.786257743835449, 9.205602645874023, 10.624947547912598, 12.044292449951172, 13.46363639831543, 14.882981300354004, 16.302326202392578, 17.721670150756836, 19.141014099121094, 20.560359954833984, 21.979703903198242, 23.399049758911133, 24.81839370727539, 26.23773956298828, 27.65708351135254, 29.076427459716797, 30.495773315429688, 31.915117263793945, 33.3344612121582, 34.753807067871094, 36.17314910888672, 37.59249496459961, 39.0118408203125, 40.431182861328125, 41.850528717041016, 43.269874572753906]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 18.0, 24.0, 37.0, 73.0, 140.0, 259.0, 637.0, 1571.0, 6282.0, 63350.0, 4059626.0, 53741.0, 5777.0, 1499.0, 599.0, 277.0, 137.0, 70.0, 53.0, 31.0, 19.0, 7.0, 6.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.171875, -14.552001953125, -13.93212890625, -13.312255859375, -12.6923828125, -12.072509765625, -11.45263671875, -10.832763671875, -10.212890625, -9.593017578125, -8.97314453125, -8.353271484375, -7.7333984375, -7.113525390625, -6.49365234375, -5.873779296875, -5.25390625, -4.634033203125, -4.01416015625, -3.394287109375, -2.7744140625, -2.154541015625, -1.53466796875, -0.914794921875, -0.294921875, 0.324951171875, 0.94482421875, 1.564697265625, 2.1845703125, 2.804443359375, 3.42431640625, 4.044189453125, 4.6640625, 5.283935546875, 5.90380859375, 6.523681640625, 7.1435546875, 7.763427734375, 8.38330078125, 9.003173828125, 9.623046875, 10.242919921875, 10.86279296875, 11.482666015625, 12.1025390625, 12.722412109375, 13.34228515625, 13.962158203125, 14.58203125, 15.201904296875, 15.82177734375, 16.441650390625, 17.0615234375, 17.681396484375, 18.30126953125, 18.921142578125, 19.541015625, 20.160888671875, 20.78076171875, 21.400634765625, 22.0205078125, 22.640380859375, 23.26025390625, 23.880126953125, 24.5]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 16.0, 26.0, 43.0, 61.0, 78.0, 95.0, 87.0, 136.0, 106.0, 99.0, 71.0, 63.0, 46.0, 35.0, 15.0, 14.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.42938232421875, -3.2845458984375, -3.13970947265625, -2.994873046875, -2.85003662109375, -2.7052001953125, -2.56036376953125, -2.41552734375, -2.27069091796875, -2.1258544921875, -1.98101806640625, -1.836181640625, -1.69134521484375, -1.5465087890625, -1.40167236328125, -1.2568359375, -1.11199951171875, -0.9671630859375, -0.82232666015625, -0.677490234375, -0.53265380859375, -0.3878173828125, -0.24298095703125, -0.09814453125, 0.04669189453125, 0.1915283203125, 0.33636474609375, 0.481201171875, 0.62603759765625, 0.7708740234375, 0.91571044921875, 1.060546875, 1.20538330078125, 1.3502197265625, 1.49505615234375, 1.639892578125, 1.78472900390625, 1.9295654296875, 2.07440185546875, 2.21923828125, 2.36407470703125, 2.5089111328125, 2.65374755859375, 2.798583984375, 2.94342041015625, 3.0882568359375, 3.23309326171875, 3.3779296875, 3.52276611328125, 3.6676025390625, 3.81243896484375, 3.957275390625, 4.10211181640625, 4.2469482421875, 4.39178466796875, 4.53662109375, 4.68145751953125, 4.8262939453125, 4.97113037109375, 5.115966796875, 5.26080322265625, 5.4056396484375, 5.55047607421875, 5.6953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 4.0, 10.0, 18.0, 14.0, 23.0, 35.0, 32.0, 60.0, 68.0, 117.0, 191.0, 264.0, 393.0, 673.0, 993.0, 1782.0, 3513.0, 7524.0, 18235.0, 59194.0, 555267.0, 3361143.0, 133503.0, 29582.0, 10987.0, 4828.0, 2404.0, 1296.0, 726.0, 464.0, 297.0, 192.0, 120.0, 86.0, 51.0, 43.0, 46.0, 23.0, 28.0, 15.0, 10.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.30078125, -7.08111572265625, -6.8614501953125, -6.64178466796875, -6.422119140625, -6.20245361328125, -5.9827880859375, -5.76312255859375, -5.54345703125, -5.32379150390625, -5.1041259765625, -4.88446044921875, -4.664794921875, -4.44512939453125, -4.2254638671875, -4.00579833984375, -3.7861328125, -3.56646728515625, -3.3468017578125, -3.12713623046875, -2.907470703125, -2.68780517578125, -2.4681396484375, -2.24847412109375, -2.02880859375, -1.80914306640625, -1.5894775390625, -1.36981201171875, -1.150146484375, -0.93048095703125, -0.7108154296875, -0.49114990234375, -0.271484375, -0.05181884765625, 0.1678466796875, 0.38751220703125, 0.607177734375, 0.82684326171875, 1.0465087890625, 1.26617431640625, 1.48583984375, 1.70550537109375, 1.9251708984375, 2.14483642578125, 2.364501953125, 2.58416748046875, 2.8038330078125, 3.02349853515625, 3.2431640625, 3.46282958984375, 3.6824951171875, 3.90216064453125, 4.121826171875, 4.34149169921875, 4.5611572265625, 4.78082275390625, 5.00048828125, 5.22015380859375, 5.4398193359375, 5.65948486328125, 5.879150390625, 6.09881591796875, 6.3184814453125, 6.53814697265625, 6.7578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 8.0, 14.0, 18.0, 12.0, 29.0, 42.0, 80.0, 160.0, 356.0, 1779.0, 982.0, 263.0, 118.0, 64.0, 41.0, 22.0, 10.0, 15.0, 9.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5, -4.3670654296875, -4.234130859375, -4.1011962890625, -3.96826171875, -3.8353271484375, -3.702392578125, -3.5694580078125, -3.4365234375, -3.3035888671875, -3.170654296875, -3.0377197265625, -2.90478515625, -2.7718505859375, -2.638916015625, -2.5059814453125, -2.373046875, -2.2401123046875, -2.107177734375, -1.9742431640625, -1.84130859375, -1.7083740234375, -1.575439453125, -1.4425048828125, -1.3095703125, -1.1766357421875, -1.043701171875, -0.9107666015625, -0.77783203125, -0.6448974609375, -0.511962890625, -0.3790283203125, -0.24609375, -0.1131591796875, 0.019775390625, 0.1527099609375, 0.28564453125, 0.4185791015625, 0.551513671875, 0.6844482421875, 0.8173828125, 0.9503173828125, 1.083251953125, 1.2161865234375, 1.34912109375, 1.4820556640625, 1.614990234375, 1.7479248046875, 1.880859375, 2.0137939453125, 2.146728515625, 2.2796630859375, 2.41259765625, 2.5455322265625, 2.678466796875, 2.8114013671875, 2.9443359375, 3.0772705078125, 3.210205078125, 3.3431396484375, 3.47607421875, 3.6090087890625, 3.741943359375, 3.8748779296875, 4.0078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 10.0, 15.0, 25.0, 53.0, 136.0, 205.0, 201.0, 156.0, 100.0, 39.0, 28.0, 15.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-50.06025695800781, -49.08889389038086, -48.117530822753906, -47.14617156982422, -46.174808502197266, -45.20344543457031, -44.23208236694336, -43.260719299316406, -42.28935623168945, -41.3179931640625, -40.34663009643555, -39.375267028808594, -38.403907775878906, -37.43254470825195, -36.461181640625, -35.48981857299805, -34.518455505371094, -33.54709243774414, -32.57572937011719, -31.604368209838867, -30.633005142211914, -29.661643981933594, -28.69028091430664, -27.718917846679688, -26.74755859375, -25.776195526123047, -24.804834365844727, -23.833471298217773, -22.86210823059082, -21.8907470703125, -20.919384002685547, -19.948020935058594, -18.976659774780273, -18.00529670715332, -17.033935546875, -16.062572479248047, -15.091209411621094, -14.119847297668457, -13.14848518371582, -12.177122116088867, -11.20576000213623, -10.234397888183594, -9.26303482055664, -8.291672706604004, -7.320310115814209, -6.348947525024414, -5.377585411071777, -4.406222820281982, -3.4348602294921875, -2.4634976387023926, -1.4921352863311768, -0.5207729339599609, 0.450589656829834, 1.421952247619629, 2.3933143615722656, 3.3646769523620605, 4.3360395431518555, 5.30740213394165, 6.278764724731445, 7.250126838684082, 8.221488952636719, 9.192852020263672, 10.164214134216309, 11.135576248168945, 12.106939315795898]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 8.0, 12.0, 12.0, 23.0, 25.0, 32.0, 28.0, 27.0, 47.0, 46.0, 55.0, 58.0, 61.0, 53.0, 49.0, 55.0, 52.0, 61.0, 58.0, 37.0, 36.0, 27.0, 31.0, 28.0, 15.0, 4.0, 15.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.609703063964844, -16.133255004882812, -15.656805992126465, -15.180356979370117, -14.70390796661377, -14.227458953857422, -13.75101089477539, -13.274561882019043, -12.798112869262695, -12.321663856506348, -11.845215797424316, -11.368766784667969, -10.892317771911621, -10.415868759155273, -9.939420700073242, -9.462971687316895, -8.986523628234863, -8.510074615478516, -8.033626556396484, -7.557177543640137, -7.080728530883789, -6.6042799949646, -6.12783145904541, -5.6513824462890625, -5.174933910369873, -4.698485374450684, -4.222036361694336, -3.7455878257751465, -3.269139051437378, -2.7926902770996094, -2.31624174118042, -1.8397929668426514, -1.3633451461791992, -0.8868964314460754, -0.41044771671295166, 0.06600093841552734, 0.5424497127532959, 1.0188984870910645, 1.495347023010254, 1.9717957973480225, 2.448244571685791, 2.9246933460235596, 3.401142120361328, 3.8775906562805176, 4.354039192199707, 4.830488204956055, 5.306936740875244, 5.783385276794434, 6.259834289550781, 6.736282825469971, 7.212731838226318, 7.689180374145508, 8.165629386901855, 8.642078399658203, 9.118526458740234, 9.594975471496582, 10.07142448425293, 10.547873497009277, 11.024321556091309, 11.500770568847656, 11.977219581604004, 12.453668594360352, 12.930116653442383, 13.40656566619873, 13.883013725280762]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 14.0, 13.0, 12.0, 22.0, 37.0, 45.0, 92.0, 162.0, 272.0, 556.0, 1184.0, 3425.0, 11777.0, 55651.0, 474238.0, 432769.0, 51642.0, 10939.0, 3298.0, 1216.0, 521.0, 252.0, 167.0, 81.0, 47.0, 36.0, 30.0, 22.0, 5.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.859375, -11.488525390625, -11.11767578125, -10.746826171875, -10.3759765625, -10.005126953125, -9.63427734375, -9.263427734375, -8.892578125, -8.521728515625, -8.15087890625, -7.780029296875, -7.4091796875, -7.038330078125, -6.66748046875, -6.296630859375, -5.92578125, -5.554931640625, -5.18408203125, -4.813232421875, -4.4423828125, -4.071533203125, -3.70068359375, -3.329833984375, -2.958984375, -2.588134765625, -2.21728515625, -1.846435546875, -1.4755859375, -1.104736328125, -0.73388671875, -0.363037109375, 0.0078125, 0.378662109375, 0.74951171875, 1.120361328125, 1.4912109375, 1.862060546875, 2.23291015625, 2.603759765625, 2.974609375, 3.345458984375, 3.71630859375, 4.087158203125, 4.4580078125, 4.828857421875, 5.19970703125, 5.570556640625, 5.94140625, 6.312255859375, 6.68310546875, 7.053955078125, 7.4248046875, 7.795654296875, 8.16650390625, 8.537353515625, 8.908203125, 9.279052734375, 9.64990234375, 10.020751953125, 10.3916015625, 10.762451171875, 11.13330078125, 11.504150390625, 11.875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 9.0, 15.0, 23.0, 28.0, 56.0, 45.0, 78.0, 77.0, 104.0, 84.0, 103.0, 91.0, 72.0, 57.0, 40.0, 48.0, 26.0, 21.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.552734375, -3.428863525390625, -3.30499267578125, -3.181121826171875, -3.0572509765625, -2.933380126953125, -2.80950927734375, -2.685638427734375, -2.561767578125, -2.437896728515625, -2.31402587890625, -2.190155029296875, -2.0662841796875, -1.942413330078125, -1.81854248046875, -1.694671630859375, -1.57080078125, -1.446929931640625, -1.32305908203125, -1.199188232421875, -1.0753173828125, -0.951446533203125, -0.82757568359375, -0.703704833984375, -0.579833984375, -0.455963134765625, -0.33209228515625, -0.208221435546875, -0.0843505859375, 0.039520263671875, 0.16339111328125, 0.287261962890625, 0.4111328125, 0.535003662109375, 0.65887451171875, 0.782745361328125, 0.9066162109375, 1.030487060546875, 1.15435791015625, 1.278228759765625, 1.402099609375, 1.525970458984375, 1.64984130859375, 1.773712158203125, 1.8975830078125, 2.021453857421875, 2.14532470703125, 2.269195556640625, 2.39306640625, 2.516937255859375, 2.64080810546875, 2.764678955078125, 2.8885498046875, 3.012420654296875, 3.13629150390625, 3.260162353515625, 3.384033203125, 3.507904052734375, 3.63177490234375, 3.755645751953125, 3.8795166015625, 4.003387451171875, 4.12725830078125, 4.251129150390625, 4.375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 8.0, 8.0, 9.0, 10.0, 17.0, 31.0, 38.0, 45.0, 80.0, 93.0, 155.0, 222.0, 336.0, 483.0, 776.0, 1377.0, 2440.0, 4786.0, 10353.0, 27561.0, 91672.0, 408267.0, 371257.0, 83183.0, 25292.0, 9834.0, 4464.0, 2297.0, 1265.0, 743.0, 467.0, 310.0, 202.0, 141.0, 107.0, 73.0, 42.0, 26.0, 25.0, 18.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0], "bins": [-7.6015625, -7.39019775390625, -7.1788330078125, -6.96746826171875, -6.756103515625, -6.54473876953125, -6.3333740234375, -6.12200927734375, -5.91064453125, -5.69927978515625, -5.4879150390625, -5.27655029296875, -5.065185546875, -4.85382080078125, -4.6424560546875, -4.43109130859375, -4.2197265625, -4.00836181640625, -3.7969970703125, -3.58563232421875, -3.374267578125, -3.16290283203125, -2.9515380859375, -2.74017333984375, -2.52880859375, -2.31744384765625, -2.1060791015625, -1.89471435546875, -1.683349609375, -1.47198486328125, -1.2606201171875, -1.04925537109375, -0.837890625, -0.62652587890625, -0.4151611328125, -0.20379638671875, 0.007568359375, 0.21893310546875, 0.4302978515625, 0.64166259765625, 0.85302734375, 1.06439208984375, 1.2757568359375, 1.48712158203125, 1.698486328125, 1.90985107421875, 2.1212158203125, 2.33258056640625, 2.5439453125, 2.75531005859375, 2.9666748046875, 3.17803955078125, 3.389404296875, 3.60076904296875, 3.8121337890625, 4.02349853515625, 4.23486328125, 4.44622802734375, 4.6575927734375, 4.86895751953125, 5.080322265625, 5.29168701171875, 5.5030517578125, 5.71441650390625, 5.92578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 3.0, 5.0, 3.0, 9.0, 6.0, 16.0, 15.0, 18.0, 23.0, 40.0, 38.0, 50.0, 41.0, 52.0, 51.0, 60.0, 75.0, 60.0, 83.0, 54.0, 58.0, 51.0, 39.0, 28.0, 26.0, 23.0, 18.0, 14.0, 10.0, 11.0, 9.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.0, -12.6376953125, -12.275390625, -11.9130859375, -11.55078125, -11.1884765625, -10.826171875, -10.4638671875, -10.1015625, -9.7392578125, -9.376953125, -9.0146484375, -8.65234375, -8.2900390625, -7.927734375, -7.5654296875, -7.203125, -6.8408203125, -6.478515625, -6.1162109375, -5.75390625, -5.3916015625, -5.029296875, -4.6669921875, -4.3046875, -3.9423828125, -3.580078125, -3.2177734375, -2.85546875, -2.4931640625, -2.130859375, -1.7685546875, -1.40625, -1.0439453125, -0.681640625, -0.3193359375, 0.04296875, 0.4052734375, 0.767578125, 1.1298828125, 1.4921875, 1.8544921875, 2.216796875, 2.5791015625, 2.94140625, 3.3037109375, 3.666015625, 4.0283203125, 4.390625, 4.7529296875, 5.115234375, 5.4775390625, 5.83984375, 6.2021484375, 6.564453125, 6.9267578125, 7.2890625, 7.6513671875, 8.013671875, 8.3759765625, 8.73828125, 9.1005859375, 9.462890625, 9.8251953125, 10.1875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 5.0, 13.0, 12.0, 29.0, 47.0, 112.0, 281.0, 744.0, 3983.0, 46233.0, 969078.0, 24216.0, 2812.0, 591.0, 218.0, 76.0, 46.0, 18.0, 17.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.015625, -12.6580810546875, -12.300537109375, -11.9429931640625, -11.58544921875, -11.2279052734375, -10.870361328125, -10.5128173828125, -10.1552734375, -9.7977294921875, -9.440185546875, -9.0826416015625, -8.72509765625, -8.3675537109375, -8.010009765625, -7.6524658203125, -7.294921875, -6.9373779296875, -6.579833984375, -6.2222900390625, -5.86474609375, -5.5072021484375, -5.149658203125, -4.7921142578125, -4.4345703125, -4.0770263671875, -3.719482421875, -3.3619384765625, -3.00439453125, -2.6468505859375, -2.289306640625, -1.9317626953125, -1.57421875, -1.2166748046875, -0.859130859375, -0.5015869140625, -0.14404296875, 0.2135009765625, 0.571044921875, 0.9285888671875, 1.2861328125, 1.6436767578125, 2.001220703125, 2.3587646484375, 2.71630859375, 3.0738525390625, 3.431396484375, 3.7889404296875, 4.146484375, 4.5040283203125, 4.861572265625, 5.2191162109375, 5.57666015625, 5.9342041015625, 6.291748046875, 6.6492919921875, 7.0068359375, 7.3643798828125, 7.721923828125, 8.0794677734375, 8.43701171875, 8.7945556640625, 9.152099609375, 9.5096435546875, 9.8671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 5.0, 9.0, 9.0, 14.0, 17.0, 38.0, 70.0, 204.0, 321.0, 142.0, 59.0, 34.0, 28.0, 10.0, 11.0, 7.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011072158813476562, -0.0010767504572868347, -0.0010462850332260132, -0.0010158196091651917, -0.0009853541851043701, -0.0009548887610435486, -0.000924423336982727, -0.0008939579129219055, -0.000863492488861084, -0.0008330270648002625, -0.0008025616407394409, -0.0007720962166786194, -0.0007416307926177979, -0.0007111653685569763, -0.0006806999444961548, -0.0006502345204353333, -0.0006197690963745117, -0.0005893036723136902, -0.0005588382482528687, -0.0005283728241920471, -0.0004979074001312256, -0.00046744197607040405, -0.0004369765520095825, -0.000406511127948761, -0.00037604570388793945, -0.0003455802798271179, -0.0003151148557662964, -0.00028464943170547485, -0.0002541840076446533, -0.0002237185835838318, -0.00019325315952301025, -0.00016278773546218872, -0.0001323223114013672, -0.00010185688734054565, -7.139146327972412e-05, -4.092603921890259e-05, -1.0460615158081055e-05, 2.000480890274048e-05, 5.047023296356201e-05, 8.093565702438354e-05, 0.00011140108108520508, 0.0001418665051460266, 0.00017233192920684814, 0.00020279735326766968, 0.0002332627773284912, 0.00026372820138931274, 0.0002941936254501343, 0.0003246590495109558, 0.00035512447357177734, 0.0003855898976325989, 0.0004160553216934204, 0.00044652074575424194, 0.0004769861698150635, 0.000507451593875885, 0.0005379170179367065, 0.0005683824419975281, 0.0005988478660583496, 0.0006293132901191711, 0.0006597787141799927, 0.0006902441382408142, 0.0007207095623016357, 0.0007511749863624573, 0.0007816404104232788, 0.0008121058344841003, 0.0008425712585449219]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 14.0, 34.0, 44.0, 107.0, 182.0, 460.0, 1655.0, 8774.0, 168461.0, 847432.0, 17632.0, 2582.0, 664.0, 249.0, 116.0, 72.0, 32.0, 19.0, 8.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.615478515625, -14.19970703125, -13.783935546875, -13.3681640625, -12.952392578125, -12.53662109375, -12.120849609375, -11.705078125, -11.289306640625, -10.87353515625, -10.457763671875, -10.0419921875, -9.626220703125, -9.21044921875, -8.794677734375, -8.37890625, -7.963134765625, -7.54736328125, -7.131591796875, -6.7158203125, -6.300048828125, -5.88427734375, -5.468505859375, -5.052734375, -4.636962890625, -4.22119140625, -3.805419921875, -3.3896484375, -2.973876953125, -2.55810546875, -2.142333984375, -1.7265625, -1.310791015625, -0.89501953125, -0.479248046875, -0.0634765625, 0.352294921875, 0.76806640625, 1.183837890625, 1.599609375, 2.015380859375, 2.43115234375, 2.846923828125, 3.2626953125, 3.678466796875, 4.09423828125, 4.510009765625, 4.92578125, 5.341552734375, 5.75732421875, 6.173095703125, 6.5888671875, 7.004638671875, 7.42041015625, 7.836181640625, 8.251953125, 8.667724609375, 9.08349609375, 9.499267578125, 9.9150390625, 10.330810546875, 10.74658203125, 11.162353515625, 11.578125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 9.0, 20.0, 55.0, 138.0, 474.0, 177.0, 56.0, 39.0, 8.0, 14.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8203125, -13.408935546875, -12.99755859375, -12.586181640625, -12.1748046875, -11.763427734375, -11.35205078125, -10.940673828125, -10.529296875, -10.117919921875, -9.70654296875, -9.295166015625, -8.8837890625, -8.472412109375, -8.06103515625, -7.649658203125, -7.23828125, -6.826904296875, -6.41552734375, -6.004150390625, -5.5927734375, -5.181396484375, -4.77001953125, -4.358642578125, -3.947265625, -3.535888671875, -3.12451171875, -2.713134765625, -2.3017578125, -1.890380859375, -1.47900390625, -1.067626953125, -0.65625, -0.244873046875, 0.16650390625, 0.577880859375, 0.9892578125, 1.400634765625, 1.81201171875, 2.223388671875, 2.634765625, 3.046142578125, 3.45751953125, 3.868896484375, 4.2802734375, 4.691650390625, 5.10302734375, 5.514404296875, 5.92578125, 6.337158203125, 6.74853515625, 7.159912109375, 7.5712890625, 7.982666015625, 8.39404296875, 8.805419921875, 9.216796875, 9.628173828125, 10.03955078125, 10.450927734375, 10.8623046875, 11.273681640625, 11.68505859375, 12.096435546875, 12.5078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 15.0, 29.0, 75.0, 189.0, 325.0, 210.0, 92.0, 33.0, 13.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.35951232910156, -64.50629425048828, -60.653072357177734, -56.79985046386719, -52.946632385253906, -49.09341049194336, -45.24018859863281, -41.38697052001953, -37.53375244140625, -33.6805305480957, -29.827312469482422, -25.974090576171875, -22.120872497558594, -18.267650604248047, -14.414430618286133, -10.561210632324219, -6.707988739013672, -2.8547685146331787, 0.9984517097473145, 4.851672172546387, 8.7048921585083, 12.558113098144531, 16.411333084106445, 20.26455307006836, 24.117773056030273, 27.970993041992188, 31.8242130279541, 35.677433013916016, 39.53065490722656, 43.383872985839844, 47.23709487915039, 51.09031677246094, 54.94353485107422, 58.796756744384766, 62.64997482299805, 66.5031967163086, 70.35641479492188, 74.20964050292969, 78.06285858154297, 81.91607666015625, 85.76929473876953, 89.62251281738281, 93.47573852539062, 97.3289566040039, 101.18217468261719, 105.035400390625, 108.88861846923828, 112.74183654785156, 116.59506225585938, 120.44828033447266, 124.30150604248047, 128.15472412109375, 132.00794982910156, 135.8611602783203, 139.71438598632812, 143.56759643554688, 147.4208221435547, 151.2740478515625, 155.12725830078125, 158.98048400878906, 162.83370971679688, 166.68692016601562, 170.54014587402344, 174.39337158203125, 178.24658203125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 6.0, 4.0, 6.0, 7.0, 10.0, 7.0, 12.0, 16.0, 18.0, 24.0, 22.0, 19.0, 44.0, 19.0, 40.0, 28.0, 35.0, 39.0, 32.0, 52.0, 46.0, 40.0, 43.0, 37.0, 41.0, 47.0, 40.0, 43.0, 34.0, 31.0, 27.0, 18.0, 25.0, 12.0, 22.0, 11.0, 12.0, 10.0, 4.0, 5.0, 3.0, 4.0, 9.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.158470153808594, -36.744163513183594, -35.32985305786133, -33.91554641723633, -32.50123596191406, -31.086929321289062, -29.67262077331543, -28.258312225341797, -26.844005584716797, -25.429697036743164, -24.01538848876953, -22.60108184814453, -21.1867733001709, -19.772464752197266, -18.358156204223633, -16.94384765625, -15.529539108276367, -14.115230560302734, -12.700922966003418, -11.286614418029785, -9.872306823730469, -8.457998275756836, -7.043689727783203, -5.629382133483887, -4.215073585510254, -2.8007655143737793, -1.3864572048187256, 0.027851104736328125, 1.4421591758728027, 2.8564672470092773, 4.27077579498291, 5.685083389282227, 7.099391937255859, 8.513700485229492, 9.928008079528809, 11.342316627502441, 12.756624221801758, 14.17093276977539, 15.585241317749023, 16.999549865722656, 18.413856506347656, 19.82816505432129, 21.242473602294922, 22.656780242919922, 24.071088790893555, 25.485397338867188, 26.89970588684082, 28.314014434814453, 29.728322982788086, 31.14263153076172, 32.55693817138672, 33.971248626708984, 35.385555267333984, 36.79986572265625, 38.21417236328125, 39.62847900390625, 41.042789459228516, 42.457096099853516, 43.87140655517578, 45.28571319580078, 46.70002365112305, 48.11433029174805, 49.52864074707031, 50.94294738769531, 52.35725402832031]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 7.0, 10.0, 21.0, 33.0, 37.0, 86.0, 183.0, 338.0, 854.0, 2798.0, 14828.0, 3051303.0, 1105716.0, 13772.0, 2650.0, 891.0, 338.0, 166.0, 95.0, 58.0, 38.0, 20.0, 9.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0078125, -14.4071044921875, -13.806396484375, -13.2056884765625, -12.60498046875, -12.0042724609375, -11.403564453125, -10.8028564453125, -10.2021484375, -9.6014404296875, -9.000732421875, -8.4000244140625, -7.79931640625, -7.1986083984375, -6.597900390625, -5.9971923828125, -5.396484375, -4.7957763671875, -4.195068359375, -3.5943603515625, -2.99365234375, -2.3929443359375, -1.792236328125, -1.1915283203125, -0.5908203125, 0.0098876953125, 0.610595703125, 1.2113037109375, 1.81201171875, 2.4127197265625, 3.013427734375, 3.6141357421875, 4.21484375, 4.8155517578125, 5.416259765625, 6.0169677734375, 6.61767578125, 7.2183837890625, 7.819091796875, 8.4197998046875, 9.0205078125, 9.6212158203125, 10.221923828125, 10.8226318359375, 11.42333984375, 12.0240478515625, 12.624755859375, 13.2254638671875, 13.826171875, 14.4268798828125, 15.027587890625, 15.6282958984375, 16.22900390625, 16.8297119140625, 17.430419921875, 18.0311279296875, 18.6318359375, 19.2325439453125, 19.833251953125, 20.4339599609375, 21.03466796875, 21.6353759765625, 22.236083984375, 22.8367919921875, 23.4375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 13.0, 10.0, 25.0, 40.0, 44.0, 55.0, 68.0, 86.0, 94.0, 96.0, 90.0, 93.0, 78.0, 54.0, 42.0, 29.0, 34.0, 24.0, 7.0, 10.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.440826416015625, -3.30157470703125, -3.162322998046875, -3.0230712890625, -2.883819580078125, -2.74456787109375, -2.605316162109375, -2.466064453125, -2.326812744140625, -2.18756103515625, -2.048309326171875, -1.9090576171875, -1.769805908203125, -1.63055419921875, -1.491302490234375, -1.35205078125, -1.212799072265625, -1.07354736328125, -0.934295654296875, -0.7950439453125, -0.655792236328125, -0.51654052734375, -0.377288818359375, -0.238037109375, -0.098785400390625, 0.04046630859375, 0.179718017578125, 0.3189697265625, 0.458221435546875, 0.59747314453125, 0.736724853515625, 0.8759765625, 1.015228271484375, 1.15447998046875, 1.293731689453125, 1.4329833984375, 1.572235107421875, 1.71148681640625, 1.850738525390625, 1.989990234375, 2.129241943359375, 2.26849365234375, 2.407745361328125, 2.5469970703125, 2.686248779296875, 2.82550048828125, 2.964752197265625, 3.10400390625, 3.243255615234375, 3.38250732421875, 3.521759033203125, 3.6610107421875, 3.800262451171875, 3.93951416015625, 4.078765869140625, 4.218017578125, 4.357269287109375, 4.49652099609375, 4.635772705078125, 4.7750244140625, 4.914276123046875, 5.05352783203125, 5.192779541015625, 5.33203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 7.0, 12.0, 18.0, 43.0, 60.0, 108.0, 109.0, 217.0, 371.0, 813.0, 1840.0, 5211.0, 21864.0, 321444.0, 3784361.0, 44812.0, 8287.0, 2538.0, 956.0, 518.0, 268.0, 132.0, 105.0, 72.0, 43.0, 15.0, 14.0, 17.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.40625, -10.970703125, -10.53515625, -10.099609375, -9.6640625, -9.228515625, -8.79296875, -8.357421875, -7.921875, -7.486328125, -7.05078125, -6.615234375, -6.1796875, -5.744140625, -5.30859375, -4.873046875, -4.4375, -4.001953125, -3.56640625, -3.130859375, -2.6953125, -2.259765625, -1.82421875, -1.388671875, -0.953125, -0.517578125, -0.08203125, 0.353515625, 0.7890625, 1.224609375, 1.66015625, 2.095703125, 2.53125, 2.966796875, 3.40234375, 3.837890625, 4.2734375, 4.708984375, 5.14453125, 5.580078125, 6.015625, 6.451171875, 6.88671875, 7.322265625, 7.7578125, 8.193359375, 8.62890625, 9.064453125, 9.5, 9.935546875, 10.37109375, 10.806640625, 11.2421875, 11.677734375, 12.11328125, 12.548828125, 12.984375, 13.419921875, 13.85546875, 14.291015625, 14.7265625, 15.162109375, 15.59765625, 16.033203125, 16.46875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 0.0, 0.0, 4.0, 6.0, 5.0, 8.0, 18.0, 31.0, 64.0, 109.0, 536.0, 2831.0, 289.0, 87.0, 40.0, 17.0, 11.0, 8.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.9072265625, -3.705078125, -3.5029296875, -3.30078125, -3.0986328125, -2.896484375, -2.6943359375, -2.4921875, -2.2900390625, -2.087890625, -1.8857421875, -1.68359375, -1.4814453125, -1.279296875, -1.0771484375, -0.875, -0.6728515625, -0.470703125, -0.2685546875, -0.06640625, 0.1357421875, 0.337890625, 0.5400390625, 0.7421875, 0.9443359375, 1.146484375, 1.3486328125, 1.55078125, 1.7529296875, 1.955078125, 2.1572265625, 2.359375, 2.5615234375, 2.763671875, 2.9658203125, 3.16796875, 3.3701171875, 3.572265625, 3.7744140625, 3.9765625, 4.1787109375, 4.380859375, 4.5830078125, 4.78515625, 4.9873046875, 5.189453125, 5.3916015625, 5.59375, 5.7958984375, 5.998046875, 6.2001953125, 6.40234375, 6.6044921875, 6.806640625, 7.0087890625, 7.2109375, 7.4130859375, 7.615234375, 7.8173828125, 8.01953125, 8.2216796875, 8.423828125, 8.6259765625, 8.828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 16.0, 21.0, 20.0, 55.0, 108.0, 192.0, 198.0, 196.0, 91.0, 57.0, 24.0, 7.0, 8.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.190452575683594, -40.322509765625, -39.454566955566406, -38.58662414550781, -37.71868133544922, -36.850738525390625, -35.98279571533203, -35.11484909057617, -34.24690628051758, -33.378963470458984, -32.51102066040039, -31.643077850341797, -30.77513313293457, -29.907190322875977, -29.039247512817383, -28.17130470275879, -27.303361892700195, -26.4354190826416, -25.567476272583008, -24.69953155517578, -23.831588745117188, -22.963645935058594, -22.095703125, -21.227760314941406, -20.359817504882812, -19.49187469482422, -18.623931884765625, -17.75598907470703, -16.888044357299805, -16.02010154724121, -15.152158737182617, -14.284215927124023, -13.416272163391113, -12.54832935333252, -11.68038558959961, -10.812442779541016, -9.944499969482422, -9.076556205749512, -8.208613395690918, -7.340670108795166, -6.472726821899414, -5.604783535003662, -4.73684024810791, -3.8688974380493164, -3.0009541511535645, -2.1330108642578125, -1.2650680541992188, -0.3971247673034668, 0.47081851959228516, 1.3387616872787476, 2.20670485496521, 3.074647903442383, 3.9425911903381348, 4.810534477233887, 5.6784772872924805, 6.546420574188232, 7.414363861083984, 8.282306671142578, 9.150250434875488, 10.018193244934082, 10.886137008666992, 11.754079818725586, 12.62202262878418, 13.489965438842773, 14.357909202575684]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 13.0, 2.0, 9.0, 11.0, 13.0, 21.0, 19.0, 25.0, 25.0, 28.0, 24.0, 30.0, 40.0, 38.0, 28.0, 37.0, 46.0, 53.0, 40.0, 48.0, 44.0, 34.0, 61.0, 30.0, 41.0, 35.0, 28.0, 33.0, 27.0, 18.0, 15.0, 10.0, 17.0, 14.0, 9.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.52735424041748, -10.2219877243042, -9.916621208190918, -9.611254692077637, -9.305888175964355, -9.000521659851074, -8.695155143737793, -8.389788627624512, -8.08442211151123, -7.779055595397949, -7.473689079284668, -7.168322563171387, -6.8629560470581055, -6.557589530944824, -6.252223014831543, -5.946856498718262, -5.6414899826049805, -5.336123466491699, -5.030756950378418, -4.725390434265137, -4.4200239181518555, -4.114657402038574, -3.809290885925293, -3.5039243698120117, -3.1985578536987305, -2.893191337585449, -2.587824821472168, -2.2824583053588867, -1.9770917892456055, -1.6717252731323242, -1.366358757019043, -1.0609922409057617, -0.7556266784667969, -0.4502601623535156, -0.14489364624023438, 0.16047286987304688, 0.4658393859863281, 0.7712059020996094, 1.0765724182128906, 1.3819389343261719, 1.6873054504394531, 1.9926719665527344, 2.2980384826660156, 2.603404998779297, 2.908771514892578, 3.2141380310058594, 3.5195045471191406, 3.824871063232422, 4.130237579345703, 4.435604095458984, 4.740970611572266, 5.046337127685547, 5.351703643798828, 5.657070159912109, 5.962436676025391, 6.267803192138672, 6.573169708251953, 6.878536224365234, 7.183902740478516, 7.489269256591797, 7.794635772705078, 8.10000228881836, 8.40536880493164, 8.710735321044922, 9.016101837158203]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 9.0, 6.0, 10.0, 12.0, 15.0, 23.0, 45.0, 58.0, 87.0, 197.0, 329.0, 662.0, 1987.0, 7388.0, 31288.0, 191055.0, 646358.0, 136267.0, 23936.0, 5871.0, 1642.0, 575.0, 289.0, 146.0, 101.0, 59.0, 34.0, 43.0, 17.0, 13.0, 8.0, 12.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5, -9.076171875, -8.65234375, -8.228515625, -7.8046875, -7.380859375, -6.95703125, -6.533203125, -6.109375, -5.685546875, -5.26171875, -4.837890625, -4.4140625, -3.990234375, -3.56640625, -3.142578125, -2.71875, -2.294921875, -1.87109375, -1.447265625, -1.0234375, -0.599609375, -0.17578125, 0.248046875, 0.671875, 1.095703125, 1.51953125, 1.943359375, 2.3671875, 2.791015625, 3.21484375, 3.638671875, 4.0625, 4.486328125, 4.91015625, 5.333984375, 5.7578125, 6.181640625, 6.60546875, 7.029296875, 7.453125, 7.876953125, 8.30078125, 8.724609375, 9.1484375, 9.572265625, 9.99609375, 10.419921875, 10.84375, 11.267578125, 11.69140625, 12.115234375, 12.5390625, 12.962890625, 13.38671875, 13.810546875, 14.234375, 14.658203125, 15.08203125, 15.505859375, 15.9296875, 16.353515625, 16.77734375, 17.201171875, 17.625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 15.0, 28.0, 37.0, 50.0, 70.0, 92.0, 93.0, 103.0, 97.0, 93.0, 92.0, 64.0, 45.0, 31.0, 38.0, 29.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.806640625, -3.655059814453125, -3.50347900390625, -3.351898193359375, -3.2003173828125, -3.048736572265625, -2.89715576171875, -2.745574951171875, -2.593994140625, -2.442413330078125, -2.29083251953125, -2.139251708984375, -1.9876708984375, -1.836090087890625, -1.68450927734375, -1.532928466796875, -1.38134765625, -1.229766845703125, -1.07818603515625, -0.926605224609375, -0.7750244140625, -0.623443603515625, -0.47186279296875, -0.320281982421875, -0.168701171875, -0.017120361328125, 0.13446044921875, 0.286041259765625, 0.4376220703125, 0.589202880859375, 0.74078369140625, 0.892364501953125, 1.0439453125, 1.195526123046875, 1.34710693359375, 1.498687744140625, 1.6502685546875, 1.801849365234375, 1.95343017578125, 2.105010986328125, 2.256591796875, 2.408172607421875, 2.55975341796875, 2.711334228515625, 2.8629150390625, 3.014495849609375, 3.16607666015625, 3.317657470703125, 3.46923828125, 3.620819091796875, 3.77239990234375, 3.923980712890625, 4.0755615234375, 4.227142333984375, 4.37872314453125, 4.530303955078125, 4.681884765625, 4.833465576171875, 4.98504638671875, 5.136627197265625, 5.2882080078125, 5.439788818359375, 5.59136962890625, 5.742950439453125, 5.89453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 5.0, 8.0, 6.0, 15.0, 20.0, 26.0, 45.0, 58.0, 101.0, 176.0, 290.0, 540.0, 1119.0, 2164.0, 5041.0, 12309.0, 36063.0, 132088.0, 505809.0, 257075.0, 62460.0, 19617.0, 7209.0, 3167.0, 1475.0, 734.0, 394.0, 206.0, 113.0, 76.0, 50.0, 34.0, 21.0, 13.0, 11.0, 8.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0390625, -7.78564453125, -7.5322265625, -7.27880859375, -7.025390625, -6.77197265625, -6.5185546875, -6.26513671875, -6.01171875, -5.75830078125, -5.5048828125, -5.25146484375, -4.998046875, -4.74462890625, -4.4912109375, -4.23779296875, -3.984375, -3.73095703125, -3.4775390625, -3.22412109375, -2.970703125, -2.71728515625, -2.4638671875, -2.21044921875, -1.95703125, -1.70361328125, -1.4501953125, -1.19677734375, -0.943359375, -0.68994140625, -0.4365234375, -0.18310546875, 0.0703125, 0.32373046875, 0.5771484375, 0.83056640625, 1.083984375, 1.33740234375, 1.5908203125, 1.84423828125, 2.09765625, 2.35107421875, 2.6044921875, 2.85791015625, 3.111328125, 3.36474609375, 3.6181640625, 3.87158203125, 4.125, 4.37841796875, 4.6318359375, 4.88525390625, 5.138671875, 5.39208984375, 5.6455078125, 5.89892578125, 6.15234375, 6.40576171875, 6.6591796875, 6.91259765625, 7.166015625, 7.41943359375, 7.6728515625, 7.92626953125, 8.1796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 8.0, 6.0, 3.0, 7.0, 11.0, 8.0, 18.0, 16.0, 18.0, 29.0, 31.0, 23.0, 41.0, 39.0, 45.0, 53.0, 68.0, 50.0, 57.0, 74.0, 53.0, 52.0, 47.0, 37.0, 40.0, 30.0, 24.0, 31.0, 21.0, 13.0, 13.0, 10.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.5078125, -9.1640625, -8.8203125, -8.4765625, -8.1328125, -7.7890625, -7.4453125, -7.1015625, -6.7578125, -6.4140625, -6.0703125, -5.7265625, -5.3828125, -5.0390625, -4.6953125, -4.3515625, -4.0078125, -3.6640625, -3.3203125, -2.9765625, -2.6328125, -2.2890625, -1.9453125, -1.6015625, -1.2578125, -0.9140625, -0.5703125, -0.2265625, 0.1171875, 0.4609375, 0.8046875, 1.1484375, 1.4921875, 1.8359375, 2.1796875, 2.5234375, 2.8671875, 3.2109375, 3.5546875, 3.8984375, 4.2421875, 4.5859375, 4.9296875, 5.2734375, 5.6171875, 5.9609375, 6.3046875, 6.6484375, 6.9921875, 7.3359375, 7.6796875, 8.0234375, 8.3671875, 8.7109375, 9.0546875, 9.3984375, 9.7421875, 10.0859375, 10.4296875, 10.7734375, 11.1171875, 11.4609375, 11.8046875, 12.1484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 8.0, 20.0, 30.0, 40.0, 83.0, 148.0, 324.0, 735.0, 2175.0, 7620.0, 41364.0, 643054.0, 317585.0, 26951.0, 5557.0, 1672.0, 592.0, 296.0, 121.0, 61.0, 39.0, 23.0, 13.0, 11.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.76751708984375, -4.6131591796875, -4.45880126953125, -4.304443359375, -4.15008544921875, -3.9957275390625, -3.84136962890625, -3.68701171875, -3.53265380859375, -3.3782958984375, -3.22393798828125, -3.069580078125, -2.91522216796875, -2.7608642578125, -2.60650634765625, -2.4521484375, -2.29779052734375, -2.1434326171875, -1.98907470703125, -1.834716796875, -1.68035888671875, -1.5260009765625, -1.37164306640625, -1.21728515625, -1.06292724609375, -0.9085693359375, -0.75421142578125, -0.599853515625, -0.44549560546875, -0.2911376953125, -0.13677978515625, 0.017578125, 0.17193603515625, 0.3262939453125, 0.48065185546875, 0.635009765625, 0.78936767578125, 0.9437255859375, 1.09808349609375, 1.25244140625, 1.40679931640625, 1.5611572265625, 1.71551513671875, 1.869873046875, 2.02423095703125, 2.1785888671875, 2.33294677734375, 2.4873046875, 2.64166259765625, 2.7960205078125, 2.95037841796875, 3.104736328125, 3.25909423828125, 3.4134521484375, 3.56781005859375, 3.72216796875, 3.87652587890625, 4.0308837890625, 4.18524169921875, 4.339599609375, 4.49395751953125, 4.6483154296875, 4.80267333984375, 4.95703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 5.0, 11.0, 7.0, 15.0, 23.0, 36.0, 48.0, 114.0, 242.0, 247.0, 80.0, 45.0, 37.0, 18.0, 17.0, 11.0, 12.0, 6.0, 5.0, 5.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009126663208007812, -0.0008872896432876587, -0.0008619129657745361, -0.0008365362882614136, -0.000811159610748291, -0.0007857829332351685, -0.0007604062557220459, -0.0007350295782089233, -0.0007096529006958008, -0.0006842762231826782, -0.0006588995456695557, -0.0006335228681564331, -0.0006081461906433105, -0.000582769513130188, -0.0005573928356170654, -0.0005320161581039429, -0.0005066394805908203, -0.00048126280307769775, -0.0004558861255645752, -0.00043050944805145264, -0.0004051327705383301, -0.0003797560930252075, -0.00035437941551208496, -0.0003290027379989624, -0.00030362606048583984, -0.0002782493829727173, -0.0002528727054595947, -0.00022749602794647217, -0.0002021193504333496, -0.00017674267292022705, -0.0001513659954071045, -0.00012598931789398193, -0.00010061264038085938, -7.523596286773682e-05, -4.985928535461426e-05, -2.44826078414917e-05, 8.940696716308594e-07, 2.6270747184753418e-05, 5.1647424697875977e-05, 7.702410221099854e-05, 0.0001024007797241211, 0.00012777745723724365, 0.0001531541347503662, 0.00017853081226348877, 0.00020390748977661133, 0.0002292841672897339, 0.00025466084480285645, 0.000280037522315979, 0.00030541419982910156, 0.0003307908773422241, 0.0003561675548553467, 0.00038154423236846924, 0.0004069209098815918, 0.00043229758739471436, 0.0004576742649078369, 0.00048305094242095947, 0.000508427619934082, 0.0005338042974472046, 0.0005591809749603271, 0.0005845576524734497, 0.0006099343299865723, 0.0006353110074996948, 0.0006606876850128174, 0.0006860643625259399, 0.0007114410400390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 2.0, 7.0, 8.0, 16.0, 20.0, 29.0, 44.0, 67.0, 97.0, 153.0, 275.0, 404.0, 710.0, 1354.0, 2462.0, 5618.0, 14110.0, 48171.0, 411275.0, 483716.0, 53015.0, 15240.0, 5786.0, 2597.0, 1380.0, 794.0, 459.0, 270.0, 162.0, 105.0, 68.0, 47.0, 25.0, 19.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5703125, -3.44732666015625, -3.3243408203125, -3.20135498046875, -3.078369140625, -2.95538330078125, -2.8323974609375, -2.70941162109375, -2.58642578125, -2.46343994140625, -2.3404541015625, -2.21746826171875, -2.094482421875, -1.97149658203125, -1.8485107421875, -1.72552490234375, -1.6025390625, -1.47955322265625, -1.3565673828125, -1.23358154296875, -1.110595703125, -0.98760986328125, -0.8646240234375, -0.74163818359375, -0.61865234375, -0.49566650390625, -0.3726806640625, -0.24969482421875, -0.126708984375, -0.00372314453125, 0.1192626953125, 0.24224853515625, 0.365234375, 0.48822021484375, 0.6112060546875, 0.73419189453125, 0.857177734375, 0.98016357421875, 1.1031494140625, 1.22613525390625, 1.34912109375, 1.47210693359375, 1.5950927734375, 1.71807861328125, 1.841064453125, 1.96405029296875, 2.0870361328125, 2.21002197265625, 2.3330078125, 2.45599365234375, 2.5789794921875, 2.70196533203125, 2.824951171875, 2.94793701171875, 3.0709228515625, 3.19390869140625, 3.31689453125, 3.43988037109375, 3.5628662109375, 3.68585205078125, 3.808837890625, 3.93182373046875, 4.0548095703125, 4.17779541015625, 4.30078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 6.0, 9.0, 10.0, 15.0, 26.0, 33.0, 44.0, 78.0, 161.0, 221.0, 173.0, 71.0, 46.0, 17.0, 24.0, 17.0, 11.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.075439453125, -5.90869140625, -5.741943359375, -5.5751953125, -5.408447265625, -5.24169921875, -5.074951171875, -4.908203125, -4.741455078125, -4.57470703125, -4.407958984375, -4.2412109375, -4.074462890625, -3.90771484375, -3.740966796875, -3.57421875, -3.407470703125, -3.24072265625, -3.073974609375, -2.9072265625, -2.740478515625, -2.57373046875, -2.406982421875, -2.240234375, -2.073486328125, -1.90673828125, -1.739990234375, -1.5732421875, -1.406494140625, -1.23974609375, -1.072998046875, -0.90625, -0.739501953125, -0.57275390625, -0.406005859375, -0.2392578125, -0.072509765625, 0.09423828125, 0.260986328125, 0.427734375, 0.594482421875, 0.76123046875, 0.927978515625, 1.0947265625, 1.261474609375, 1.42822265625, 1.594970703125, 1.76171875, 1.928466796875, 2.09521484375, 2.261962890625, 2.4287109375, 2.595458984375, 2.76220703125, 2.928955078125, 3.095703125, 3.262451171875, 3.42919921875, 3.595947265625, 3.7626953125, 3.929443359375, 4.09619140625, 4.262939453125, 4.4296875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 16.0, 17.0, 18.0, 51.0, 102.0, 152.0, 201.0, 164.0, 127.0, 65.0, 30.0, 20.0, 13.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.76167297363281, -34.56254959106445, -32.363426208496094, -30.16429901123047, -27.96517562866211, -25.76605224609375, -23.566926956176758, -21.367801666259766, -19.168678283691406, -16.969554901123047, -14.770429611206055, -12.571305274963379, -10.372180938720703, -8.173056602478027, -5.973932266235352, -3.774807929992676, -1.57568359375, 0.6234407424926758, 2.8225650787353516, 5.021689414978027, 7.220813751220703, 9.419938087463379, 11.619062423706055, 13.81818675994873, 16.017311096191406, 18.216434478759766, 20.415559768676758, 22.61468505859375, 24.81380844116211, 27.01293182373047, 29.21205711364746, 31.411182403564453, 33.61029815673828, 35.80942153930664, 38.008544921875, 40.207672119140625, 42.406795501708984, 44.605918884277344, 46.80504608154297, 49.00416946411133, 51.20329284667969, 53.40241622924805, 55.601539611816406, 57.80066680908203, 59.99979019165039, 62.19891357421875, 64.39804077148438, 66.59716033935547, 68.7962875366211, 70.99541473388672, 73.19453430175781, 75.39366149902344, 77.59278869628906, 79.79190826416016, 81.99103546142578, 84.19015502929688, 86.3892822265625, 88.58840942382812, 90.78752899169922, 92.98665618896484, 95.18577575683594, 97.38490295410156, 99.58403015136719, 101.78314971923828, 103.9822769165039]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 2.0, 4.0, 10.0, 14.0, 21.0, 19.0, 14.0, 23.0, 19.0, 24.0, 27.0, 21.0, 30.0, 31.0, 30.0, 40.0, 43.0, 40.0, 44.0, 39.0, 51.0, 39.0, 35.0, 27.0, 30.0, 36.0, 31.0, 31.0, 23.0, 29.0, 22.0, 14.0, 17.0, 20.0, 20.0, 11.0, 13.0, 9.0, 12.0, 5.0, 9.0, 10.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.0693359375, -40.86619186401367, -39.663047790527344, -38.459903717041016, -37.25675964355469, -36.05361557006836, -34.85047149658203, -33.64732360839844, -32.444183349609375, -31.241039276123047, -30.03789520263672, -28.83475112915039, -27.631607055664062, -26.428462982177734, -25.225317001342773, -24.022172927856445, -22.819026947021484, -21.615882873535156, -20.412738800048828, -19.2095947265625, -18.006450653076172, -16.803306579589844, -15.600160598754883, -14.397016525268555, -13.193872451782227, -11.990728378295898, -10.78758430480957, -9.584439277648926, -8.381295204162598, -7.1781511306762695, -5.975006580352783, -4.771862030029297, -3.5687179565429688, -2.3655736446380615, -1.1624293327331543, 0.04071497917175293, 1.2438592910766602, 2.4470033645629883, 3.6501479148864746, 4.853292465209961, 6.056436538696289, 7.259580612182617, 8.462724685668945, 9.66586971282959, 10.869013786315918, 12.072157859802246, 13.27530288696289, 14.478446960449219, 15.681591033935547, 16.884735107421875, 18.087879180908203, 19.29102325439453, 20.49416732788086, 21.697311401367188, 22.90045738220215, 24.103601455688477, 25.306745529174805, 26.509889602661133, 27.71303367614746, 28.91617774963379, 30.11932373046875, 31.322467803955078, 32.525611877441406, 33.728755950927734, 34.93190002441406]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 15.0, 12.0, 35.0, 36.0, 64.0, 126.0, 222.0, 507.0, 1437.0, 5724.0, 65795.0, 4094487.0, 21084.0, 3070.0, 841.0, 362.0, 196.0, 113.0, 57.0, 40.0, 19.0, 14.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.1875, -32.88818359375, -31.5888671875, -30.28955078125, -28.990234375, -27.69091796875, -26.3916015625, -25.09228515625, -23.79296875, -22.49365234375, -21.1943359375, -19.89501953125, -18.595703125, -17.29638671875, -15.9970703125, -14.69775390625, -13.3984375, -12.09912109375, -10.7998046875, -9.50048828125, -8.201171875, -6.90185546875, -5.6025390625, -4.30322265625, -3.00390625, -1.70458984375, -0.4052734375, 0.89404296875, 2.193359375, 3.49267578125, 4.7919921875, 6.09130859375, 7.390625, 8.68994140625, 9.9892578125, 11.28857421875, 12.587890625, 13.88720703125, 15.1865234375, 16.48583984375, 17.78515625, 19.08447265625, 20.3837890625, 21.68310546875, 22.982421875, 24.28173828125, 25.5810546875, 26.88037109375, 28.1796875, 29.47900390625, 30.7783203125, 32.07763671875, 33.376953125, 34.67626953125, 35.9755859375, 37.27490234375, 38.57421875, 39.87353515625, 41.1728515625, 42.47216796875, 43.771484375, 45.07080078125, 46.3701171875, 47.66943359375, 48.96875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 10.0, 13.0, 25.0, 33.0, 42.0, 56.0, 60.0, 85.0, 82.0, 77.0, 84.0, 83.0, 75.0, 69.0, 50.0, 44.0, 34.0, 36.0, 17.0, 14.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.625, -3.486083984375, -3.34716796875, -3.208251953125, -3.0693359375, -2.930419921875, -2.79150390625, -2.652587890625, -2.513671875, -2.374755859375, -2.23583984375, -2.096923828125, -1.9580078125, -1.819091796875, -1.68017578125, -1.541259765625, -1.40234375, -1.263427734375, -1.12451171875, -0.985595703125, -0.8466796875, -0.707763671875, -0.56884765625, -0.429931640625, -0.291015625, -0.152099609375, -0.01318359375, 0.125732421875, 0.2646484375, 0.403564453125, 0.54248046875, 0.681396484375, 0.8203125, 0.959228515625, 1.09814453125, 1.237060546875, 1.3759765625, 1.514892578125, 1.65380859375, 1.792724609375, 1.931640625, 2.070556640625, 2.20947265625, 2.348388671875, 2.4873046875, 2.626220703125, 2.76513671875, 2.904052734375, 3.04296875, 3.181884765625, 3.32080078125, 3.459716796875, 3.5986328125, 3.737548828125, 3.87646484375, 4.015380859375, 4.154296875, 4.293212890625, 4.43212890625, 4.571044921875, 4.7099609375, 4.848876953125, 4.98779296875, 5.126708984375, 5.265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 5.0, 13.0, 18.0, 19.0, 30.0, 30.0, 49.0, 75.0, 115.0, 230.0, 500.0, 1251.0, 3646.0, 13124.0, 84562.0, 3978944.0, 91798.0, 13706.0, 3825.0, 1191.0, 527.0, 232.0, 129.0, 74.0, 56.0, 30.0, 25.0, 17.0, 6.0, 6.0, 7.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.21875, -20.621337890625, -20.02392578125, -19.426513671875, -18.8291015625, -18.231689453125, -17.63427734375, -17.036865234375, -16.439453125, -15.842041015625, -15.24462890625, -14.647216796875, -14.0498046875, -13.452392578125, -12.85498046875, -12.257568359375, -11.66015625, -11.062744140625, -10.46533203125, -9.867919921875, -9.2705078125, -8.673095703125, -8.07568359375, -7.478271484375, -6.880859375, -6.283447265625, -5.68603515625, -5.088623046875, -4.4912109375, -3.893798828125, -3.29638671875, -2.698974609375, -2.1015625, -1.504150390625, -0.90673828125, -0.309326171875, 0.2880859375, 0.885498046875, 1.48291015625, 2.080322265625, 2.677734375, 3.275146484375, 3.87255859375, 4.469970703125, 5.0673828125, 5.664794921875, 6.26220703125, 6.859619140625, 7.45703125, 8.054443359375, 8.65185546875, 9.249267578125, 9.8466796875, 10.444091796875, 11.04150390625, 11.638916015625, 12.236328125, 12.833740234375, 13.43115234375, 14.028564453125, 14.6259765625, 15.223388671875, 15.82080078125, 16.418212890625, 17.015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 9.0, 15.0, 30.0, 55.0, 132.0, 1312.0, 2284.0, 111.0, 51.0, 26.0, 12.0, 10.0, 7.0, 3.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.46875, -12.185546875, -11.90234375, -11.619140625, -11.3359375, -11.052734375, -10.76953125, -10.486328125, -10.203125, -9.919921875, -9.63671875, -9.353515625, -9.0703125, -8.787109375, -8.50390625, -8.220703125, -7.9375, -7.654296875, -7.37109375, -7.087890625, -6.8046875, -6.521484375, -6.23828125, -5.955078125, -5.671875, -5.388671875, -5.10546875, -4.822265625, -4.5390625, -4.255859375, -3.97265625, -3.689453125, -3.40625, -3.123046875, -2.83984375, -2.556640625, -2.2734375, -1.990234375, -1.70703125, -1.423828125, -1.140625, -0.857421875, -0.57421875, -0.291015625, -0.0078125, 0.275390625, 0.55859375, 0.841796875, 1.125, 1.408203125, 1.69140625, 1.974609375, 2.2578125, 2.541015625, 2.82421875, 3.107421875, 3.390625, 3.673828125, 3.95703125, 4.240234375, 4.5234375, 4.806640625, 5.08984375, 5.373046875, 5.65625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 10.0, 14.0, 26.0, 44.0, 90.0, 160.0, 232.0, 230.0, 104.0, 55.0, 21.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.45697784423828, -49.33268737792969, -48.208396911621094, -47.0841064453125, -45.959815979003906, -44.83552551269531, -43.71123504638672, -42.58694839477539, -41.4626579284668, -40.3383674621582, -39.21407699584961, -38.089786529541016, -36.96549606323242, -35.841209411621094, -34.7169189453125, -33.592628479003906, -32.46833801269531, -31.34404754638672, -30.219757080078125, -29.09546661376953, -27.97117805480957, -26.846887588500977, -25.722597122192383, -24.59830665588379, -23.474014282226562, -22.34972381591797, -21.225433349609375, -20.10114288330078, -18.97685432434082, -17.852563858032227, -16.728273391723633, -15.603982925415039, -14.479692459106445, -13.355401992797852, -12.231112480163574, -11.10682201385498, -9.982532501220703, -8.85824203491211, -7.733951568603516, -6.60966157913208, -5.4853715896606445, -4.361081600189209, -3.2367913722991943, -2.1125011444091797, -0.9882111549377441, 0.1360788345336914, 1.2603693008422852, 2.3846592903137207, 3.5089492797851562, 4.633239269256592, 5.757529258728027, 6.881819725036621, 8.006109237670898, 9.130399703979492, 10.254690170288086, 11.37898063659668, 12.503270149230957, 13.62756061553955, 14.751850128173828, 15.876140594482422, 17.000431060791016, 18.12472152709961, 19.249011993408203, 20.373300552368164, 21.497591018676758]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 10.0, 14.0, 20.0, 15.0, 27.0, 32.0, 35.0, 40.0, 36.0, 43.0, 46.0, 71.0, 51.0, 61.0, 53.0, 57.0, 59.0, 50.0, 58.0, 42.0, 42.0, 27.0, 21.0, 22.0, 14.0, 14.0, 9.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.091163635253906, -15.572766304016113, -15.05436897277832, -14.535971641540527, -14.017574310302734, -13.499177932739258, -12.980780601501465, -12.462383270263672, -11.943985939025879, -11.425588607788086, -10.907191276550293, -10.3887939453125, -9.870397567749023, -9.351999282836914, -8.833602905273438, -8.315205574035645, -7.796808242797852, -7.278410911560059, -6.760013580322266, -6.241616725921631, -5.723219394683838, -5.204822063446045, -4.68642520904541, -4.168027877807617, -3.649630546569824, -3.1312332153320312, -2.6128361225128174, -2.0944390296936035, -1.5760416984558105, -1.0576443672180176, -0.5392472743988037, -0.020850181579589844, 0.4975471496582031, 1.0159443616867065, 1.53434157371521, 2.052738666534424, 2.571135997772217, 3.0895333290100098, 3.6079304218292236, 4.1263275146484375, 4.6447248458862305, 5.163122177124023, 5.681519508361816, 6.199916362762451, 6.718313694000244, 7.236711025238037, 7.755107879638672, 8.273505210876465, 8.791902542114258, 9.31029987335205, 9.828697204589844, 10.347094535827637, 10.86549186706543, 11.383888244628906, 11.9022855758667, 12.420682907104492, 12.939080238342285, 13.457477569580078, 13.975874900817871, 14.494272232055664, 15.01266860961914, 15.53106689453125, 16.049463272094727, 16.567859649658203, 17.086257934570312]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 1.0, 6.0, 5.0, 5.0, 9.0, 8.0, 14.0, 17.0, 35.0, 67.0, 129.0, 288.0, 534.0, 1110.0, 2814.0, 8106.0, 34628.0, 277297.0, 624401.0, 77738.0, 13988.0, 4158.0, 1697.0, 711.0, 373.0, 167.0, 94.0, 49.0, 32.0, 20.0, 22.0, 11.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.349609375, -17.76171875, -17.173828125, -16.5859375, -15.998046875, -15.41015625, -14.822265625, -14.234375, -13.646484375, -13.05859375, -12.470703125, -11.8828125, -11.294921875, -10.70703125, -10.119140625, -9.53125, -8.943359375, -8.35546875, -7.767578125, -7.1796875, -6.591796875, -6.00390625, -5.416015625, -4.828125, -4.240234375, -3.65234375, -3.064453125, -2.4765625, -1.888671875, -1.30078125, -0.712890625, -0.125, 0.462890625, 1.05078125, 1.638671875, 2.2265625, 2.814453125, 3.40234375, 3.990234375, 4.578125, 5.166015625, 5.75390625, 6.341796875, 6.9296875, 7.517578125, 8.10546875, 8.693359375, 9.28125, 9.869140625, 10.45703125, 11.044921875, 11.6328125, 12.220703125, 12.80859375, 13.396484375, 13.984375, 14.572265625, 15.16015625, 15.748046875, 16.3359375, 16.923828125, 17.51171875, 18.099609375, 18.6875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 15.0, 14.0, 20.0, 31.0, 37.0, 64.0, 56.0, 76.0, 82.0, 77.0, 80.0, 91.0, 67.0, 71.0, 57.0, 45.0, 37.0, 24.0, 30.0, 14.0, 7.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.38031005859375, -3.2410888671875, -3.10186767578125, -2.962646484375, -2.82342529296875, -2.6842041015625, -2.54498291015625, -2.40576171875, -2.26654052734375, -2.1273193359375, -1.98809814453125, -1.848876953125, -1.70965576171875, -1.5704345703125, -1.43121337890625, -1.2919921875, -1.15277099609375, -1.0135498046875, -0.87432861328125, -0.735107421875, -0.59588623046875, -0.4566650390625, -0.31744384765625, -0.17822265625, -0.03900146484375, 0.1002197265625, 0.23944091796875, 0.378662109375, 0.51788330078125, 0.6571044921875, 0.79632568359375, 0.935546875, 1.07476806640625, 1.2139892578125, 1.35321044921875, 1.492431640625, 1.63165283203125, 1.7708740234375, 1.91009521484375, 2.04931640625, 2.18853759765625, 2.3277587890625, 2.46697998046875, 2.606201171875, 2.74542236328125, 2.8846435546875, 3.02386474609375, 3.1630859375, 3.30230712890625, 3.4415283203125, 3.58074951171875, 3.719970703125, 3.85919189453125, 3.9984130859375, 4.13763427734375, 4.27685546875, 4.41607666015625, 4.5552978515625, 4.69451904296875, 4.833740234375, 4.97296142578125, 5.1121826171875, 5.25140380859375, 5.390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 8.0, 12.0, 22.0, 35.0, 49.0, 72.0, 117.0, 189.0, 320.0, 602.0, 1199.0, 2543.0, 5775.0, 16417.0, 60752.0, 364859.0, 485012.0, 78431.0, 19703.0, 6848.0, 2774.0, 1286.0, 619.0, 351.0, 183.0, 132.0, 88.0, 51.0, 23.0, 26.0, 10.0, 11.0, 4.0, 10.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.0230712890625, -8.663330078125, -8.3035888671875, -7.94384765625, -7.5841064453125, -7.224365234375, -6.8646240234375, -6.5048828125, -6.1451416015625, -5.785400390625, -5.4256591796875, -5.06591796875, -4.7061767578125, -4.346435546875, -3.9866943359375, -3.626953125, -3.2672119140625, -2.907470703125, -2.5477294921875, -2.18798828125, -1.8282470703125, -1.468505859375, -1.1087646484375, -0.7490234375, -0.3892822265625, -0.029541015625, 0.3302001953125, 0.68994140625, 1.0496826171875, 1.409423828125, 1.7691650390625, 2.12890625, 2.4886474609375, 2.848388671875, 3.2081298828125, 3.56787109375, 3.9276123046875, 4.287353515625, 4.6470947265625, 5.0068359375, 5.3665771484375, 5.726318359375, 6.0860595703125, 6.44580078125, 6.8055419921875, 7.165283203125, 7.5250244140625, 7.884765625, 8.2445068359375, 8.604248046875, 8.9639892578125, 9.32373046875, 9.6834716796875, 10.043212890625, 10.4029541015625, 10.7626953125, 11.1224365234375, 11.482177734375, 11.8419189453125, 12.20166015625, 12.5614013671875, 12.921142578125, 13.2808837890625, 13.640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 8.0, 15.0, 16.0, 23.0, 21.0, 24.0, 32.0, 31.0, 41.0, 50.0, 57.0, 63.0, 75.0, 66.0, 71.0, 67.0, 49.0, 61.0, 45.0, 37.0, 31.0, 23.0, 21.0, 8.0, 11.0, 6.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-20.4375, -19.9178466796875, -19.398193359375, -18.8785400390625, -18.35888671875, -17.8392333984375, -17.319580078125, -16.7999267578125, -16.2802734375, -15.7606201171875, -15.240966796875, -14.7213134765625, -14.20166015625, -13.6820068359375, -13.162353515625, -12.6427001953125, -12.123046875, -11.6033935546875, -11.083740234375, -10.5640869140625, -10.04443359375, -9.5247802734375, -9.005126953125, -8.4854736328125, -7.9658203125, -7.4461669921875, -6.926513671875, -6.4068603515625, -5.88720703125, -5.3675537109375, -4.847900390625, -4.3282470703125, -3.80859375, -3.2889404296875, -2.769287109375, -2.2496337890625, -1.72998046875, -1.2103271484375, -0.690673828125, -0.1710205078125, 0.3486328125, 0.8682861328125, 1.387939453125, 1.9075927734375, 2.42724609375, 2.9468994140625, 3.466552734375, 3.9862060546875, 4.505859375, 5.0255126953125, 5.545166015625, 6.0648193359375, 6.58447265625, 7.1041259765625, 7.623779296875, 8.1434326171875, 8.6630859375, 9.1827392578125, 9.702392578125, 10.2220458984375, 10.74169921875, 11.2613525390625, 11.781005859375, 12.3006591796875, 12.8203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 12.0, 15.0, 25.0, 32.0, 47.0, 48.0, 72.0, 131.0, 201.0, 403.0, 895.0, 2565.0, 10222.0, 84859.0, 888666.0, 49094.0, 7604.0, 2000.0, 764.0, 353.0, 191.0, 103.0, 64.0, 47.0, 30.0, 21.0, 23.0, 17.0, 12.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.140625, -15.67138671875, -15.2021484375, -14.73291015625, -14.263671875, -13.79443359375, -13.3251953125, -12.85595703125, -12.38671875, -11.91748046875, -11.4482421875, -10.97900390625, -10.509765625, -10.04052734375, -9.5712890625, -9.10205078125, -8.6328125, -8.16357421875, -7.6943359375, -7.22509765625, -6.755859375, -6.28662109375, -5.8173828125, -5.34814453125, -4.87890625, -4.40966796875, -3.9404296875, -3.47119140625, -3.001953125, -2.53271484375, -2.0634765625, -1.59423828125, -1.125, -0.65576171875, -0.1865234375, 0.28271484375, 0.751953125, 1.22119140625, 1.6904296875, 2.15966796875, 2.62890625, 3.09814453125, 3.5673828125, 4.03662109375, 4.505859375, 4.97509765625, 5.4443359375, 5.91357421875, 6.3828125, 6.85205078125, 7.3212890625, 7.79052734375, 8.259765625, 8.72900390625, 9.1982421875, 9.66748046875, 10.13671875, 10.60595703125, 11.0751953125, 11.54443359375, 12.013671875, 12.48291015625, 12.9521484375, 13.42138671875, 13.890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 7.0, 6.0, 13.0, 17.0, 30.0, 50.0, 46.0, 109.0, 230.0, 212.0, 88.0, 58.0, 46.0, 28.0, 16.0, 10.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008792877197265625, -0.0008303225040435791, -0.0007813572883605957, -0.0007323920726776123, -0.0006834268569946289, -0.0006344616413116455, -0.0005854964256286621, -0.0005365312099456787, -0.0004875659942626953, -0.0004386007785797119, -0.0003896355628967285, -0.0003406703472137451, -0.0002917051315307617, -0.00024273991584777832, -0.00019377470016479492, -0.00014480948448181152, -9.584426879882812e-05, -4.6879053115844727e-05, 2.086162567138672e-06, 5.105137825012207e-05, 0.00010001659393310547, 0.00014898180961608887, 0.00019794702529907227, 0.00024691224098205566, 0.00029587745666503906, 0.00034484267234802246, 0.00039380788803100586, 0.00044277310371398926, 0.0004917383193969727, 0.0005407035350799561, 0.0005896687507629395, 0.0006386339664459229, 0.0006875991821289062, 0.0007365643978118896, 0.000785529613494873, 0.0008344948291778564, 0.0008834600448608398, 0.0009324252605438232, 0.0009813904762268066, 0.00103035569190979, 0.0010793209075927734, 0.0011282861232757568, 0.0011772513389587402, 0.0012262165546417236, 0.001275181770324707, 0.0013241469860076904, 0.0013731122016906738, 0.0014220774173736572, 0.0014710426330566406, 0.001520007848739624, 0.0015689730644226074, 0.0016179382801055908, 0.0016669034957885742, 0.0017158687114715576, 0.001764833927154541, 0.0018137991428375244, 0.0018627643585205078, 0.0019117295742034912, 0.0019606947898864746, 0.002009660005569458, 0.0020586252212524414, 0.002107590436935425, 0.002156555652618408, 0.0022055208683013916, 0.002254486083984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 5.0, 7.0, 8.0, 13.0, 17.0, 48.0, 62.0, 125.0, 233.0, 517.0, 1231.0, 2922.0, 9237.0, 45317.0, 795543.0, 166127.0, 18964.0, 4898.0, 1709.0, 779.0, 350.0, 202.0, 90.0, 52.0, 42.0, 14.0, 10.0, 7.0, 2.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-18.203125, -17.7564697265625, -17.309814453125, -16.8631591796875, -16.41650390625, -15.9698486328125, -15.523193359375, -15.0765380859375, -14.6298828125, -14.1832275390625, -13.736572265625, -13.2899169921875, -12.84326171875, -12.3966064453125, -11.949951171875, -11.5032958984375, -11.056640625, -10.6099853515625, -10.163330078125, -9.7166748046875, -9.27001953125, -8.8233642578125, -8.376708984375, -7.9300537109375, -7.4833984375, -7.0367431640625, -6.590087890625, -6.1434326171875, -5.69677734375, -5.2501220703125, -4.803466796875, -4.3568115234375, -3.91015625, -3.4635009765625, -3.016845703125, -2.5701904296875, -2.12353515625, -1.6768798828125, -1.230224609375, -0.7835693359375, -0.3369140625, 0.1097412109375, 0.556396484375, 1.0030517578125, 1.44970703125, 1.8963623046875, 2.343017578125, 2.7896728515625, 3.236328125, 3.6829833984375, 4.129638671875, 4.5762939453125, 5.02294921875, 5.4696044921875, 5.916259765625, 6.3629150390625, 6.8095703125, 7.2562255859375, 7.702880859375, 8.1495361328125, 8.59619140625, 9.0428466796875, 9.489501953125, 9.9361572265625, 10.3828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 12.0, 8.0, 16.0, 17.0, 35.0, 63.0, 109.0, 269.0, 197.0, 97.0, 49.0, 28.0, 22.0, 14.0, 9.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.515625, -16.0423583984375, -15.569091796875, -15.0958251953125, -14.62255859375, -14.1492919921875, -13.676025390625, -13.2027587890625, -12.7294921875, -12.2562255859375, -11.782958984375, -11.3096923828125, -10.83642578125, -10.3631591796875, -9.889892578125, -9.4166259765625, -8.943359375, -8.4700927734375, -7.996826171875, -7.5235595703125, -7.05029296875, -6.5770263671875, -6.103759765625, -5.6304931640625, -5.1572265625, -4.6839599609375, -4.210693359375, -3.7374267578125, -3.26416015625, -2.7908935546875, -2.317626953125, -1.8443603515625, -1.37109375, -0.8978271484375, -0.424560546875, 0.0487060546875, 0.52197265625, 0.9952392578125, 1.468505859375, 1.9417724609375, 2.4150390625, 2.8883056640625, 3.361572265625, 3.8348388671875, 4.30810546875, 4.7813720703125, 5.254638671875, 5.7279052734375, 6.201171875, 6.6744384765625, 7.147705078125, 7.6209716796875, 8.09423828125, 8.5675048828125, 9.040771484375, 9.5140380859375, 9.9873046875, 10.4605712890625, 10.933837890625, 11.4071044921875, 11.88037109375, 12.3536376953125, 12.826904296875, 13.3001708984375, 13.7734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 10.0, 11.0, 25.0, 27.0, 47.0, 82.0, 115.0, 141.0, 137.0, 135.0, 74.0, 79.0, 33.0, 32.0, 18.0, 16.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.53411865234375, -126.13600158691406, -122.73788452148438, -119.33977508544922, -115.94165802001953, -112.54354095458984, -109.14543151855469, -105.747314453125, -102.34919738769531, -98.95108032226562, -95.55296325683594, -92.15485382080078, -88.7567367553711, -85.3586196899414, -81.96051025390625, -78.56239318847656, -75.16427612304688, -71.76615905761719, -68.3680419921875, -64.96993255615234, -61.571815490722656, -58.17369842529297, -54.77558517456055, -51.377471923828125, -47.97935485839844, -44.58123779296875, -41.18312454223633, -37.785011291503906, -34.38689422607422, -30.988779067993164, -27.59066390991211, -24.192548751831055, -20.79443359375, -17.396318435668945, -13.99820327758789, -10.600088119506836, -7.201972961425781, -3.8038578033447266, -0.4057426452636719, 2.992372512817383, 6.3904876708984375, 9.788602828979492, 13.186717987060547, 16.5848331451416, 19.982948303222656, 23.38106346130371, 26.779178619384766, 30.17729377746582, 33.575408935546875, 36.97352600097656, 40.371639251708984, 43.769752502441406, 47.167869567871094, 50.56598663330078, 53.9640998840332, 57.362213134765625, 60.76033020019531, 64.158447265625, 67.55656433105469, 70.95467376708984, 74.35279083251953, 77.75090789794922, 81.14901733398438, 84.54713439941406, 87.94525146484375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 8.0, 9.0, 14.0, 13.0, 19.0, 20.0, 34.0, 24.0, 32.0, 36.0, 55.0, 53.0, 47.0, 51.0, 71.0, 49.0, 59.0, 53.0, 57.0, 42.0, 49.0, 42.0, 36.0, 27.0, 20.0, 19.0, 16.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.43598937988281, -84.06910705566406, -80.70222473144531, -77.33534240722656, -73.96846008300781, -70.60157775878906, -67.23469543457031, -63.867820739746094, -60.500938415527344, -57.134056091308594, -53.767173767089844, -50.400291442871094, -47.03341293334961, -43.66653060913086, -40.29964828491211, -36.932769775390625, -33.56588363647461, -30.19900131225586, -26.832120895385742, -23.465238571166992, -20.098358154296875, -16.731475830078125, -13.364593505859375, -9.997713088989258, -6.630830764770508, -3.263949155807495, 0.10293245315551758, 3.4698143005371094, 6.836695671081543, 10.203577041625977, 13.570459365844727, 16.937339782714844, 20.304222106933594, 23.671104431152344, 27.03798484802246, 30.40486717224121, 33.77174758911133, 37.13862991333008, 40.50551223754883, 43.87239074707031, 47.23927307128906, 50.60615539550781, 53.97303771972656, 57.33992004394531, 60.7067985534668, 64.07368469238281, 67.44056701660156, 70.80744171142578, 74.17433166503906, 77.54121398925781, 80.90809631347656, 84.27497863769531, 87.64186096191406, 91.00874328613281, 94.37562561035156, 97.74250030517578, 101.10938262939453, 104.47626495361328, 107.84314727783203, 111.21002960205078, 114.57691192626953, 117.94378662109375, 121.3106689453125, 124.67755126953125, 128.04443359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 6.0, 11.0, 14.0, 30.0, 34.0, 47.0, 86.0, 130.0, 201.0, 317.0, 584.0, 1162.0, 2741.0, 9951.0, 70775.0, 3984229.0, 105639.0, 12277.0, 3235.0, 1231.0, 607.0, 348.0, 195.0, 138.0, 80.0, 74.0, 40.0, 26.0, 14.0, 16.0, 8.0, 5.0, 2.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.546875, -18.751220703125, -17.95556640625, -17.159912109375, -16.3642578125, -15.568603515625, -14.77294921875, -13.977294921875, -13.181640625, -12.385986328125, -11.59033203125, -10.794677734375, -9.9990234375, -9.203369140625, -8.40771484375, -7.612060546875, -6.81640625, -6.020751953125, -5.22509765625, -4.429443359375, -3.6337890625, -2.838134765625, -2.04248046875, -1.246826171875, -0.451171875, 0.344482421875, 1.14013671875, 1.935791015625, 2.7314453125, 3.527099609375, 4.32275390625, 5.118408203125, 5.9140625, 6.709716796875, 7.50537109375, 8.301025390625, 9.0966796875, 9.892333984375, 10.68798828125, 11.483642578125, 12.279296875, 13.074951171875, 13.87060546875, 14.666259765625, 15.4619140625, 16.257568359375, 17.05322265625, 17.848876953125, 18.64453125, 19.440185546875, 20.23583984375, 21.031494140625, 21.8271484375, 22.622802734375, 23.41845703125, 24.214111328125, 25.009765625, 25.805419921875, 26.60107421875, 27.396728515625, 28.1923828125, 28.988037109375, 29.78369140625, 30.579345703125, 31.375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 10.0, 13.0, 21.0, 19.0, 20.0, 40.0, 27.0, 41.0, 33.0, 48.0, 49.0, 53.0, 80.0, 62.0, 66.0, 68.0, 59.0, 48.0, 56.0, 31.0, 31.0, 23.0, 17.0, 26.0, 18.0, 10.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.425506591796875, -3.29046630859375, -3.155426025390625, -3.0203857421875, -2.885345458984375, -2.75030517578125, -2.615264892578125, -2.480224609375, -2.345184326171875, -2.21014404296875, -2.075103759765625, -1.9400634765625, -1.805023193359375, -1.66998291015625, -1.534942626953125, -1.39990234375, -1.264862060546875, -1.12982177734375, -0.994781494140625, -0.8597412109375, -0.724700927734375, -0.58966064453125, -0.454620361328125, -0.319580078125, -0.184539794921875, -0.04949951171875, 0.085540771484375, 0.2205810546875, 0.355621337890625, 0.49066162109375, 0.625701904296875, 0.7607421875, 0.895782470703125, 1.03082275390625, 1.165863037109375, 1.3009033203125, 1.435943603515625, 1.57098388671875, 1.706024169921875, 1.841064453125, 1.976104736328125, 2.11114501953125, 2.246185302734375, 2.3812255859375, 2.516265869140625, 2.65130615234375, 2.786346435546875, 2.92138671875, 3.056427001953125, 3.19146728515625, 3.326507568359375, 3.4615478515625, 3.596588134765625, 3.73162841796875, 3.866668701171875, 4.001708984375, 4.136749267578125, 4.27178955078125, 4.406829833984375, 4.5418701171875, 4.676910400390625, 4.81195068359375, 4.946990966796875, 5.08203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 8.0, 10.0, 22.0, 22.0, 58.0, 87.0, 138.0, 274.0, 561.0, 1185.0, 2870.0, 9100.0, 40450.0, 616122.0, 3436778.0, 67298.0, 12542.0, 3860.0, 1448.0, 678.0, 343.0, 192.0, 98.0, 49.0, 36.0, 19.0, 14.0, 6.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.734375, -21.11572265625, -20.4970703125, -19.87841796875, -19.259765625, -18.64111328125, -18.0224609375, -17.40380859375, -16.78515625, -16.16650390625, -15.5478515625, -14.92919921875, -14.310546875, -13.69189453125, -13.0732421875, -12.45458984375, -11.8359375, -11.21728515625, -10.5986328125, -9.97998046875, -9.361328125, -8.74267578125, -8.1240234375, -7.50537109375, -6.88671875, -6.26806640625, -5.6494140625, -5.03076171875, -4.412109375, -3.79345703125, -3.1748046875, -2.55615234375, -1.9375, -1.31884765625, -0.7001953125, -0.08154296875, 0.537109375, 1.15576171875, 1.7744140625, 2.39306640625, 3.01171875, 3.63037109375, 4.2490234375, 4.86767578125, 5.486328125, 6.10498046875, 6.7236328125, 7.34228515625, 7.9609375, 8.57958984375, 9.1982421875, 9.81689453125, 10.435546875, 11.05419921875, 11.6728515625, 12.29150390625, 12.91015625, 13.52880859375, 14.1474609375, 14.76611328125, 15.384765625, 16.00341796875, 16.6220703125, 17.24072265625, 17.859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 13.0, 18.0, 26.0, 42.0, 59.0, 119.0, 290.0, 2277.0, 776.0, 194.0, 92.0, 49.0, 31.0, 23.0, 17.0, 10.0, 10.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.078125, -12.7410888671875, -12.404052734375, -12.0670166015625, -11.72998046875, -11.3929443359375, -11.055908203125, -10.7188720703125, -10.3818359375, -10.0447998046875, -9.707763671875, -9.3707275390625, -9.03369140625, -8.6966552734375, -8.359619140625, -8.0225830078125, -7.685546875, -7.3485107421875, -7.011474609375, -6.6744384765625, -6.33740234375, -6.0003662109375, -5.663330078125, -5.3262939453125, -4.9892578125, -4.6522216796875, -4.315185546875, -3.9781494140625, -3.64111328125, -3.3040771484375, -2.967041015625, -2.6300048828125, -2.29296875, -1.9559326171875, -1.618896484375, -1.2818603515625, -0.94482421875, -0.6077880859375, -0.270751953125, 0.0662841796875, 0.4033203125, 0.7403564453125, 1.077392578125, 1.4144287109375, 1.75146484375, 2.0885009765625, 2.425537109375, 2.7625732421875, 3.099609375, 3.4366455078125, 3.773681640625, 4.1107177734375, 4.44775390625, 4.7847900390625, 5.121826171875, 5.4588623046875, 5.7958984375, 6.1329345703125, 6.469970703125, 6.8070068359375, 7.14404296875, 7.4810791015625, 7.818115234375, 8.1551513671875, 8.4921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 24.0, 64.0, 159.0, 239.0, 246.0, 133.0, 68.0, 29.0, 20.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.79466247558594, -68.25247955322266, -65.71029663085938, -63.16810989379883, -60.62592315673828, -58.083740234375, -55.54155731201172, -52.99937438964844, -50.45718765258789, -47.91500473022461, -45.37281799316406, -42.83063507080078, -40.2884521484375, -37.74626541137695, -35.20408248901367, -32.661895751953125, -30.119712829589844, -27.57752799987793, -25.035343170166016, -22.493160247802734, -19.95097541809082, -17.408790588378906, -14.866606712341309, -12.324422836303711, -9.782238006591797, -7.240053653717041, -4.697869300842285, -2.1556849479675293, 0.38649940490722656, 2.9286842346191406, 5.470868110656738, 8.013051986694336, 10.555229187011719, 13.097414016723633, 15.63959789276123, 18.181781768798828, 20.723966598510742, 23.266151428222656, 25.808334350585938, 28.35051918029785, 30.892704010009766, 33.43488693237305, 35.977073669433594, 38.519256591796875, 41.061439514160156, 43.6036262512207, 46.145809173583984, 48.68799591064453, 51.23017883300781, 53.772361755371094, 56.31454849243164, 58.85673141479492, 61.39891815185547, 63.94110107421875, 66.48328399658203, 69.02546691894531, 71.56765747070312, 74.1098403930664, 76.65202331542969, 79.1942138671875, 81.73639678955078, 84.27857971191406, 86.82076263427734, 89.36294555664062, 91.9051284790039]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 9.0, 13.0, 14.0, 19.0, 14.0, 26.0, 20.0, 27.0, 34.0, 40.0, 38.0, 39.0, 48.0, 54.0, 33.0, 43.0, 60.0, 47.0, 46.0, 44.0, 45.0, 42.0, 38.0, 33.0, 27.0, 19.0, 24.0, 18.0, 9.0, 12.0, 16.0, 5.0, 10.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-23.774707794189453, -22.93950080871582, -22.104293823242188, -21.269084930419922, -20.43387794494629, -19.598670959472656, -18.763463973999023, -17.92825698852539, -17.093050003051758, -16.257843017578125, -15.422635078430176, -14.587428092956543, -13.75222110748291, -12.917013168334961, -12.081806182861328, -11.246599197387695, -10.411391258239746, -9.576184272766113, -8.740976333618164, -7.905769348144531, -7.070562362670898, -6.235354900360107, -5.400147438049316, -4.564940452575684, -3.7297329902648926, -2.8945257663726807, -2.0593185424804688, -1.2241110801696777, -0.3889038562774658, 0.4463033676147461, 1.281510829925537, 2.11671781539917, 2.951925277709961, 3.787132501602173, 4.622339725494385, 5.457547187805176, 6.292754173278809, 7.1279616355896, 7.963169097900391, 8.798376083374023, 9.633583068847656, 10.468790054321289, 11.303997993469238, 12.139204978942871, 12.974411964416504, 13.809619903564453, 14.644826889038086, 15.480033874511719, 16.315242767333984, 17.150449752807617, 17.98565673828125, 18.820865631103516, 19.65607261657715, 20.49127960205078, 21.326486587524414, 22.161693572998047, 22.99690055847168, 23.832107543945312, 24.667314529418945, 25.502521514892578, 26.337730407714844, 27.172937393188477, 28.00814437866211, 28.843351364135742, 29.678558349609375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 18.0, 25.0, 44.0, 66.0, 107.0, 170.0, 258.0, 431.0, 680.0, 1281.0, 2470.0, 5155.0, 12159.0, 31342.0, 94671.0, 292989.0, 383402.0, 146120.0, 46266.0, 16824.0, 6938.0, 3263.0, 1647.0, 869.0, 495.0, 300.0, 197.0, 129.0, 71.0, 45.0, 29.0, 21.0, 18.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.40185546875, -8.0927734375, -7.78369140625, -7.474609375, -7.16552734375, -6.8564453125, -6.54736328125, -6.23828125, -5.92919921875, -5.6201171875, -5.31103515625, -5.001953125, -4.69287109375, -4.3837890625, -4.07470703125, -3.765625, -3.45654296875, -3.1474609375, -2.83837890625, -2.529296875, -2.22021484375, -1.9111328125, -1.60205078125, -1.29296875, -0.98388671875, -0.6748046875, -0.36572265625, -0.056640625, 0.25244140625, 0.5615234375, 0.87060546875, 1.1796875, 1.48876953125, 1.7978515625, 2.10693359375, 2.416015625, 2.72509765625, 3.0341796875, 3.34326171875, 3.65234375, 3.96142578125, 4.2705078125, 4.57958984375, 4.888671875, 5.19775390625, 5.5068359375, 5.81591796875, 6.125, 6.43408203125, 6.7431640625, 7.05224609375, 7.361328125, 7.67041015625, 7.9794921875, 8.28857421875, 8.59765625, 8.90673828125, 9.2158203125, 9.52490234375, 9.833984375, 10.14306640625, 10.4521484375, 10.76123046875, 11.0703125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 4.0, 12.0, 8.0, 20.0, 19.0, 21.0, 22.0, 26.0, 30.0, 35.0, 42.0, 54.0, 34.0, 41.0, 61.0, 56.0, 69.0, 63.0, 44.0, 48.0, 39.0, 42.0, 36.0, 31.0, 20.0, 29.0, 15.0, 21.0, 11.0, 11.0, 2.0, 6.0, 11.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.107513427734375, -2.98260498046875, -2.857696533203125, -2.7327880859375, -2.607879638671875, -2.48297119140625, -2.358062744140625, -2.233154296875, -2.108245849609375, -1.98333740234375, -1.858428955078125, -1.7335205078125, -1.608612060546875, -1.48370361328125, -1.358795166015625, -1.23388671875, -1.108978271484375, -0.98406982421875, -0.859161376953125, -0.7342529296875, -0.609344482421875, -0.48443603515625, -0.359527587890625, -0.234619140625, -0.109710693359375, 0.01519775390625, 0.140106201171875, 0.2650146484375, 0.389923095703125, 0.51483154296875, 0.639739990234375, 0.7646484375, 0.889556884765625, 1.01446533203125, 1.139373779296875, 1.2642822265625, 1.389190673828125, 1.51409912109375, 1.639007568359375, 1.763916015625, 1.888824462890625, 2.01373291015625, 2.138641357421875, 2.2635498046875, 2.388458251953125, 2.51336669921875, 2.638275146484375, 2.76318359375, 2.888092041015625, 3.01300048828125, 3.137908935546875, 3.2628173828125, 3.387725830078125, 3.51263427734375, 3.637542724609375, 3.762451171875, 3.887359619140625, 4.01226806640625, 4.137176513671875, 4.2620849609375, 4.386993408203125, 4.51190185546875, 4.636810302734375, 4.76171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 5.0, 8.0, 8.0, 8.0, 18.0, 17.0, 32.0, 49.0, 82.0, 160.0, 298.0, 638.0, 1364.0, 3659.0, 11269.0, 47120.0, 295498.0, 561518.0, 97285.0, 19964.0, 5780.0, 2049.0, 832.0, 407.0, 182.0, 102.0, 63.0, 37.0, 31.0, 16.0, 11.0, 15.0, 4.0, 9.0, 5.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.21875, -15.66357421875, -15.1083984375, -14.55322265625, -13.998046875, -13.44287109375, -12.8876953125, -12.33251953125, -11.77734375, -11.22216796875, -10.6669921875, -10.11181640625, -9.556640625, -9.00146484375, -8.4462890625, -7.89111328125, -7.3359375, -6.78076171875, -6.2255859375, -5.67041015625, -5.115234375, -4.56005859375, -4.0048828125, -3.44970703125, -2.89453125, -2.33935546875, -1.7841796875, -1.22900390625, -0.673828125, -0.11865234375, 0.4365234375, 0.99169921875, 1.546875, 2.10205078125, 2.6572265625, 3.21240234375, 3.767578125, 4.32275390625, 4.8779296875, 5.43310546875, 5.98828125, 6.54345703125, 7.0986328125, 7.65380859375, 8.208984375, 8.76416015625, 9.3193359375, 9.87451171875, 10.4296875, 10.98486328125, 11.5400390625, 12.09521484375, 12.650390625, 13.20556640625, 13.7607421875, 14.31591796875, 14.87109375, 15.42626953125, 15.9814453125, 16.53662109375, 17.091796875, 17.64697265625, 18.2021484375, 18.75732421875, 19.3125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 10.0, 5.0, 7.0, 8.0, 9.0, 22.0, 17.0, 18.0, 24.0, 28.0, 25.0, 32.0, 49.0, 44.0, 47.0, 60.0, 51.0, 56.0, 51.0, 83.0, 61.0, 36.0, 35.0, 37.0, 30.0, 39.0, 16.0, 22.0, 18.0, 15.0, 10.0, 12.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.171875, -24.321044921875, -23.47021484375, -22.619384765625, -21.7685546875, -20.917724609375, -20.06689453125, -19.216064453125, -18.365234375, -17.514404296875, -16.66357421875, -15.812744140625, -14.9619140625, -14.111083984375, -13.26025390625, -12.409423828125, -11.55859375, -10.707763671875, -9.85693359375, -9.006103515625, -8.1552734375, -7.304443359375, -6.45361328125, -5.602783203125, -4.751953125, -3.901123046875, -3.05029296875, -2.199462890625, -1.3486328125, -0.497802734375, 0.35302734375, 1.203857421875, 2.0546875, 2.905517578125, 3.75634765625, 4.607177734375, 5.4580078125, 6.308837890625, 7.15966796875, 8.010498046875, 8.861328125, 9.712158203125, 10.56298828125, 11.413818359375, 12.2646484375, 13.115478515625, 13.96630859375, 14.817138671875, 15.66796875, 16.518798828125, 17.36962890625, 18.220458984375, 19.0712890625, 19.922119140625, 20.77294921875, 21.623779296875, 22.474609375, 23.325439453125, 24.17626953125, 25.027099609375, 25.8779296875, 26.728759765625, 27.57958984375, 28.430419921875, 29.28125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 6.0, 19.0, 11.0, 23.0, 29.0, 76.0, 88.0, 193.0, 386.0, 1062.0, 3287.0, 19247.0, 349832.0, 633895.0, 33478.0, 4621.0, 1287.0, 478.0, 235.0, 121.0, 56.0, 34.0, 26.0, 21.0, 9.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.866943359375, -11.44482421875, -11.022705078125, -10.6005859375, -10.178466796875, -9.75634765625, -9.334228515625, -8.912109375, -8.489990234375, -8.06787109375, -7.645751953125, -7.2236328125, -6.801513671875, -6.37939453125, -5.957275390625, -5.53515625, -5.113037109375, -4.69091796875, -4.268798828125, -3.8466796875, -3.424560546875, -3.00244140625, -2.580322265625, -2.158203125, -1.736083984375, -1.31396484375, -0.891845703125, -0.4697265625, -0.047607421875, 0.37451171875, 0.796630859375, 1.21875, 1.640869140625, 2.06298828125, 2.485107421875, 2.9072265625, 3.329345703125, 3.75146484375, 4.173583984375, 4.595703125, 5.017822265625, 5.43994140625, 5.862060546875, 6.2841796875, 6.706298828125, 7.12841796875, 7.550537109375, 7.97265625, 8.394775390625, 8.81689453125, 9.239013671875, 9.6611328125, 10.083251953125, 10.50537109375, 10.927490234375, 11.349609375, 11.771728515625, 12.19384765625, 12.615966796875, 13.0380859375, 13.460205078125, 13.88232421875, 14.304443359375, 14.7265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 2.0, 10.0, 11.0, 16.0, 21.0, 48.0, 51.0, 84.0, 119.0, 140.0, 125.0, 110.0, 75.0, 60.0, 37.0, 32.0, 19.0, 9.0, 7.0, 2.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010900497436523438, -0.0010421723127365112, -0.0009942948818206787, -0.0009464174509048462, -0.0008985400199890137, -0.0008506625890731812, -0.0008027851581573486, -0.0007549077272415161, -0.0007070302963256836, -0.0006591528654098511, -0.0006112754344940186, -0.000563398003578186, -0.0005155205726623535, -0.000467643141746521, -0.0004197657108306885, -0.00037188827991485596, -0.00032401084899902344, -0.0002761334180831909, -0.0002282559871673584, -0.00018037855625152588, -0.00013250112533569336, -8.462369441986084e-05, -3.674626350402832e-05, 1.11311674118042e-05, 5.900859832763672e-05, 0.00010688602924346924, 0.00015476346015930176, 0.00020264089107513428, 0.0002505183219909668, 0.0002983957529067993, 0.00034627318382263184, 0.00039415061473846436, 0.0004420280456542969, 0.0004899054765701294, 0.0005377829074859619, 0.0005856603384017944, 0.000633537769317627, 0.0006814152002334595, 0.000729292631149292, 0.0007771700620651245, 0.000825047492980957, 0.0008729249238967896, 0.0009208023548126221, 0.0009686797857284546, 0.0010165572166442871, 0.0010644346475601196, 0.0011123120784759521, 0.0011601895093917847, 0.0012080669403076172, 0.0012559443712234497, 0.0013038218021392822, 0.0013516992330551147, 0.0013995766639709473, 0.0014474540948867798, 0.0014953315258026123, 0.0015432089567184448, 0.0015910863876342773, 0.0016389638185501099, 0.0016868412494659424, 0.001734718680381775, 0.0017825961112976074, 0.00183047354221344, 0.0018783509731292725, 0.001926228404045105, 0.0019741058349609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 10.0, 16.0, 37.0, 35.0, 62.0, 117.0, 234.0, 456.0, 971.0, 2649.0, 8756.0, 42813.0, 291677.0, 575172.0, 100742.0, 17616.0, 4367.0, 1514.0, 626.0, 284.0, 139.0, 94.0, 58.0, 41.0, 23.0, 20.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9705810546875, -8.683349609375, -8.3961181640625, -8.10888671875, -7.8216552734375, -7.534423828125, -7.2471923828125, -6.9599609375, -6.6727294921875, -6.385498046875, -6.0982666015625, -5.81103515625, -5.5238037109375, -5.236572265625, -4.9493408203125, -4.662109375, -4.3748779296875, -4.087646484375, -3.8004150390625, -3.51318359375, -3.2259521484375, -2.938720703125, -2.6514892578125, -2.3642578125, -2.0770263671875, -1.789794921875, -1.5025634765625, -1.21533203125, -0.9281005859375, -0.640869140625, -0.3536376953125, -0.06640625, 0.2208251953125, 0.508056640625, 0.7952880859375, 1.08251953125, 1.3697509765625, 1.656982421875, 1.9442138671875, 2.2314453125, 2.5186767578125, 2.805908203125, 3.0931396484375, 3.38037109375, 3.6676025390625, 3.954833984375, 4.2420654296875, 4.529296875, 4.8165283203125, 5.103759765625, 5.3909912109375, 5.67822265625, 5.9654541015625, 6.252685546875, 6.5399169921875, 6.8271484375, 7.1143798828125, 7.401611328125, 7.6888427734375, 7.97607421875, 8.2633056640625, 8.550537109375, 8.8377685546875, 9.125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 7.0, 4.0, 9.0, 11.0, 18.0, 16.0, 24.0, 35.0, 45.0, 60.0, 96.0, 101.0, 109.0, 127.0, 84.0, 75.0, 49.0, 39.0, 27.0, 23.0, 16.0, 13.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.579833984375, -12.18310546875, -11.786376953125, -11.3896484375, -10.992919921875, -10.59619140625, -10.199462890625, -9.802734375, -9.406005859375, -9.00927734375, -8.612548828125, -8.2158203125, -7.819091796875, -7.42236328125, -7.025634765625, -6.62890625, -6.232177734375, -5.83544921875, -5.438720703125, -5.0419921875, -4.645263671875, -4.24853515625, -3.851806640625, -3.455078125, -3.058349609375, -2.66162109375, -2.264892578125, -1.8681640625, -1.471435546875, -1.07470703125, -0.677978515625, -0.28125, 0.115478515625, 0.51220703125, 0.908935546875, 1.3056640625, 1.702392578125, 2.09912109375, 2.495849609375, 2.892578125, 3.289306640625, 3.68603515625, 4.082763671875, 4.4794921875, 4.876220703125, 5.27294921875, 5.669677734375, 6.06640625, 6.463134765625, 6.85986328125, 7.256591796875, 7.6533203125, 8.050048828125, 8.44677734375, 8.843505859375, 9.240234375, 9.636962890625, 10.03369140625, 10.430419921875, 10.8271484375, 11.223876953125, 11.62060546875, 12.017333984375, 12.4140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 13.0, 62.0, 168.0, 283.0, 267.0, 136.0, 52.0, 15.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-411.8455810546875, -403.589111328125, -395.3326416015625, -387.076171875, -378.8197021484375, -370.563232421875, -362.3067626953125, -354.05029296875, -345.7938232421875, -337.537353515625, -329.2808837890625, -321.0244140625, -312.7679443359375, -304.511474609375, -296.2550048828125, -287.99853515625, -279.7420349121094, -271.4855651855469, -263.2290954589844, -254.97262573242188, -246.71615600585938, -238.45968627929688, -230.2032012939453, -221.9467315673828, -213.6902618408203, -205.4337921142578, -197.1773223876953, -188.9208526611328, -180.66436767578125, -172.40789794921875, -164.15142822265625, -155.89495849609375, -147.63851928710938, -139.38204956054688, -131.12557983398438, -122.86910247802734, -114.61263275146484, -106.35616302490234, -98.09968566894531, -89.84321594238281, -81.58674621582031, -73.33027648925781, -65.07380676269531, -56.81732940673828, -48.56085968017578, -40.30438995361328, -32.047916412353516, -23.79144287109375, -15.53497314453125, -7.278501510620117, 0.9779701232910156, 9.234441757202148, 17.49091339111328, 25.74738311767578, 34.00385665893555, 42.26033020019531, 50.51679992675781, 58.77326965332031, 67.02973937988281, 75.28621673583984, 83.54268646240234, 91.79915618896484, 100.05563354492188, 108.31210327148438, 116.56857299804688]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 9.0, 9.0, 17.0, 21.0, 14.0, 16.0, 21.0, 25.0, 25.0, 32.0, 33.0, 42.0, 39.0, 47.0, 38.0, 50.0, 48.0, 52.0, 43.0, 38.0, 42.0, 44.0, 43.0, 31.0, 35.0, 28.0, 19.0, 27.0, 19.0, 16.0, 14.0, 8.0, 9.0, 10.0, 3.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-120.56280517578125, -116.78648376464844, -113.01016998291016, -109.23384857177734, -105.45753479003906, -101.68121337890625, -97.90489196777344, -94.12857818603516, -90.35226440429688, -86.57594299316406, -82.79962921142578, -79.02330780029297, -75.24699401855469, -71.47067260742188, -67.69435119628906, -63.91803741455078, -60.14171600341797, -56.36539840698242, -52.589080810546875, -48.81275939941406, -45.03644561767578, -41.26012420654297, -37.48380661010742, -33.707489013671875, -29.931171417236328, -26.15485382080078, -22.378536224365234, -18.602216720581055, -14.825899124145508, -11.049581527709961, -7.273262023925781, -3.4969444274902344, 0.27938079833984375, 4.055698871612549, 7.832016944885254, 11.608335494995117, 15.384653091430664, 19.16097068786621, 22.93729019165039, 26.713607788085938, 30.489925384521484, 34.26624298095703, 38.04256057739258, 41.818878173828125, 45.59519958496094, 49.37151336669922, 53.14783477783203, 56.92415237426758, 60.700469970703125, 64.47679138183594, 68.25310516357422, 72.02942657470703, 75.80574035644531, 79.58206176757812, 83.35838317871094, 87.13469696044922, 90.9110107421875, 94.68733215332031, 98.4636459350586, 102.2399673461914, 106.01628112792969, 109.7926025390625, 113.56892395019531, 117.3452377319336, 121.1215591430664]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 9.0, 8.0, 5.0, 10.0, 18.0, 30.0, 27.0, 54.0, 62.0, 83.0, 138.0, 193.0, 333.0, 579.0, 1010.0, 2132.0, 5747.0, 24085.0, 3901866.0, 233662.0, 15801.0, 4360.0, 1799.0, 878.0, 491.0, 304.0, 181.0, 119.0, 93.0, 66.0, 32.0, 28.0, 19.0, 16.0, 17.0, 4.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.046875, -15.47119140625, -14.8955078125, -14.31982421875, -13.744140625, -13.16845703125, -12.5927734375, -12.01708984375, -11.44140625, -10.86572265625, -10.2900390625, -9.71435546875, -9.138671875, -8.56298828125, -7.9873046875, -7.41162109375, -6.8359375, -6.26025390625, -5.6845703125, -5.10888671875, -4.533203125, -3.95751953125, -3.3818359375, -2.80615234375, -2.23046875, -1.65478515625, -1.0791015625, -0.50341796875, 0.072265625, 0.64794921875, 1.2236328125, 1.79931640625, 2.375, 2.95068359375, 3.5263671875, 4.10205078125, 4.677734375, 5.25341796875, 5.8291015625, 6.40478515625, 6.98046875, 7.55615234375, 8.1318359375, 8.70751953125, 9.283203125, 9.85888671875, 10.4345703125, 11.01025390625, 11.5859375, 12.16162109375, 12.7373046875, 13.31298828125, 13.888671875, 14.46435546875, 15.0400390625, 15.61572265625, 16.19140625, 16.76708984375, 17.3427734375, 17.91845703125, 18.494140625, 19.06982421875, 19.6455078125, 20.22119140625, 20.796875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 8.0, 7.0, 14.0, 19.0, 21.0, 41.0, 37.0, 44.0, 45.0, 44.0, 68.0, 63.0, 84.0, 68.0, 72.0, 77.0, 43.0, 48.0, 51.0, 30.0, 28.0, 16.0, 17.0, 11.0, 8.0, 7.0, 10.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.07952880859375, -4.8660888671875, -4.65264892578125, -4.439208984375, -4.22576904296875, -4.0123291015625, -3.79888916015625, -3.58544921875, -3.37200927734375, -3.1585693359375, -2.94512939453125, -2.731689453125, -2.51824951171875, -2.3048095703125, -2.09136962890625, -1.8779296875, -1.66448974609375, -1.4510498046875, -1.23760986328125, -1.024169921875, -0.81072998046875, -0.5972900390625, -0.38385009765625, -0.17041015625, 0.04302978515625, 0.2564697265625, 0.46990966796875, 0.683349609375, 0.89678955078125, 1.1102294921875, 1.32366943359375, 1.537109375, 1.75054931640625, 1.9639892578125, 2.17742919921875, 2.390869140625, 2.60430908203125, 2.8177490234375, 3.03118896484375, 3.24462890625, 3.45806884765625, 3.6715087890625, 3.88494873046875, 4.098388671875, 4.31182861328125, 4.5252685546875, 4.73870849609375, 4.9521484375, 5.16558837890625, 5.3790283203125, 5.59246826171875, 5.805908203125, 6.01934814453125, 6.2327880859375, 6.44622802734375, 6.65966796875, 6.87310791015625, 7.0865478515625, 7.29998779296875, 7.513427734375, 7.72686767578125, 7.9403076171875, 8.15374755859375, 8.3671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 7.0, 11.0, 20.0, 27.0, 28.0, 55.0, 55.0, 78.0, 134.0, 179.0, 257.0, 367.0, 627.0, 961.0, 1449.0, 2447.0, 4113.0, 8271.0, 19687.0, 87157.0, 3879941.0, 141732.0, 25287.0, 9668.0, 4588.0, 2673.0, 1611.0, 937.0, 680.0, 377.0, 246.0, 163.0, 124.0, 90.0, 59.0, 44.0, 36.0, 22.0, 23.0, 16.0, 7.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.375, -12.9378662109375, -12.500732421875, -12.0635986328125, -11.62646484375, -11.1893310546875, -10.752197265625, -10.3150634765625, -9.8779296875, -9.4407958984375, -9.003662109375, -8.5665283203125, -8.12939453125, -7.6922607421875, -7.255126953125, -6.8179931640625, -6.380859375, -5.9437255859375, -5.506591796875, -5.0694580078125, -4.63232421875, -4.1951904296875, -3.758056640625, -3.3209228515625, -2.8837890625, -2.4466552734375, -2.009521484375, -1.5723876953125, -1.13525390625, -0.6981201171875, -0.260986328125, 0.1761474609375, 0.61328125, 1.0504150390625, 1.487548828125, 1.9246826171875, 2.36181640625, 2.7989501953125, 3.236083984375, 3.6732177734375, 4.1103515625, 4.5474853515625, 4.984619140625, 5.4217529296875, 5.85888671875, 6.2960205078125, 6.733154296875, 7.1702880859375, 7.607421875, 8.0445556640625, 8.481689453125, 8.9188232421875, 9.35595703125, 9.7930908203125, 10.230224609375, 10.6673583984375, 11.1044921875, 11.5416259765625, 11.978759765625, 12.4158935546875, 12.85302734375, 13.2901611328125, 13.727294921875, 14.1644287109375, 14.6015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 6.0, 11.0, 14.0, 31.0, 104.0, 3213.0, 501.0, 81.0, 33.0, 25.0, 12.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.02734375, -6.831298828125, -6.63525390625, -6.439208984375, -6.2431640625, -6.047119140625, -5.85107421875, -5.655029296875, -5.458984375, -5.262939453125, -5.06689453125, -4.870849609375, -4.6748046875, -4.478759765625, -4.28271484375, -4.086669921875, -3.890625, -3.694580078125, -3.49853515625, -3.302490234375, -3.1064453125, -2.910400390625, -2.71435546875, -2.518310546875, -2.322265625, -2.126220703125, -1.93017578125, -1.734130859375, -1.5380859375, -1.342041015625, -1.14599609375, -0.949951171875, -0.75390625, -0.557861328125, -0.36181640625, -0.165771484375, 0.0302734375, 0.226318359375, 0.42236328125, 0.618408203125, 0.814453125, 1.010498046875, 1.20654296875, 1.402587890625, 1.5986328125, 1.794677734375, 1.99072265625, 2.186767578125, 2.3828125, 2.578857421875, 2.77490234375, 2.970947265625, 3.1669921875, 3.363037109375, 3.55908203125, 3.755126953125, 3.951171875, 4.147216796875, 4.34326171875, 4.539306640625, 4.7353515625, 4.931396484375, 5.12744140625, 5.323486328125, 5.51953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 5.0, 12.0, 20.0, 27.0, 51.0, 86.0, 154.0, 181.0, 177.0, 129.0, 68.0, 38.0, 20.0, 15.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.427258491516113, -10.73616886138916, -10.045079231262207, -9.353989601135254, -8.6628999710083, -7.971810340881348, -7.280721187591553, -6.5896315574646, -5.8985419273376465, -5.207452297210693, -4.51636266708374, -3.825273275375366, -3.134183645248413, -2.44309401512146, -1.752004623413086, -1.0609149932861328, -0.3698253631591797, 0.32126420736312866, 1.012353777885437, 1.7034432888031006, 2.3945329189300537, 3.085622549057007, 3.776711940765381, 4.467801570892334, 5.158891201019287, 5.84998083114624, 6.541070461273193, 7.232159614562988, 7.923249244689941, 8.614338874816895, 9.305428504943848, 9.9965181350708, 10.68760871887207, 11.378698348999023, 12.069787979125977, 12.76087760925293, 13.451967239379883, 14.143056869506836, 14.834146499633789, 15.525236129760742, 16.216325759887695, 16.90741539001465, 17.5985050201416, 18.289594650268555, 18.980684280395508, 19.67177391052246, 20.362863540649414, 21.053953170776367, 21.745040893554688, 22.43613052368164, 23.127220153808594, 23.818309783935547, 24.5093994140625, 25.200489044189453, 25.891578674316406, 26.58266830444336, 27.273757934570312, 27.964847564697266, 28.65593719482422, 29.347026824951172, 30.038116455078125, 30.729206085205078, 31.42029571533203, 32.111385345458984, 32.80247497558594]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 10.0, 5.0, 5.0, 14.0, 14.0, 17.0, 15.0, 21.0, 21.0, 22.0, 24.0, 24.0, 26.0, 29.0, 31.0, 39.0, 33.0, 53.0, 31.0, 44.0, 37.0, 33.0, 28.0, 40.0, 49.0, 36.0, 37.0, 27.0, 33.0, 26.0, 19.0, 21.0, 22.0, 17.0, 9.0, 17.0, 14.0, 11.0, 8.0, 5.0, 7.0, 3.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.024789810180664, -7.766061782836914, -7.507333755493164, -7.248605728149414, -6.989877700805664, -6.731149673461914, -6.472421646118164, -6.213693618774414, -5.954965591430664, -5.696237564086914, -5.437509536743164, -5.178781509399414, -4.920053482055664, -4.661325454711914, -4.402597427368164, -4.143869400024414, -3.885141372680664, -3.626413345336914, -3.367685317993164, -3.108957290649414, -2.850229263305664, -2.591501235961914, -2.332773208618164, -2.074045181274414, -1.815317153930664, -1.556589126586914, -1.297861099243164, -1.039133071899414, -0.7804050445556641, -0.5216770172119141, -0.26294898986816406, -0.0042209625244140625, 0.25450801849365234, 0.5132360458374023, 0.7719640731811523, 1.0306921005249023, 1.2894201278686523, 1.5481481552124023, 1.8068761825561523, 2.0656042098999023, 2.3243322372436523, 2.5830602645874023, 2.8417882919311523, 3.1005163192749023, 3.3592443466186523, 3.6179723739624023, 3.8767004013061523, 4.135428428649902, 4.394156455993652, 4.652884483337402, 4.911612510681152, 5.170340538024902, 5.429068565368652, 5.687796592712402, 5.946524620056152, 6.205252647399902, 6.463980674743652, 6.722708702087402, 6.981436729431152, 7.240164756774902, 7.498892784118652, 7.757620811462402, 8.016348838806152, 8.275076866149902, 8.533804893493652]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 9.0, 8.0, 13.0, 27.0, 33.0, 35.0, 71.0, 129.0, 225.0, 426.0, 844.0, 1740.0, 3913.0, 9854.0, 26797.0, 83816.0, 261960.0, 400992.0, 173231.0, 53821.0, 18033.0, 6821.0, 2895.0, 1389.0, 689.0, 341.0, 172.0, 103.0, 58.0, 40.0, 20.0, 15.0, 11.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.541259765625, -9.19189453125, -8.842529296875, -8.4931640625, -8.143798828125, -7.79443359375, -7.445068359375, -7.095703125, -6.746337890625, -6.39697265625, -6.047607421875, -5.6982421875, -5.348876953125, -4.99951171875, -4.650146484375, -4.30078125, -3.951416015625, -3.60205078125, -3.252685546875, -2.9033203125, -2.553955078125, -2.20458984375, -1.855224609375, -1.505859375, -1.156494140625, -0.80712890625, -0.457763671875, -0.1083984375, 0.240966796875, 0.59033203125, 0.939697265625, 1.2890625, 1.638427734375, 1.98779296875, 2.337158203125, 2.6865234375, 3.035888671875, 3.38525390625, 3.734619140625, 4.083984375, 4.433349609375, 4.78271484375, 5.132080078125, 5.4814453125, 5.830810546875, 6.18017578125, 6.529541015625, 6.87890625, 7.228271484375, 7.57763671875, 7.927001953125, 8.2763671875, 8.625732421875, 8.97509765625, 9.324462890625, 9.673828125, 10.023193359375, 10.37255859375, 10.721923828125, 11.0712890625, 11.420654296875, 11.77001953125, 12.119384765625, 12.46875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 10.0, 4.0, 12.0, 6.0, 12.0, 18.0, 23.0, 29.0, 48.0, 35.0, 39.0, 47.0, 50.0, 58.0, 56.0, 54.0, 59.0, 63.0, 67.0, 45.0, 49.0, 50.0, 27.0, 31.0, 23.0, 21.0, 12.0, 11.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.60528564453125, -4.4176025390625, -4.22991943359375, -4.042236328125, -3.85455322265625, -3.6668701171875, -3.47918701171875, -3.29150390625, -3.10382080078125, -2.9161376953125, -2.72845458984375, -2.540771484375, -2.35308837890625, -2.1654052734375, -1.97772216796875, -1.7900390625, -1.60235595703125, -1.4146728515625, -1.22698974609375, -1.039306640625, -0.85162353515625, -0.6639404296875, -0.47625732421875, -0.28857421875, -0.10089111328125, 0.0867919921875, 0.27447509765625, 0.462158203125, 0.64984130859375, 0.8375244140625, 1.02520751953125, 1.212890625, 1.40057373046875, 1.5882568359375, 1.77593994140625, 1.963623046875, 2.15130615234375, 2.3389892578125, 2.52667236328125, 2.71435546875, 2.90203857421875, 3.0897216796875, 3.27740478515625, 3.465087890625, 3.65277099609375, 3.8404541015625, 4.02813720703125, 4.2158203125, 4.40350341796875, 4.5911865234375, 4.77886962890625, 4.966552734375, 5.15423583984375, 5.3419189453125, 5.52960205078125, 5.71728515625, 5.90496826171875, 6.0926513671875, 6.28033447265625, 6.468017578125, 6.65570068359375, 6.8433837890625, 7.03106689453125, 7.21875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 16.0, 17.0, 38.0, 47.0, 75.0, 136.0, 281.0, 574.0, 1391.0, 3976.0, 13138.0, 61301.0, 438157.0, 446490.0, 62896.0, 13399.0, 3892.0, 1467.0, 601.0, 291.0, 148.0, 82.0, 54.0, 17.0, 17.0, 14.0, 17.0, 5.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.248291015625, -19.65283203125, -19.057373046875, -18.4619140625, -17.866455078125, -17.27099609375, -16.675537109375, -16.080078125, -15.484619140625, -14.88916015625, -14.293701171875, -13.6982421875, -13.102783203125, -12.50732421875, -11.911865234375, -11.31640625, -10.720947265625, -10.12548828125, -9.530029296875, -8.9345703125, -8.339111328125, -7.74365234375, -7.148193359375, -6.552734375, -5.957275390625, -5.36181640625, -4.766357421875, -4.1708984375, -3.575439453125, -2.97998046875, -2.384521484375, -1.7890625, -1.193603515625, -0.59814453125, -0.002685546875, 0.5927734375, 1.188232421875, 1.78369140625, 2.379150390625, 2.974609375, 3.570068359375, 4.16552734375, 4.760986328125, 5.3564453125, 5.951904296875, 6.54736328125, 7.142822265625, 7.73828125, 8.333740234375, 8.92919921875, 9.524658203125, 10.1201171875, 10.715576171875, 11.31103515625, 11.906494140625, 12.501953125, 13.097412109375, 13.69287109375, 14.288330078125, 14.8837890625, 15.479248046875, 16.07470703125, 16.670166015625, 17.265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 4.0, 8.0, 9.0, 5.0, 19.0, 15.0, 24.0, 17.0, 33.0, 31.0, 28.0, 41.0, 51.0, 48.0, 53.0, 67.0, 29.0, 55.0, 47.0, 55.0, 41.0, 36.0, 51.0, 33.0, 39.0, 22.0, 24.0, 19.0, 16.0, 18.0, 13.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.46875, -29.512939453125, -28.55712890625, -27.601318359375, -26.6455078125, -25.689697265625, -24.73388671875, -23.778076171875, -22.822265625, -21.866455078125, -20.91064453125, -19.954833984375, -18.9990234375, -18.043212890625, -17.08740234375, -16.131591796875, -15.17578125, -14.219970703125, -13.26416015625, -12.308349609375, -11.3525390625, -10.396728515625, -9.44091796875, -8.485107421875, -7.529296875, -6.573486328125, -5.61767578125, -4.661865234375, -3.7060546875, -2.750244140625, -1.79443359375, -0.838623046875, 0.1171875, 1.072998046875, 2.02880859375, 2.984619140625, 3.9404296875, 4.896240234375, 5.85205078125, 6.807861328125, 7.763671875, 8.719482421875, 9.67529296875, 10.631103515625, 11.5869140625, 12.542724609375, 13.49853515625, 14.454345703125, 15.41015625, 16.365966796875, 17.32177734375, 18.277587890625, 19.2333984375, 20.189208984375, 21.14501953125, 22.100830078125, 23.056640625, 24.012451171875, 24.96826171875, 25.924072265625, 26.8798828125, 27.835693359375, 28.79150390625, 29.747314453125, 30.703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 5.0, 11.0, 10.0, 29.0, 46.0, 59.0, 107.0, 217.0, 446.0, 1106.0, 3069.0, 14161.0, 126259.0, 712414.0, 167122.0, 17671.0, 3617.0, 1132.0, 512.0, 232.0, 134.0, 71.0, 42.0, 24.0, 17.0, 12.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.11328125, -6.86419677734375, -6.6151123046875, -6.36602783203125, -6.116943359375, -5.86785888671875, -5.6187744140625, -5.36968994140625, -5.12060546875, -4.87152099609375, -4.6224365234375, -4.37335205078125, -4.124267578125, -3.87518310546875, -3.6260986328125, -3.37701416015625, -3.1279296875, -2.87884521484375, -2.6297607421875, -2.38067626953125, -2.131591796875, -1.88250732421875, -1.6334228515625, -1.38433837890625, -1.13525390625, -0.88616943359375, -0.6370849609375, -0.38800048828125, -0.138916015625, 0.11016845703125, 0.3592529296875, 0.60833740234375, 0.857421875, 1.10650634765625, 1.3555908203125, 1.60467529296875, 1.853759765625, 2.10284423828125, 2.3519287109375, 2.60101318359375, 2.85009765625, 3.09918212890625, 3.3482666015625, 3.59735107421875, 3.846435546875, 4.09552001953125, 4.3446044921875, 4.59368896484375, 4.8427734375, 5.09185791015625, 5.3409423828125, 5.59002685546875, 5.839111328125, 6.08819580078125, 6.3372802734375, 6.58636474609375, 6.83544921875, 7.08453369140625, 7.3336181640625, 7.58270263671875, 7.831787109375, 8.08087158203125, 8.3299560546875, 8.57904052734375, 8.828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 2.0, 9.0, 9.0, 11.0, 20.0, 20.0, 25.0, 32.0, 24.0, 54.0, 49.0, 74.0, 60.0, 69.0, 74.0, 70.0, 72.0, 59.0, 51.0, 35.0, 35.0, 41.0, 28.0, 16.0, 17.0, 8.0, 10.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007123947143554688, -0.0006897896528244019, -0.000667184591293335, -0.0006445795297622681, -0.0006219744682312012, -0.0005993694067001343, -0.0005767643451690674, -0.0005541592836380005, -0.0005315542221069336, -0.0005089491605758667, -0.0004863440990447998, -0.0004637390375137329, -0.000441133975982666, -0.0004185289144515991, -0.0003959238529205322, -0.00037331879138946533, -0.00035071372985839844, -0.00032810866832733154, -0.00030550360679626465, -0.00028289854526519775, -0.00026029348373413086, -0.00023768842220306396, -0.00021508336067199707, -0.00019247829914093018, -0.00016987323760986328, -0.0001472681760787964, -0.0001246631145477295, -0.0001020580530166626, -7.94529914855957e-05, -5.684792995452881e-05, -3.4242868423461914e-05, -1.163780689239502e-05, 1.0967254638671875e-05, 3.357231616973877e-05, 5.6177377700805664e-05, 7.878243923187256e-05, 0.00010138750076293945, 0.00012399256229400635, 0.00014659762382507324, 0.00016920268535614014, 0.00019180774688720703, 0.00021441280841827393, 0.00023701786994934082, 0.0002596229314804077, 0.0002822279930114746, 0.0003048330545425415, 0.0003274381160736084, 0.0003500431776046753, 0.0003726482391357422, 0.0003952533006668091, 0.000417858362197876, 0.00044046342372894287, 0.00046306848526000977, 0.00048567354679107666, 0.0005082786083221436, 0.0005308836698532104, 0.0005534887313842773, 0.0005760937929153442, 0.0005986988544464111, 0.000621303915977478, 0.0006439089775085449, 0.0006665140390396118, 0.0006891191005706787, 0.0007117241621017456, 0.0007343292236328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 11.0, 19.0, 19.0, 21.0, 45.0, 80.0, 135.0, 246.0, 480.0, 1020.0, 2300.0, 7290.0, 33893.0, 239688.0, 613818.0, 122121.0, 19326.0, 4651.0, 1730.0, 724.0, 399.0, 195.0, 131.0, 55.0, 42.0, 31.0, 13.0, 12.0, 11.0, 7.0, 7.0, 2.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.05859375, -6.83331298828125, -6.6080322265625, -6.38275146484375, -6.157470703125, -5.93218994140625, -5.7069091796875, -5.48162841796875, -5.25634765625, -5.03106689453125, -4.8057861328125, -4.58050537109375, -4.355224609375, -4.12994384765625, -3.9046630859375, -3.67938232421875, -3.4541015625, -3.22882080078125, -3.0035400390625, -2.77825927734375, -2.552978515625, -2.32769775390625, -2.1024169921875, -1.87713623046875, -1.65185546875, -1.42657470703125, -1.2012939453125, -0.97601318359375, -0.750732421875, -0.52545166015625, -0.3001708984375, -0.07489013671875, 0.150390625, 0.37567138671875, 0.6009521484375, 0.82623291015625, 1.051513671875, 1.27679443359375, 1.5020751953125, 1.72735595703125, 1.95263671875, 2.17791748046875, 2.4031982421875, 2.62847900390625, 2.853759765625, 3.07904052734375, 3.3043212890625, 3.52960205078125, 3.7548828125, 3.98016357421875, 4.2054443359375, 4.43072509765625, 4.656005859375, 4.88128662109375, 5.1065673828125, 5.33184814453125, 5.55712890625, 5.78240966796875, 6.0076904296875, 6.23297119140625, 6.458251953125, 6.68353271484375, 6.9088134765625, 7.13409423828125, 7.359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 9.0, 9.0, 12.0, 13.0, 25.0, 37.0, 56.0, 83.0, 95.0, 132.0, 118.0, 122.0, 98.0, 60.0, 40.0, 30.0, 18.0, 13.0, 12.0, 6.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8984375, -10.512939453125, -10.12744140625, -9.741943359375, -9.3564453125, -8.970947265625, -8.58544921875, -8.199951171875, -7.814453125, -7.428955078125, -7.04345703125, -6.657958984375, -6.2724609375, -5.886962890625, -5.50146484375, -5.115966796875, -4.73046875, -4.344970703125, -3.95947265625, -3.573974609375, -3.1884765625, -2.802978515625, -2.41748046875, -2.031982421875, -1.646484375, -1.260986328125, -0.87548828125, -0.489990234375, -0.1044921875, 0.281005859375, 0.66650390625, 1.052001953125, 1.4375, 1.822998046875, 2.20849609375, 2.593994140625, 2.9794921875, 3.364990234375, 3.75048828125, 4.135986328125, 4.521484375, 4.906982421875, 5.29248046875, 5.677978515625, 6.0634765625, 6.448974609375, 6.83447265625, 7.219970703125, 7.60546875, 7.990966796875, 8.37646484375, 8.761962890625, 9.1474609375, 9.532958984375, 9.91845703125, 10.303955078125, 10.689453125, 11.074951171875, 11.46044921875, 11.845947265625, 12.2314453125, 12.616943359375, 13.00244140625, 13.387939453125, 13.7734375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 16.0, 29.0, 105.0, 223.0, 271.0, 190.0, 88.0, 37.0, 21.0, 11.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.9130554199219, -271.9813232421875, -265.049560546875, -258.1178283691406, -251.1860809326172, -244.25433349609375, -237.3225860595703, -230.39083862304688, -223.4591064453125, -216.52735900878906, -209.59561157226562, -202.66387939453125, -195.7321319580078, -188.80038452148438, -181.86863708496094, -174.9368896484375, -168.00515747070312, -161.0734100341797, -154.14166259765625, -147.20993041992188, -140.27818298339844, -133.346435546875, -126.41468811035156, -119.48294830322266, -112.55119323730469, -105.61944580078125, -98.68770599365234, -91.7559585571289, -84.82421875, -77.89247131347656, -70.96072387695312, -64.02898406982422, -57.09724426269531, -50.16550064086914, -43.23375701904297, -36.30200958251953, -29.370267868041992, -22.438522338867188, -15.506778717041016, -8.575035095214844, -1.6432914733886719, 5.288452625274658, 12.220196723937988, 19.151941299438477, 26.08368492126465, 33.01543045043945, 39.947174072265625, 46.8789176940918, 53.81066131591797, 60.74240493774414, 67.67414855957031, 74.60589599609375, 81.53763580322266, 88.4693832397461, 95.401123046875, 102.33287048339844, 109.26461791992188, 116.19636535644531, 123.12810516357422, 130.05984497070312, 136.99159240722656, 143.92333984375, 150.85508728027344, 157.78683471679688, 164.71856689453125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 3.0, 8.0, 3.0, 11.0, 11.0, 12.0, 18.0, 19.0, 18.0, 22.0, 18.0, 25.0, 28.0, 41.0, 44.0, 47.0, 56.0, 47.0, 56.0, 60.0, 62.0, 52.0, 35.0, 51.0, 35.0, 36.0, 30.0, 33.0, 22.0, 14.0, 18.0, 14.0, 12.0, 8.0, 3.0, 7.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-156.32781982421875, -152.07965087890625, -147.83148193359375, -143.5832977294922, -139.3351287841797, -135.0869598388672, -130.8387908935547, -126.59062194824219, -122.34244537353516, -118.09427642822266, -113.84609985351562, -109.59793090820312, -105.34976196289062, -101.1015853881836, -96.8534164428711, -92.60523986816406, -88.35707092285156, -84.10890197753906, -79.86072540283203, -75.61255645751953, -71.3643798828125, -67.1162109375, -62.8680419921875, -58.619869232177734, -54.37169647216797, -50.1235237121582, -45.87535095214844, -41.62718200683594, -37.37900924682617, -33.130836486816406, -28.882665634155273, -24.63449478149414, -20.386337280273438, -16.138164520263672, -11.889993667602539, -7.64182186126709, -3.3936500549316406, 0.854522705078125, 5.102693557739258, 9.35086441040039, 13.599037170410156, 17.847209930419922, 22.095380783081055, 26.343551635742188, 30.591724395751953, 34.83989715576172, 39.08806610107422, 43.336238861083984, 47.58441162109375, 51.832584381103516, 56.08075714111328, 60.32892608642578, 64.57710266113281, 68.82527160644531, 73.07344055175781, 77.32160949707031, 81.56978607177734, 85.81795501708984, 90.06613159179688, 94.31430053710938, 98.56246948242188, 102.8106460571289, 107.0588150024414, 111.30699157714844, 115.55516052246094]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 13.0, 11.0, 11.0, 14.0, 20.0, 30.0, 35.0, 42.0, 61.0, 76.0, 86.0, 121.0, 227.0, 374.0, 1128.0, 4032.0, 33027.0, 4111410.0, 36752.0, 4344.0, 1207.0, 467.0, 237.0, 126.0, 100.0, 67.0, 48.0, 39.0, 33.0, 26.0, 23.0, 25.0, 16.0, 14.0, 8.0, 7.0, 1.0, 8.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.40625, -24.57373046875, -23.7412109375, -22.90869140625, -22.076171875, -21.24365234375, -20.4111328125, -19.57861328125, -18.74609375, -17.91357421875, -17.0810546875, -16.24853515625, -15.416015625, -14.58349609375, -13.7509765625, -12.91845703125, -12.0859375, -11.25341796875, -10.4208984375, -9.58837890625, -8.755859375, -7.92333984375, -7.0908203125, -6.25830078125, -5.42578125, -4.59326171875, -3.7607421875, -2.92822265625, -2.095703125, -1.26318359375, -0.4306640625, 0.40185546875, 1.234375, 2.06689453125, 2.8994140625, 3.73193359375, 4.564453125, 5.39697265625, 6.2294921875, 7.06201171875, 7.89453125, 8.72705078125, 9.5595703125, 10.39208984375, 11.224609375, 12.05712890625, 12.8896484375, 13.72216796875, 14.5546875, 15.38720703125, 16.2197265625, 17.05224609375, 17.884765625, 18.71728515625, 19.5498046875, 20.38232421875, 21.21484375, 22.04736328125, 22.8798828125, 23.71240234375, 24.544921875, 25.37744140625, 26.2099609375, 27.04248046875, 27.875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 8.0, 4.0, 8.0, 8.0, 12.0, 18.0, 21.0, 24.0, 32.0, 32.0, 33.0, 36.0, 37.0, 46.0, 60.0, 49.0, 86.0, 52.0, 55.0, 46.0, 50.0, 47.0, 34.0, 37.0, 32.0, 27.0, 23.0, 17.0, 11.0, 9.0, 11.0, 7.0, 5.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0], "bins": [-7.71484375, -7.52978515625, -7.3447265625, -7.15966796875, -6.974609375, -6.78955078125, -6.6044921875, -6.41943359375, -6.234375, -6.04931640625, -5.8642578125, -5.67919921875, -5.494140625, -5.30908203125, -5.1240234375, -4.93896484375, -4.75390625, -4.56884765625, -4.3837890625, -4.19873046875, -4.013671875, -3.82861328125, -3.6435546875, -3.45849609375, -3.2734375, -3.08837890625, -2.9033203125, -2.71826171875, -2.533203125, -2.34814453125, -2.1630859375, -1.97802734375, -1.79296875, -1.60791015625, -1.4228515625, -1.23779296875, -1.052734375, -0.86767578125, -0.6826171875, -0.49755859375, -0.3125, -0.12744140625, 0.0576171875, 0.24267578125, 0.427734375, 0.61279296875, 0.7978515625, 0.98291015625, 1.16796875, 1.35302734375, 1.5380859375, 1.72314453125, 1.908203125, 2.09326171875, 2.2783203125, 2.46337890625, 2.6484375, 2.83349609375, 3.0185546875, 3.20361328125, 3.388671875, 3.57373046875, 3.7587890625, 3.94384765625, 4.12890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 4.0, 8.0, 7.0, 12.0, 15.0, 39.0, 20.0, 41.0, 46.0, 83.0, 104.0, 128.0, 185.0, 295.0, 438.0, 659.0, 1093.0, 1850.0, 3570.0, 8478.0, 26347.0, 233906.0, 3817566.0, 71594.0, 15224.0, 5690.0, 2724.0, 1509.0, 866.0, 588.0, 368.0, 208.0, 140.0, 129.0, 101.0, 65.0, 41.0, 44.0, 29.0, 21.0, 8.0, 10.0, 7.0, 2.0, 11.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.1171875, -14.67626953125, -14.2353515625, -13.79443359375, -13.353515625, -12.91259765625, -12.4716796875, -12.03076171875, -11.58984375, -11.14892578125, -10.7080078125, -10.26708984375, -9.826171875, -9.38525390625, -8.9443359375, -8.50341796875, -8.0625, -7.62158203125, -7.1806640625, -6.73974609375, -6.298828125, -5.85791015625, -5.4169921875, -4.97607421875, -4.53515625, -4.09423828125, -3.6533203125, -3.21240234375, -2.771484375, -2.33056640625, -1.8896484375, -1.44873046875, -1.0078125, -0.56689453125, -0.1259765625, 0.31494140625, 0.755859375, 1.19677734375, 1.6376953125, 2.07861328125, 2.51953125, 2.96044921875, 3.4013671875, 3.84228515625, 4.283203125, 4.72412109375, 5.1650390625, 5.60595703125, 6.046875, 6.48779296875, 6.9287109375, 7.36962890625, 7.810546875, 8.25146484375, 8.6923828125, 9.13330078125, 9.57421875, 10.01513671875, 10.4560546875, 10.89697265625, 11.337890625, 11.77880859375, 12.2197265625, 12.66064453125, 13.1015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 11.0, 12.0, 15.0, 31.0, 46.0, 201.0, 3202.0, 406.0, 79.0, 34.0, 13.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3828125, -8.16619873046875, -7.9495849609375, -7.73297119140625, -7.516357421875, -7.29974365234375, -7.0831298828125, -6.86651611328125, -6.64990234375, -6.43328857421875, -6.2166748046875, -6.00006103515625, -5.783447265625, -5.56683349609375, -5.3502197265625, -5.13360595703125, -4.9169921875, -4.70037841796875, -4.4837646484375, -4.26715087890625, -4.050537109375, -3.83392333984375, -3.6173095703125, -3.40069580078125, -3.18408203125, -2.96746826171875, -2.7508544921875, -2.53424072265625, -2.317626953125, -2.10101318359375, -1.8843994140625, -1.66778564453125, -1.451171875, -1.23455810546875, -1.0179443359375, -0.80133056640625, -0.584716796875, -0.36810302734375, -0.1514892578125, 0.06512451171875, 0.28173828125, 0.49835205078125, 0.7149658203125, 0.93157958984375, 1.148193359375, 1.36480712890625, 1.5814208984375, 1.79803466796875, 2.0146484375, 2.23126220703125, 2.4478759765625, 2.66448974609375, 2.881103515625, 3.09771728515625, 3.3143310546875, 3.53094482421875, 3.74755859375, 3.96417236328125, 4.1807861328125, 4.39739990234375, 4.614013671875, 4.83062744140625, 5.0472412109375, 5.26385498046875, 5.48046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 12.0, 12.0, 28.0, 35.0, 66.0, 86.0, 108.0, 142.0, 145.0, 140.0, 85.0, 56.0, 32.0, 20.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.008729934692383, -20.412391662597656, -19.816055297851562, -19.219717025756836, -18.62337875366211, -18.027042388916016, -17.43070411682129, -16.834365844726562, -16.23802947998047, -15.641692161560059, -15.045353889465332, -14.449016571044922, -13.852678298950195, -13.256340980529785, -12.660003662109375, -12.063665390014648, -11.467327117919922, -10.870989799499512, -10.274651527404785, -9.678314208984375, -9.081975936889648, -8.485638618469238, -7.889301300048828, -7.29296350479126, -6.696625709533691, -6.100287914276123, -5.503950119018555, -4.9076128005981445, -4.311275005340576, -3.714937210083008, -3.1185996532440186, -2.5222620964050293, -1.9259262084960938, -1.329588532447815, -0.7332508563995361, -0.13691318035125732, 0.4594244956970215, 1.0557622909545898, 1.652099847793579, 2.2484374046325684, 2.8447751998901367, 3.441112995147705, 4.037450790405273, 4.633788108825684, 5.230125904083252, 5.82646369934082, 6.4228010177612305, 7.019138813018799, 7.615476608276367, 8.211813926696777, 8.808152198791504, 9.404489517211914, 10.00082778930664, 10.59716510772705, 11.193502426147461, 11.789840698242188, 12.386178016662598, 12.982515335083008, 13.578853607177734, 14.175190925598145, 14.771528244018555, 15.367866516113281, 15.964203834533691, 16.5605411529541, 17.156879425048828]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 8.0, 11.0, 5.0, 11.0, 9.0, 13.0, 16.0, 25.0, 17.0, 29.0, 25.0, 28.0, 34.0, 27.0, 40.0, 37.0, 42.0, 48.0, 35.0, 52.0, 41.0, 41.0, 35.0, 47.0, 41.0, 37.0, 31.0, 27.0, 30.0, 20.0, 23.0, 21.0, 22.0, 10.0, 11.0, 9.0, 12.0, 11.0, 5.0, 4.0, 2.0, 2.0, 8.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.277486801147461, -8.947338104248047, -8.617189407348633, -8.287041664123535, -7.956892967224121, -7.626744270324707, -7.296595573425293, -6.966446876525879, -6.636298656463623, -6.306149959564209, -5.976001739501953, -5.645853042602539, -5.315704345703125, -4.985556125640869, -4.655407428741455, -4.325259208679199, -3.995110511779785, -3.66496205329895, -3.3348135948181152, -3.004664897918701, -2.674516439437866, -2.3443679809570312, -2.014219284057617, -1.6840708255767822, -1.3539223670959473, -1.0237739086151123, -0.6936253309249878, -0.36347681283950806, -0.03332829475402832, 0.29682016372680664, 0.6269687414169312, 0.9571173191070557, 1.2872648239135742, 1.6174132823944092, 1.9475618600845337, 2.277710437774658, 2.607858896255493, 2.938007354736328, 3.268156051635742, 3.598304510116577, 3.928452968597412, 4.258601665496826, 4.588749885559082, 4.918898582458496, 5.24904727935791, 5.579195499420166, 5.90934419631958, 6.239492416381836, 6.56964111328125, 6.899789810180664, 7.22993803024292, 7.560086727142334, 7.89023494720459, 8.220383644104004, 8.550532341003418, 8.880681037902832, 9.21082878112793, 9.540977478027344, 9.871126174926758, 10.201273918151855, 10.53142261505127, 10.861571311950684, 11.191720008850098, 11.521868705749512, 11.852017402648926]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 13.0, 20.0, 25.0, 41.0, 60.0, 106.0, 137.0, 245.0, 415.0, 685.0, 1252.0, 2601.0, 5721.0, 14299.0, 39410.0, 119624.0, 316177.0, 338669.0, 136059.0, 44668.0, 15835.0, 6445.0, 2844.0, 1364.0, 728.0, 400.0, 254.0, 138.0, 91.0, 58.0, 49.0, 23.0, 14.0, 20.0, 12.0, 13.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.765625, -8.4921875, -8.21875, -7.9453125, -7.671875, -7.3984375, -7.125, -6.8515625, -6.578125, -6.3046875, -6.03125, -5.7578125, -5.484375, -5.2109375, -4.9375, -4.6640625, -4.390625, -4.1171875, -3.84375, -3.5703125, -3.296875, -3.0234375, -2.75, -2.4765625, -2.203125, -1.9296875, -1.65625, -1.3828125, -1.109375, -0.8359375, -0.5625, -0.2890625, -0.015625, 0.2578125, 0.53125, 0.8046875, 1.078125, 1.3515625, 1.625, 1.8984375, 2.171875, 2.4453125, 2.71875, 2.9921875, 3.265625, 3.5390625, 3.8125, 4.0859375, 4.359375, 4.6328125, 4.90625, 5.1796875, 5.453125, 5.7265625, 6.0, 6.2734375, 6.546875, 6.8203125, 7.09375, 7.3671875, 7.640625, 7.9140625, 8.1875, 8.4609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 5.0, 6.0, 16.0, 19.0, 15.0, 20.0, 21.0, 27.0, 28.0, 38.0, 44.0, 30.0, 33.0, 56.0, 48.0, 55.0, 37.0, 44.0, 50.0, 43.0, 42.0, 42.0, 43.0, 42.0, 25.0, 24.0, 28.0, 25.0, 13.0, 16.0, 7.0, 7.0, 8.0, 3.0, 6.0, 4.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0], "bins": [-6.171875, -6.0108642578125, -5.849853515625, -5.6888427734375, -5.52783203125, -5.3668212890625, -5.205810546875, -5.0447998046875, -4.8837890625, -4.7227783203125, -4.561767578125, -4.4007568359375, -4.23974609375, -4.0787353515625, -3.917724609375, -3.7567138671875, -3.595703125, -3.4346923828125, -3.273681640625, -3.1126708984375, -2.95166015625, -2.7906494140625, -2.629638671875, -2.4686279296875, -2.3076171875, -2.1466064453125, -1.985595703125, -1.8245849609375, -1.66357421875, -1.5025634765625, -1.341552734375, -1.1805419921875, -1.01953125, -0.8585205078125, -0.697509765625, -0.5364990234375, -0.37548828125, -0.2144775390625, -0.053466796875, 0.1075439453125, 0.2685546875, 0.4295654296875, 0.590576171875, 0.7515869140625, 0.91259765625, 1.0736083984375, 1.234619140625, 1.3956298828125, 1.556640625, 1.7176513671875, 1.878662109375, 2.0396728515625, 2.20068359375, 2.3616943359375, 2.522705078125, 2.6837158203125, 2.8447265625, 3.0057373046875, 3.166748046875, 3.3277587890625, 3.48876953125, 3.6497802734375, 3.810791015625, 3.9718017578125, 4.1328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 10.0, 19.0, 29.0, 41.0, 70.0, 134.0, 253.0, 632.0, 1698.0, 6447.0, 44812.0, 614629.0, 346959.0, 26100.0, 4481.0, 1256.0, 494.0, 193.0, 128.0, 63.0, 36.0, 16.0, 22.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.484375, -17.796630859375, -17.10888671875, -16.421142578125, -15.7333984375, -15.045654296875, -14.35791015625, -13.670166015625, -12.982421875, -12.294677734375, -11.60693359375, -10.919189453125, -10.2314453125, -9.543701171875, -8.85595703125, -8.168212890625, -7.48046875, -6.792724609375, -6.10498046875, -5.417236328125, -4.7294921875, -4.041748046875, -3.35400390625, -2.666259765625, -1.978515625, -1.290771484375, -0.60302734375, 0.084716796875, 0.7724609375, 1.460205078125, 2.14794921875, 2.835693359375, 3.5234375, 4.211181640625, 4.89892578125, 5.586669921875, 6.2744140625, 6.962158203125, 7.64990234375, 8.337646484375, 9.025390625, 9.713134765625, 10.40087890625, 11.088623046875, 11.7763671875, 12.464111328125, 13.15185546875, 13.839599609375, 14.52734375, 15.215087890625, 15.90283203125, 16.590576171875, 17.2783203125, 17.966064453125, 18.65380859375, 19.341552734375, 20.029296875, 20.717041015625, 21.40478515625, 22.092529296875, 22.7802734375, 23.468017578125, 24.15576171875, 24.843505859375, 25.53125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 13.0, 21.0, 23.0, 29.0, 25.0, 27.0, 39.0, 42.0, 45.0, 57.0, 44.0, 40.0, 65.0, 54.0, 39.0, 39.0, 48.0, 40.0, 42.0, 33.0, 30.0, 31.0, 28.0, 27.0, 16.0, 16.0, 10.0, 7.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.296875, -24.46240234375, -23.6279296875, -22.79345703125, -21.958984375, -21.12451171875, -20.2900390625, -19.45556640625, -18.62109375, -17.78662109375, -16.9521484375, -16.11767578125, -15.283203125, -14.44873046875, -13.6142578125, -12.77978515625, -11.9453125, -11.11083984375, -10.2763671875, -9.44189453125, -8.607421875, -7.77294921875, -6.9384765625, -6.10400390625, -5.26953125, -4.43505859375, -3.6005859375, -2.76611328125, -1.931640625, -1.09716796875, -0.2626953125, 0.57177734375, 1.40625, 2.24072265625, 3.0751953125, 3.90966796875, 4.744140625, 5.57861328125, 6.4130859375, 7.24755859375, 8.08203125, 8.91650390625, 9.7509765625, 10.58544921875, 11.419921875, 12.25439453125, 13.0888671875, 13.92333984375, 14.7578125, 15.59228515625, 16.4267578125, 17.26123046875, 18.095703125, 18.93017578125, 19.7646484375, 20.59912109375, 21.43359375, 22.26806640625, 23.1025390625, 23.93701171875, 24.771484375, 25.60595703125, 26.4404296875, 27.27490234375, 28.109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 2.0, 2.0, 10.0, 8.0, 8.0, 15.0, 12.0, 15.0, 24.0, 51.0, 69.0, 121.0, 263.0, 699.0, 2644.0, 22429.0, 797491.0, 213513.0, 8661.0, 1543.0, 452.0, 203.0, 112.0, 53.0, 35.0, 22.0, 17.0, 17.0, 12.0, 7.0, 10.0, 6.0, 5.0, 3.0, 4.0, 5.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.921875, -14.4931640625, -14.064453125, -13.6357421875, -13.20703125, -12.7783203125, -12.349609375, -11.9208984375, -11.4921875, -11.0634765625, -10.634765625, -10.2060546875, -9.77734375, -9.3486328125, -8.919921875, -8.4912109375, -8.0625, -7.6337890625, -7.205078125, -6.7763671875, -6.34765625, -5.9189453125, -5.490234375, -5.0615234375, -4.6328125, -4.2041015625, -3.775390625, -3.3466796875, -2.91796875, -2.4892578125, -2.060546875, -1.6318359375, -1.203125, -0.7744140625, -0.345703125, 0.0830078125, 0.51171875, 0.9404296875, 1.369140625, 1.7978515625, 2.2265625, 2.6552734375, 3.083984375, 3.5126953125, 3.94140625, 4.3701171875, 4.798828125, 5.2275390625, 5.65625, 6.0849609375, 6.513671875, 6.9423828125, 7.37109375, 7.7998046875, 8.228515625, 8.6572265625, 9.0859375, 9.5146484375, 9.943359375, 10.3720703125, 10.80078125, 11.2294921875, 11.658203125, 12.0869140625, 12.515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 10.0, 17.0, 25.0, 37.0, 54.0, 78.0, 88.0, 128.0, 131.0, 115.0, 100.0, 71.0, 40.0, 28.0, 23.0, 17.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001277923583984375, -0.0012341439723968506, -0.0011903643608093262, -0.0011465847492218018, -0.0011028051376342773, -0.001059025526046753, -0.0010152459144592285, -0.0009714663028717041, -0.0009276866912841797, -0.0008839070796966553, -0.0008401274681091309, -0.0007963478565216064, -0.000752568244934082, -0.0007087886333465576, -0.0006650090217590332, -0.0006212294101715088, -0.0005774497985839844, -0.00053367018699646, -0.0004898905754089355, -0.00044611096382141113, -0.0004023313522338867, -0.0003585517406463623, -0.0003147721290588379, -0.0002709925174713135, -0.00022721290588378906, -0.00018343329429626465, -0.00013965368270874023, -9.587407112121582e-05, -5.2094459533691406e-05, -8.314847946166992e-06, 3.546476364135742e-05, 7.924437522888184e-05, 0.00012302398681640625, 0.00016680359840393066, 0.00021058320999145508, 0.0002543628215789795, 0.0002981424331665039, 0.0003419220447540283, 0.00038570165634155273, 0.00042948126792907715, 0.00047326087951660156, 0.000517040491104126, 0.0005608201026916504, 0.0006045997142791748, 0.0006483793258666992, 0.0006921589374542236, 0.000735938549041748, 0.0007797181606292725, 0.0008234977722167969, 0.0008672773838043213, 0.0009110569953918457, 0.0009548366069793701, 0.0009986162185668945, 0.001042395830154419, 0.0010861754417419434, 0.0011299550533294678, 0.0011737346649169922, 0.0012175142765045166, 0.001261293888092041, 0.0013050734996795654, 0.0013488531112670898, 0.0013926327228546143, 0.0014364123344421387, 0.001480191946029663, 0.0015239715576171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 12.0, 12.0, 31.0, 44.0, 79.0, 175.0, 476.0, 2005.0, 22144.0, 951248.0, 67992.0, 3261.0, 672.0, 222.0, 92.0, 39.0, 30.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.3878173828125, -13.752197265625, -13.1165771484375, -12.48095703125, -11.8453369140625, -11.209716796875, -10.5740966796875, -9.9384765625, -9.3028564453125, -8.667236328125, -8.0316162109375, -7.39599609375, -6.7603759765625, -6.124755859375, -5.4891357421875, -4.853515625, -4.2178955078125, -3.582275390625, -2.9466552734375, -2.31103515625, -1.6754150390625, -1.039794921875, -0.4041748046875, 0.2314453125, 0.8670654296875, 1.502685546875, 2.1383056640625, 2.77392578125, 3.4095458984375, 4.045166015625, 4.6807861328125, 5.31640625, 5.9520263671875, 6.587646484375, 7.2232666015625, 7.85888671875, 8.4945068359375, 9.130126953125, 9.7657470703125, 10.4013671875, 11.0369873046875, 11.672607421875, 12.3082275390625, 12.94384765625, 13.5794677734375, 14.215087890625, 14.8507080078125, 15.486328125, 16.1219482421875, 16.757568359375, 17.3931884765625, 18.02880859375, 18.6644287109375, 19.300048828125, 19.9356689453125, 20.5712890625, 21.2069091796875, 21.842529296875, 22.4781494140625, 23.11376953125, 23.7493896484375, 24.385009765625, 25.0206298828125, 25.65625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 8.0, 8.0, 22.0, 19.0, 42.0, 67.0, 85.0, 133.0, 143.0, 115.0, 113.0, 85.0, 56.0, 32.0, 12.0, 13.0, 10.0, 12.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1015625, -13.7470703125, -13.392578125, -13.0380859375, -12.68359375, -12.3291015625, -11.974609375, -11.6201171875, -11.265625, -10.9111328125, -10.556640625, -10.2021484375, -9.84765625, -9.4931640625, -9.138671875, -8.7841796875, -8.4296875, -8.0751953125, -7.720703125, -7.3662109375, -7.01171875, -6.6572265625, -6.302734375, -5.9482421875, -5.59375, -5.2392578125, -4.884765625, -4.5302734375, -4.17578125, -3.8212890625, -3.466796875, -3.1123046875, -2.7578125, -2.4033203125, -2.048828125, -1.6943359375, -1.33984375, -0.9853515625, -0.630859375, -0.2763671875, 0.078125, 0.4326171875, 0.787109375, 1.1416015625, 1.49609375, 1.8505859375, 2.205078125, 2.5595703125, 2.9140625, 3.2685546875, 3.623046875, 3.9775390625, 4.33203125, 4.6865234375, 5.041015625, 5.3955078125, 5.75, 6.1044921875, 6.458984375, 6.8134765625, 7.16796875, 7.5224609375, 7.876953125, 8.2314453125, 8.5859375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 21.0, 58.0, 304.0, 449.0, 137.0, 25.0, 2.0, 3.0, 2.0, 4.0], "bins": [-755.94287109375, -742.769287109375, -729.595703125, -716.422119140625, -703.24853515625, -690.074951171875, -676.9013671875, -663.7278442382812, -650.5542602539062, -637.3806762695312, -624.2070922851562, -611.0335083007812, -597.8599243164062, -584.6864013671875, -571.5128173828125, -558.3392333984375, -545.1656494140625, -531.9920654296875, -518.8184814453125, -505.6448974609375, -492.4713439941406, -479.2977600097656, -466.1241760253906, -452.9505920410156, -439.7769775390625, -426.6033935546875, -413.4298095703125, -400.2562255859375, -387.0826721191406, -373.9090881347656, -360.7355041503906, -347.5619201660156, -334.38836669921875, -321.21478271484375, -308.04119873046875, -294.86761474609375, -281.6940612792969, -268.5204772949219, -255.34689331054688, -242.17330932617188, -228.99972534179688, -215.82614135742188, -202.65257263183594, -189.47898864746094, -176.305419921875, -163.1318359375, -149.958251953125, -136.78466796875, -123.61109924316406, -110.4375228881836, -97.26394653320312, -84.09036254882812, -70.91678619384766, -57.74320983886719, -44.56962585449219, -31.39604949951172, -18.22247314453125, -5.048894882202148, 8.124683380126953, 21.298263549804688, 34.471839904785156, 47.645416259765625, 60.819000244140625, 73.9925765991211, 87.16615295410156]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 11.0, 4.0, 12.0, 14.0, 16.0, 19.0, 27.0, 25.0, 37.0, 55.0, 49.0, 68.0, 59.0, 74.0, 68.0, 54.0, 64.0, 64.0, 42.0, 53.0, 32.0, 36.0, 31.0, 27.0, 12.0, 16.0, 9.0, 6.0, 8.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-200.82382202148438, -195.7283477783203, -190.6328582763672, -185.53738403320312, -180.44190979003906, -175.346435546875, -170.25094604492188, -165.1554718017578, -160.05999755859375, -154.9645233154297, -149.86903381347656, -144.7735595703125, -139.67808532714844, -134.58261108398438, -129.48712158203125, -124.39164733886719, -119.29615783691406, -114.20067596435547, -109.1052017211914, -104.00971984863281, -98.91424560546875, -93.81876373291016, -88.72328186035156, -83.6278076171875, -78.5323257446289, -73.43684387207031, -68.34136962890625, -63.245887756347656, -58.15040969848633, -53.054931640625, -47.959449768066406, -42.86397171020508, -37.76847839355469, -32.67300033569336, -27.5775203704834, -22.482040405273438, -17.38656234741211, -12.291084289550781, -7.19560432434082, -2.1001243591308594, 2.9953536987304688, 8.090832710266113, 13.186311721801758, 18.28179168701172, 23.377269744873047, 28.472747802734375, 33.56822967529297, 38.6637077331543, 43.759185791015625, 48.85466384887695, 53.95014190673828, 59.045623779296875, 64.14109802246094, 69.23657989501953, 74.33206176757812, 79.42753601074219, 84.52301788330078, 89.61849975585938, 94.71397399902344, 99.80945587158203, 104.90493774414062, 110.00041198730469, 115.09589385986328, 120.19137573242188, 125.28684997558594]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 5.0, 8.0, 16.0, 23.0, 18.0, 54.0, 55.0, 83.0, 136.0, 232.0, 358.0, 583.0, 930.0, 1648.0, 3245.0, 7260.0, 21701.0, 148895.0, 3940536.0, 46002.0, 12078.0, 4839.0, 2396.0, 1278.0, 733.0, 410.0, 269.0, 180.0, 103.0, 72.0, 44.0, 36.0, 20.0, 16.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.9375, -11.6170654296875, -11.296630859375, -10.9761962890625, -10.65576171875, -10.3353271484375, -10.014892578125, -9.6944580078125, -9.3740234375, -9.0535888671875, -8.733154296875, -8.4127197265625, -8.09228515625, -7.7718505859375, -7.451416015625, -7.1309814453125, -6.810546875, -6.4901123046875, -6.169677734375, -5.8492431640625, -5.52880859375, -5.2083740234375, -4.887939453125, -4.5675048828125, -4.2470703125, -3.9266357421875, -3.606201171875, -3.2857666015625, -2.96533203125, -2.6448974609375, -2.324462890625, -2.0040283203125, -1.68359375, -1.3631591796875, -1.042724609375, -0.7222900390625, -0.40185546875, -0.0814208984375, 0.239013671875, 0.5594482421875, 0.8798828125, 1.2003173828125, 1.520751953125, 1.8411865234375, 2.16162109375, 2.4820556640625, 2.802490234375, 3.1229248046875, 3.443359375, 3.7637939453125, 4.084228515625, 4.4046630859375, 4.72509765625, 5.0455322265625, 5.365966796875, 5.6864013671875, 6.0068359375, 6.3272705078125, 6.647705078125, 6.9681396484375, 7.28857421875, 7.6090087890625, 7.929443359375, 8.2498779296875, 8.5703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 13.0, 21.0, 31.0, 36.0, 49.0, 46.0, 47.0, 53.0, 83.0, 72.0, 74.0, 69.0, 74.0, 53.0, 71.0, 55.0, 34.0, 25.0, 30.0, 22.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.1231689453125, -8.871337890625, -8.6195068359375, -8.36767578125, -8.1158447265625, -7.864013671875, -7.6121826171875, -7.3603515625, -7.1085205078125, -6.856689453125, -6.6048583984375, -6.35302734375, -6.1011962890625, -5.849365234375, -5.5975341796875, -5.345703125, -5.0938720703125, -4.842041015625, -4.5902099609375, -4.33837890625, -4.0865478515625, -3.834716796875, -3.5828857421875, -3.3310546875, -3.0792236328125, -2.827392578125, -2.5755615234375, -2.32373046875, -2.0718994140625, -1.820068359375, -1.5682373046875, -1.31640625, -1.0645751953125, -0.812744140625, -0.5609130859375, -0.30908203125, -0.0572509765625, 0.194580078125, 0.4464111328125, 0.6982421875, 0.9500732421875, 1.201904296875, 1.4537353515625, 1.70556640625, 1.9573974609375, 2.209228515625, 2.4610595703125, 2.712890625, 2.9647216796875, 3.216552734375, 3.4683837890625, 3.72021484375, 3.9720458984375, 4.223876953125, 4.4757080078125, 4.7275390625, 4.9793701171875, 5.231201171875, 5.4830322265625, 5.73486328125, 5.9866943359375, 6.238525390625, 6.4903564453125, 6.7421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 12.0, 10.0, 8.0, 22.0, 32.0, 41.0, 53.0, 60.0, 88.0, 98.0, 182.0, 243.0, 369.0, 663.0, 1465.0, 3455.0, 11201.0, 70694.0, 4004215.0, 81947.0, 12170.0, 3727.0, 1512.0, 700.0, 376.0, 240.0, 164.0, 106.0, 73.0, 69.0, 69.0, 45.0, 32.0, 32.0, 22.0, 19.0, 15.0, 4.0, 12.0, 8.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.640625, -16.144287109375, -15.64794921875, -15.151611328125, -14.6552734375, -14.158935546875, -13.66259765625, -13.166259765625, -12.669921875, -12.173583984375, -11.67724609375, -11.180908203125, -10.6845703125, -10.188232421875, -9.69189453125, -9.195556640625, -8.69921875, -8.202880859375, -7.70654296875, -7.210205078125, -6.7138671875, -6.217529296875, -5.72119140625, -5.224853515625, -4.728515625, -4.232177734375, -3.73583984375, -3.239501953125, -2.7431640625, -2.246826171875, -1.75048828125, -1.254150390625, -0.7578125, -0.261474609375, 0.23486328125, 0.731201171875, 1.2275390625, 1.723876953125, 2.22021484375, 2.716552734375, 3.212890625, 3.709228515625, 4.20556640625, 4.701904296875, 5.1982421875, 5.694580078125, 6.19091796875, 6.687255859375, 7.18359375, 7.679931640625, 8.17626953125, 8.672607421875, 9.1689453125, 9.665283203125, 10.16162109375, 10.657958984375, 11.154296875, 11.650634765625, 12.14697265625, 12.643310546875, 13.1396484375, 13.635986328125, 14.13232421875, 14.628662109375, 15.125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 1.0, 1.0, 9.0, 5.0, 2.0, 15.0, 23.0, 48.0, 76.0, 235.0, 3245.0, 231.0, 80.0, 32.0, 19.0, 18.0, 10.0, 3.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.2442626953125, -2.129150390625, -2.0140380859375, -1.89892578125, -1.7838134765625, -1.668701171875, -1.5535888671875, -1.4384765625, -1.3233642578125, -1.208251953125, -1.0931396484375, -0.97802734375, -0.8629150390625, -0.747802734375, -0.6326904296875, -0.517578125, -0.4024658203125, -0.287353515625, -0.1722412109375, -0.05712890625, 0.0579833984375, 0.173095703125, 0.2882080078125, 0.4033203125, 0.5184326171875, 0.633544921875, 0.7486572265625, 0.86376953125, 0.9788818359375, 1.093994140625, 1.2091064453125, 1.32421875, 1.4393310546875, 1.554443359375, 1.6695556640625, 1.78466796875, 1.8997802734375, 2.014892578125, 2.1300048828125, 2.2451171875, 2.3602294921875, 2.475341796875, 2.5904541015625, 2.70556640625, 2.8206787109375, 2.935791015625, 3.0509033203125, 3.166015625, 3.2811279296875, 3.396240234375, 3.5113525390625, 3.62646484375, 3.7415771484375, 3.856689453125, 3.9718017578125, 4.0869140625, 4.2020263671875, 4.317138671875, 4.4322509765625, 4.54736328125, 4.6624755859375, 4.777587890625, 4.8927001953125, 5.0078125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 12.0, 26.0, 41.0, 71.0, 109.0, 159.0, 119.0, 142.0, 102.0, 68.0, 57.0, 34.0, 11.0, 8.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03124713897705, -9.516375541687012, -9.001503944396973, -8.486631393432617, -7.971759796142578, -7.456888198852539, -6.9420166015625, -6.427145004272461, -5.912272930145264, -5.397401332855225, -4.882529258728027, -4.367657661437988, -3.85278582572937, -3.337913990020752, -2.823042392730713, -2.3081705570220947, -1.7932987213134766, -1.2784268856048584, -0.7635551691055298, -0.24868345260620117, 0.266188383102417, 0.7810602188110352, 1.2959318161010742, 1.8108036518096924, 2.3256754875183105, 2.8405473232269287, 3.355419158935547, 3.870290756225586, 4.385162353515625, 4.900034427642822, 5.414906024932861, 5.929778099060059, 6.444648742675781, 6.95952033996582, 7.474392414093018, 7.989264011383057, 8.504136085510254, 9.019007682800293, 9.533879280090332, 10.048750877380371, 10.563623428344727, 11.078495025634766, 11.593366622924805, 12.108238220214844, 12.6231107711792, 13.137982368469238, 13.652853965759277, 14.167725563049316, 14.682597160339355, 15.197468757629395, 15.712340354919434, 16.22721290588379, 16.742084503173828, 17.256956100463867, 17.771827697753906, 18.286699295043945, 18.801570892333984, 19.316442489624023, 19.831314086914062, 20.3461856842041, 20.86105728149414, 21.375930786132812, 21.89080047607422, 22.40567398071289, 22.92054557800293]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 8.0, 6.0, 8.0, 17.0, 14.0, 13.0, 11.0, 15.0, 23.0, 31.0, 30.0, 33.0, 40.0, 41.0, 34.0, 33.0, 36.0, 52.0, 40.0, 39.0, 41.0, 37.0, 40.0, 42.0, 36.0, 46.0, 25.0, 30.0, 23.0, 22.0, 24.0, 18.0, 15.0, 11.0, 10.0, 12.0, 7.0, 10.0, 4.0, 5.0, 2.0, 0.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.5951948165893555, -5.411416530609131, -5.227637767791748, -5.043859481811523, -4.860081195831299, -4.676302909851074, -4.492524147033691, -4.308745861053467, -4.124967575073242, -3.9411890506744385, -3.757410764694214, -3.57363224029541, -3.3898539543151855, -3.206075429916382, -3.022296905517578, -2.8385186195373535, -2.6547398567199707, -2.470961332321167, -2.2871830463409424, -2.1034045219421387, -1.9196261167526245, -1.7358477115631104, -1.5520691871643066, -1.3682907819747925, -1.1845123767852783, -1.0007339715957642, -0.8169555068016052, -0.6331770420074463, -0.44939863681793213, -0.26562023162841797, -0.08184170722961426, 0.1019366979598999, 0.28571510314941406, 0.4694935381412506, 0.6532719731330872, 0.8370504379272461, 1.0208288431167603, 1.2046072483062744, 1.3883857727050781, 1.5721641778945923, 1.7559425830841064, 1.9397209882736206, 2.1234993934631348, 2.3072779178619385, 2.491056442260742, 2.674834728240967, 2.8586132526397705, 3.042391777038574, 3.226170063018799, 3.4099485874176025, 3.593726873397827, 3.777505397796631, 3.9612836837768555, 4.145062446594238, 4.328840732574463, 4.5126190185546875, 4.69639778137207, 4.880176067352295, 5.063954830169678, 5.247733116149902, 5.431511402130127, 5.615289688110352, 5.799068450927734, 5.982846736907959, 6.166625022888184]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 12.0, 13.0, 15.0, 28.0, 37.0, 60.0, 109.0, 199.0, 278.0, 524.0, 1055.0, 2143.0, 4987.0, 12508.0, 35257.0, 108838.0, 306704.0, 361673.0, 141077.0, 45877.0, 15878.0, 6048.0, 2572.0, 1225.0, 586.0, 322.0, 211.0, 123.0, 61.0, 54.0, 21.0, 22.0, 10.0, 13.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91015625, -6.64556884765625, -6.3809814453125, -6.11639404296875, -5.851806640625, -5.58721923828125, -5.3226318359375, -5.05804443359375, -4.79345703125, -4.52886962890625, -4.2642822265625, -3.99969482421875, -3.735107421875, -3.47052001953125, -3.2059326171875, -2.94134521484375, -2.6767578125, -2.41217041015625, -2.1475830078125, -1.88299560546875, -1.618408203125, -1.35382080078125, -1.0892333984375, -0.82464599609375, -0.56005859375, -0.29547119140625, -0.0308837890625, 0.23370361328125, 0.498291015625, 0.76287841796875, 1.0274658203125, 1.29205322265625, 1.556640625, 1.82122802734375, 2.0858154296875, 2.35040283203125, 2.614990234375, 2.87957763671875, 3.1441650390625, 3.40875244140625, 3.67333984375, 3.93792724609375, 4.2025146484375, 4.46710205078125, 4.731689453125, 4.99627685546875, 5.2608642578125, 5.52545166015625, 5.7900390625, 6.05462646484375, 6.3192138671875, 6.58380126953125, 6.848388671875, 7.11297607421875, 7.3775634765625, 7.64215087890625, 7.90673828125, 8.17132568359375, 8.4359130859375, 8.70050048828125, 8.965087890625, 9.22967529296875, 9.4942626953125, 9.75885009765625, 10.0234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 9.0, 16.0, 15.0, 32.0, 23.0, 43.0, 41.0, 54.0, 62.0, 65.0, 74.0, 66.0, 80.0, 72.0, 66.0, 61.0, 48.0, 50.0, 33.0, 20.0, 22.0, 16.0, 4.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.8695068359375, -9.614013671875, -9.3585205078125, -9.10302734375, -8.8475341796875, -8.592041015625, -8.3365478515625, -8.0810546875, -7.8255615234375, -7.570068359375, -7.3145751953125, -7.05908203125, -6.8035888671875, -6.548095703125, -6.2926025390625, -6.037109375, -5.7816162109375, -5.526123046875, -5.2706298828125, -5.01513671875, -4.7596435546875, -4.504150390625, -4.2486572265625, -3.9931640625, -3.7376708984375, -3.482177734375, -3.2266845703125, -2.97119140625, -2.7156982421875, -2.460205078125, -2.2047119140625, -1.94921875, -1.6937255859375, -1.438232421875, -1.1827392578125, -0.92724609375, -0.6717529296875, -0.416259765625, -0.1607666015625, 0.0947265625, 0.3502197265625, 0.605712890625, 0.8612060546875, 1.11669921875, 1.3721923828125, 1.627685546875, 1.8831787109375, 2.138671875, 2.3941650390625, 2.649658203125, 2.9051513671875, 3.16064453125, 3.4161376953125, 3.671630859375, 3.9271240234375, 4.1826171875, 4.4381103515625, 4.693603515625, 4.9490966796875, 5.20458984375, 5.4600830078125, 5.715576171875, 5.9710693359375, 6.2265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 7.0, 12.0, 13.0, 11.0, 23.0, 23.0, 43.0, 76.0, 121.0, 229.0, 472.0, 1609.0, 7665.0, 91835.0, 846145.0, 90022.0, 7531.0, 1569.0, 545.0, 248.0, 134.0, 68.0, 49.0, 25.0, 23.0, 11.0, 15.0, 10.0, 6.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.71875, -20.016357421875, -19.31396484375, -18.611572265625, -17.9091796875, -17.206787109375, -16.50439453125, -15.802001953125, -15.099609375, -14.397216796875, -13.69482421875, -12.992431640625, -12.2900390625, -11.587646484375, -10.88525390625, -10.182861328125, -9.48046875, -8.778076171875, -8.07568359375, -7.373291015625, -6.6708984375, -5.968505859375, -5.26611328125, -4.563720703125, -3.861328125, -3.158935546875, -2.45654296875, -1.754150390625, -1.0517578125, -0.349365234375, 0.35302734375, 1.055419921875, 1.7578125, 2.460205078125, 3.16259765625, 3.864990234375, 4.5673828125, 5.269775390625, 5.97216796875, 6.674560546875, 7.376953125, 8.079345703125, 8.78173828125, 9.484130859375, 10.1865234375, 10.888916015625, 11.59130859375, 12.293701171875, 12.99609375, 13.698486328125, 14.40087890625, 15.103271484375, 15.8056640625, 16.508056640625, 17.21044921875, 17.912841796875, 18.615234375, 19.317626953125, 20.02001953125, 20.722412109375, 21.4248046875, 22.127197265625, 22.82958984375, 23.531982421875, 24.234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 7.0, 8.0, 10.0, 12.0, 16.0, 15.0, 22.0, 22.0, 32.0, 26.0, 38.0, 37.0, 32.0, 42.0, 40.0, 47.0, 38.0, 34.0, 34.0, 41.0, 41.0, 44.0, 28.0, 36.0, 41.0, 26.0, 26.0, 29.0, 22.0, 20.0, 14.0, 19.0, 14.0, 7.0, 10.0, 11.0, 10.0, 6.0, 2.0, 3.0, 4.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-23.265625, -22.579833984375, -21.89404296875, -21.208251953125, -20.5224609375, -19.836669921875, -19.15087890625, -18.465087890625, -17.779296875, -17.093505859375, -16.40771484375, -15.721923828125, -15.0361328125, -14.350341796875, -13.66455078125, -12.978759765625, -12.29296875, -11.607177734375, -10.92138671875, -10.235595703125, -9.5498046875, -8.864013671875, -8.17822265625, -7.492431640625, -6.806640625, -6.120849609375, -5.43505859375, -4.749267578125, -4.0634765625, -3.377685546875, -2.69189453125, -2.006103515625, -1.3203125, -0.634521484375, 0.05126953125, 0.737060546875, 1.4228515625, 2.108642578125, 2.79443359375, 3.480224609375, 4.166015625, 4.851806640625, 5.53759765625, 6.223388671875, 6.9091796875, 7.594970703125, 8.28076171875, 8.966552734375, 9.65234375, 10.338134765625, 11.02392578125, 11.709716796875, 12.3955078125, 13.081298828125, 13.76708984375, 14.452880859375, 15.138671875, 15.824462890625, 16.51025390625, 17.196044921875, 17.8818359375, 18.567626953125, 19.25341796875, 19.939208984375, 20.625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 16.0, 28.0, 54.0, 110.0, 267.0, 817.0, 4167.0, 166633.0, 865119.0, 9480.0, 1240.0, 365.0, 109.0, 54.0, 36.0, 17.0, 15.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.84375, -23.3038330078125, -22.763916015625, -22.2239990234375, -21.68408203125, -21.1441650390625, -20.604248046875, -20.0643310546875, -19.5244140625, -18.9844970703125, -18.444580078125, -17.9046630859375, -17.36474609375, -16.8248291015625, -16.284912109375, -15.7449951171875, -15.205078125, -14.6651611328125, -14.125244140625, -13.5853271484375, -13.04541015625, -12.5054931640625, -11.965576171875, -11.4256591796875, -10.8857421875, -10.3458251953125, -9.805908203125, -9.2659912109375, -8.72607421875, -8.1861572265625, -7.646240234375, -7.1063232421875, -6.56640625, -6.0264892578125, -5.486572265625, -4.9466552734375, -4.40673828125, -3.8668212890625, -3.326904296875, -2.7869873046875, -2.2470703125, -1.7071533203125, -1.167236328125, -0.6273193359375, -0.08740234375, 0.4525146484375, 0.992431640625, 1.5323486328125, 2.072265625, 2.6121826171875, 3.152099609375, 3.6920166015625, 4.23193359375, 4.7718505859375, 5.311767578125, 5.8516845703125, 6.3916015625, 6.9315185546875, 7.471435546875, 8.0113525390625, 8.55126953125, 9.0911865234375, 9.631103515625, 10.1710205078125, 10.7109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 16.0, 23.0, 48.0, 100.0, 151.0, 284.0, 163.0, 106.0, 49.0, 25.0, 17.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017795562744140625, -0.0017101466655731201, -0.0016407370567321777, -0.0015713274478912354, -0.001501917839050293, -0.0014325082302093506, -0.0013630986213684082, -0.0012936890125274658, -0.0012242794036865234, -0.001154869794845581, -0.0010854601860046387, -0.0010160505771636963, -0.0009466409683227539, -0.0008772313594818115, -0.0008078217506408691, -0.0007384121417999268, -0.0006690025329589844, -0.000599592924118042, -0.0005301833152770996, -0.0004607737064361572, -0.00039136409759521484, -0.00032195448875427246, -0.0002525448799133301, -0.0001831352710723877, -0.00011372566223144531, -4.431605339050293e-05, 2.5093555450439453e-05, 9.450316429138184e-05, 0.00016391277313232422, 0.0002333223819732666, 0.000302731990814209, 0.00037214159965515137, 0.00044155120849609375, 0.0005109608173370361, 0.0005803704261779785, 0.0006497800350189209, 0.0007191896438598633, 0.0007885992527008057, 0.000858008861541748, 0.0009274184703826904, 0.0009968280792236328, 0.0010662376880645752, 0.0011356472969055176, 0.00120505690574646, 0.0012744665145874023, 0.0013438761234283447, 0.0014132857322692871, 0.0014826953411102295, 0.0015521049499511719, 0.0016215145587921143, 0.0016909241676330566, 0.001760333776473999, 0.0018297433853149414, 0.0018991529941558838, 0.001968562602996826, 0.0020379722118377686, 0.002107381820678711, 0.0021767914295196533, 0.0022462010383605957, 0.002315610647201538, 0.0023850202560424805, 0.002454429864883423, 0.0025238394737243652, 0.0025932490825653076, 0.00266265869140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 8.0, 4.0, 6.0, 10.0, 14.0, 20.0, 22.0, 39.0, 64.0, 71.0, 102.0, 183.0, 289.0, 640.0, 1312.0, 3539.0, 12615.0, 78548.0, 701639.0, 214865.0, 24930.0, 5737.0, 1995.0, 869.0, 439.0, 210.0, 126.0, 69.0, 50.0, 34.0, 19.0, 20.0, 12.0, 11.0, 8.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.55859375, -6.33782958984375, -6.1170654296875, -5.89630126953125, -5.675537109375, -5.45477294921875, -5.2340087890625, -5.01324462890625, -4.79248046875, -4.57171630859375, -4.3509521484375, -4.13018798828125, -3.909423828125, -3.68865966796875, -3.4678955078125, -3.24713134765625, -3.0263671875, -2.80560302734375, -2.5848388671875, -2.36407470703125, -2.143310546875, -1.92254638671875, -1.7017822265625, -1.48101806640625, -1.26025390625, -1.03948974609375, -0.8187255859375, -0.59796142578125, -0.377197265625, -0.15643310546875, 0.0643310546875, 0.28509521484375, 0.505859375, 0.72662353515625, 0.9473876953125, 1.16815185546875, 1.388916015625, 1.60968017578125, 1.8304443359375, 2.05120849609375, 2.27197265625, 2.49273681640625, 2.7135009765625, 2.93426513671875, 3.155029296875, 3.37579345703125, 3.5965576171875, 3.81732177734375, 4.0380859375, 4.25885009765625, 4.4796142578125, 4.70037841796875, 4.921142578125, 5.14190673828125, 5.3626708984375, 5.58343505859375, 5.80419921875, 6.02496337890625, 6.2457275390625, 6.46649169921875, 6.687255859375, 6.90802001953125, 7.1287841796875, 7.34954833984375, 7.5703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 21.0, 14.0, 22.0, 25.0, 52.0, 67.0, 70.0, 92.0, 122.0, 112.0, 106.0, 58.0, 56.0, 50.0, 35.0, 23.0, 10.0, 11.0, 6.0, 12.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.93896484375, -7.6748046875, -7.41064453125, -7.146484375, -6.88232421875, -6.6181640625, -6.35400390625, -6.08984375, -5.82568359375, -5.5615234375, -5.29736328125, -5.033203125, -4.76904296875, -4.5048828125, -4.24072265625, -3.9765625, -3.71240234375, -3.4482421875, -3.18408203125, -2.919921875, -2.65576171875, -2.3916015625, -2.12744140625, -1.86328125, -1.59912109375, -1.3349609375, -1.07080078125, -0.806640625, -0.54248046875, -0.2783203125, -0.01416015625, 0.25, 0.51416015625, 0.7783203125, 1.04248046875, 1.306640625, 1.57080078125, 1.8349609375, 2.09912109375, 2.36328125, 2.62744140625, 2.8916015625, 3.15576171875, 3.419921875, 3.68408203125, 3.9482421875, 4.21240234375, 4.4765625, 4.74072265625, 5.0048828125, 5.26904296875, 5.533203125, 5.79736328125, 6.0615234375, 6.32568359375, 6.58984375, 6.85400390625, 7.1181640625, 7.38232421875, 7.646484375, 7.91064453125, 8.1748046875, 8.43896484375, 8.703125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 27.0, 112.0, 439.0, 324.0, 82.0, 18.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-580.33740234375, -568.9228515625, -557.5083618164062, -546.0938110351562, -534.6792602539062, -523.2647094726562, -511.8502197265625, -500.4356689453125, -489.0211181640625, -477.6065979003906, -466.1920471191406, -454.77752685546875, -443.36297607421875, -431.9484558105469, -420.533935546875, -409.119384765625, -397.7048645019531, -386.29034423828125, -374.87579345703125, -363.4612731933594, -352.0467224121094, -340.6322021484375, -329.2176513671875, -317.8031311035156, -306.38861083984375, -294.9740905761719, -283.5595397949219, -272.14501953125, -260.73046875, -249.31594848632812, -237.9014129638672, -226.48687744140625, -215.0723114013672, -203.65777587890625, -192.2432403564453, -180.82870483398438, -169.4141845703125, -157.9996337890625, -146.58511352539062, -135.1705780029297, -123.75604248046875, -112.34150695800781, -100.92697143554688, -89.51244354248047, -78.09790802001953, -66.6833724975586, -55.26884460449219, -43.85430908203125, -32.43977355957031, -21.025239944458008, -9.610706329345703, 1.8038253784179688, 13.218360900878906, 24.632896423339844, 36.04742431640625, 47.46195983886719, 58.876495361328125, 70.29103088378906, 81.70556640625, 93.1200942993164, 104.53462982177734, 115.94916534423828, 127.36369323730469, 138.77822875976562, 150.19276428222656]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 12.0, 19.0, 14.0, 16.0, 24.0, 25.0, 30.0, 27.0, 30.0, 38.0, 44.0, 44.0, 57.0, 62.0, 59.0, 70.0, 47.0, 54.0, 52.0, 45.0, 33.0, 42.0, 34.0, 18.0, 18.0, 18.0, 13.0, 12.0, 11.0, 4.0, 6.0, 1.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-172.0580596923828, -167.5946807861328, -163.1313018798828, -158.66790771484375, -154.20452880859375, -149.74114990234375, -145.27777099609375, -140.81439208984375, -136.35101318359375, -131.88763427734375, -127.42424774169922, -122.96086883544922, -118.49748992919922, -114.03410339355469, -109.57072448730469, -105.10734558105469, -100.64395904541016, -96.18058013916016, -91.71719360351562, -87.25381469726562, -82.79043579101562, -78.32705688476562, -73.8636703491211, -69.4002914428711, -64.93690490722656, -60.4735221862793, -56.0101432800293, -51.54676055908203, -47.08338165283203, -42.619998931884766, -38.1566162109375, -33.6932373046875, -29.2298583984375, -24.766477584838867, -20.303096771240234, -15.839714050292969, -11.376333236694336, -6.912952423095703, -2.4495697021484375, 2.0138111114501953, 6.477191925048828, 10.940572738647461, 15.40395450592041, 19.86733627319336, 24.330717086791992, 28.794097900390625, 33.25748062133789, 37.720863342285156, 42.184242248535156, 46.64762496948242, 51.11100387573242, 55.57438659667969, 60.03776550292969, 64.50114440917969, 68.96453094482422, 73.42790985107422, 77.89129638671875, 82.35467529296875, 86.81806182861328, 91.28144073486328, 95.74481964111328, 100.20820617675781, 104.67158508300781, 109.13496398925781, 113.59834289550781]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 13.0, 26.0, 24.0, 46.0, 70.0, 187.0, 436.0, 1389.0, 7204.0, 124636.0, 4036028.0, 20182.0, 2796.0, 679.0, 275.0, 113.0, 58.0, 41.0, 19.0, 18.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.41943359375, -16.6357421875, -15.85205078125, -15.068359375, -14.28466796875, -13.5009765625, -12.71728515625, -11.93359375, -11.14990234375, -10.3662109375, -9.58251953125, -8.798828125, -8.01513671875, -7.2314453125, -6.44775390625, -5.6640625, -4.88037109375, -4.0966796875, -3.31298828125, -2.529296875, -1.74560546875, -0.9619140625, -0.17822265625, 0.60546875, 1.38916015625, 2.1728515625, 2.95654296875, 3.740234375, 4.52392578125, 5.3076171875, 6.09130859375, 6.875, 7.65869140625, 8.4423828125, 9.22607421875, 10.009765625, 10.79345703125, 11.5771484375, 12.36083984375, 13.14453125, 13.92822265625, 14.7119140625, 15.49560546875, 16.279296875, 17.06298828125, 17.8466796875, 18.63037109375, 19.4140625, 20.19775390625, 20.9814453125, 21.76513671875, 22.548828125, 23.33251953125, 24.1162109375, 24.89990234375, 25.68359375, 26.46728515625, 27.2509765625, 28.03466796875, 28.818359375, 29.60205078125, 30.3857421875, 31.16943359375, 31.953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 9.0, 7.0, 13.0, 22.0, 24.0, 26.0, 41.0, 34.0, 54.0, 43.0, 45.0, 47.0, 61.0, 54.0, 61.0, 70.0, 46.0, 48.0, 49.0, 49.0, 29.0, 33.0, 19.0, 20.0, 24.0, 19.0, 11.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-7.22265625, -7.0313720703125, -6.840087890625, -6.6488037109375, -6.45751953125, -6.2662353515625, -6.074951171875, -5.8836669921875, -5.6923828125, -5.5010986328125, -5.309814453125, -5.1185302734375, -4.92724609375, -4.7359619140625, -4.544677734375, -4.3533935546875, -4.162109375, -3.9708251953125, -3.779541015625, -3.5882568359375, -3.39697265625, -3.2056884765625, -3.014404296875, -2.8231201171875, -2.6318359375, -2.4405517578125, -2.249267578125, -2.0579833984375, -1.86669921875, -1.6754150390625, -1.484130859375, -1.2928466796875, -1.1015625, -0.9102783203125, -0.718994140625, -0.5277099609375, -0.33642578125, -0.1451416015625, 0.046142578125, 0.2374267578125, 0.4287109375, 0.6199951171875, 0.811279296875, 1.0025634765625, 1.19384765625, 1.3851318359375, 1.576416015625, 1.7677001953125, 1.958984375, 2.1502685546875, 2.341552734375, 2.5328369140625, 2.72412109375, 2.9154052734375, 3.106689453125, 3.2979736328125, 3.4892578125, 3.6805419921875, 3.871826171875, 4.0631103515625, 4.25439453125, 4.4456787109375, 4.636962890625, 4.8282470703125, 5.01953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 10.0, 21.0, 32.0, 26.0, 48.0, 70.0, 95.0, 126.0, 185.0, 278.0, 456.0, 1165.0, 3515.0, 14701.0, 228286.0, 3900238.0, 35236.0, 6170.0, 1822.0, 710.0, 334.0, 200.0, 163.0, 87.0, 90.0, 57.0, 37.0, 34.0, 28.0, 18.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.734375, -21.1171875, -20.5, -19.8828125, -19.265625, -18.6484375, -18.03125, -17.4140625, -16.796875, -16.1796875, -15.5625, -14.9453125, -14.328125, -13.7109375, -13.09375, -12.4765625, -11.859375, -11.2421875, -10.625, -10.0078125, -9.390625, -8.7734375, -8.15625, -7.5390625, -6.921875, -6.3046875, -5.6875, -5.0703125, -4.453125, -3.8359375, -3.21875, -2.6015625, -1.984375, -1.3671875, -0.75, -0.1328125, 0.484375, 1.1015625, 1.71875, 2.3359375, 2.953125, 3.5703125, 4.1875, 4.8046875, 5.421875, 6.0390625, 6.65625, 7.2734375, 7.890625, 8.5078125, 9.125, 9.7421875, 10.359375, 10.9765625, 11.59375, 12.2109375, 12.828125, 13.4453125, 14.0625, 14.6796875, 15.296875, 15.9140625, 16.53125, 17.1484375, 17.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 5.0, 10.0, 26.0, 31.0, 45.0, 146.0, 569.0, 2714.0, 280.0, 95.0, 55.0, 21.0, 12.0, 14.0, 12.0, 9.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.359375, -4.14453125, -3.9296875, -3.71484375, -3.5, -3.28515625, -3.0703125, -2.85546875, -2.640625, -2.42578125, -2.2109375, -1.99609375, -1.78125, -1.56640625, -1.3515625, -1.13671875, -0.921875, -0.70703125, -0.4921875, -0.27734375, -0.0625, 0.15234375, 0.3671875, 0.58203125, 0.796875, 1.01171875, 1.2265625, 1.44140625, 1.65625, 1.87109375, 2.0859375, 2.30078125, 2.515625, 2.73046875, 2.9453125, 3.16015625, 3.375, 3.58984375, 3.8046875, 4.01953125, 4.234375, 4.44921875, 4.6640625, 4.87890625, 5.09375, 5.30859375, 5.5234375, 5.73828125, 5.953125, 6.16796875, 6.3828125, 6.59765625, 6.8125, 7.02734375, 7.2421875, 7.45703125, 7.671875, 7.88671875, 8.1015625, 8.31640625, 8.53125, 8.74609375, 8.9609375, 9.17578125, 9.390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 18.0, 43.0, 59.0, 111.0, 180.0, 178.0, 172.0, 105.0, 62.0, 24.0, 18.0, 14.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.73705291748047, -24.437726974487305, -23.13840103149414, -21.839075088500977, -20.539749145507812, -19.24042320251465, -17.941097259521484, -16.64177131652832, -15.342445373535156, -14.043119430541992, -12.743793487548828, -11.444467544555664, -10.1451416015625, -8.845815658569336, -7.546489715576172, -6.247163772583008, -4.947837829589844, -3.6485118865966797, -2.3491859436035156, -1.0498600006103516, 0.2494659423828125, 1.5487918853759766, 2.8481178283691406, 4.147443771362305, 5.446769714355469, 6.746095657348633, 8.045421600341797, 9.344747543334961, 10.644073486328125, 11.943399429321289, 13.242725372314453, 14.542051315307617, 15.841381072998047, 17.14070701599121, 18.440032958984375, 19.73935890197754, 21.038684844970703, 22.338010787963867, 23.63733673095703, 24.936662673950195, 26.23598861694336, 27.535314559936523, 28.834640502929688, 30.13396644592285, 31.433292388916016, 32.73262023925781, 34.031944274902344, 35.331268310546875, 36.63059616088867, 37.92992401123047, 39.229248046875, 40.52857208251953, 41.82789993286133, 43.127227783203125, 44.426551818847656, 45.72587585449219, 47.025203704833984, 48.32453155517578, 49.62385559082031, 50.923179626464844, 52.22250747680664, 53.52183532714844, 54.82115936279297, 56.1204833984375, 57.4198112487793]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 14.0, 11.0, 14.0, 17.0, 16.0, 34.0, 27.0, 29.0, 31.0, 38.0, 49.0, 48.0, 44.0, 49.0, 60.0, 43.0, 50.0, 38.0, 56.0, 37.0, 45.0, 27.0, 40.0, 24.0, 30.0, 29.0, 14.0, 13.0, 14.0, 8.0, 11.0, 8.0, 7.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.011672973632812, -14.417015075683594, -13.822356224060059, -13.227697372436523, -12.633039474487305, -12.038381576538086, -11.44372272491455, -10.849063873291016, -10.254405975341797, -9.659748077392578, -9.065089225769043, -8.470430374145508, -7.875772476196289, -7.281114101409912, -6.686455726623535, -6.091797351837158, -5.497138977050781, -4.902480602264404, -4.307822227478027, -3.7131638526916504, -3.1185054779052734, -2.5238471031188965, -1.9291887283325195, -1.3345303535461426, -0.7398719787597656, -0.14521360397338867, 0.4494447708129883, 1.0441031455993652, 1.6387615203857422, 2.233419895172119, 2.828078269958496, 3.422736644744873, 4.017393112182617, 4.612051486968994, 5.206709861755371, 5.801368236541748, 6.396026611328125, 6.990684986114502, 7.585343360900879, 8.180002212524414, 8.774660110473633, 9.369318008422852, 9.963976860046387, 10.558635711669922, 11.15329360961914, 11.74795150756836, 12.342610359191895, 12.93726921081543, 13.531927108764648, 14.126585006713867, 14.721243858337402, 15.315902709960938, 15.910560607910156, 16.505218505859375, 17.099876403808594, 17.694536209106445, 18.289194107055664, 18.883852005004883, 19.478511810302734, 20.073169708251953, 20.667827606201172, 21.26248550415039, 21.85714340209961, 22.45180320739746, 23.04646110534668]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 4.0, 7.0, 5.0, 14.0, 17.0, 35.0, 29.0, 55.0, 83.0, 122.0, 187.0, 249.0, 399.0, 639.0, 1141.0, 2219.0, 4517.0, 10278.0, 27920.0, 87801.0, 270955.0, 396687.0, 163082.0, 50667.0, 17272.0, 6848.0, 3133.0, 1647.0, 933.0, 586.0, 342.0, 214.0, 148.0, 99.0, 57.0, 37.0, 35.0, 17.0, 14.0, 13.0, 10.0, 10.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9140625, -8.6539306640625, -8.393798828125, -8.1336669921875, -7.87353515625, -7.6134033203125, -7.353271484375, -7.0931396484375, -6.8330078125, -6.5728759765625, -6.312744140625, -6.0526123046875, -5.79248046875, -5.5323486328125, -5.272216796875, -5.0120849609375, -4.751953125, -4.4918212890625, -4.231689453125, -3.9715576171875, -3.71142578125, -3.4512939453125, -3.191162109375, -2.9310302734375, -2.6708984375, -2.4107666015625, -2.150634765625, -1.8905029296875, -1.63037109375, -1.3702392578125, -1.110107421875, -0.8499755859375, -0.58984375, -0.3297119140625, -0.069580078125, 0.1905517578125, 0.45068359375, 0.7108154296875, 0.970947265625, 1.2310791015625, 1.4912109375, 1.7513427734375, 2.011474609375, 2.2716064453125, 2.53173828125, 2.7918701171875, 3.052001953125, 3.3121337890625, 3.572265625, 3.8323974609375, 4.092529296875, 4.3526611328125, 4.61279296875, 4.8729248046875, 5.133056640625, 5.3931884765625, 5.6533203125, 5.9134521484375, 6.173583984375, 6.4337158203125, 6.69384765625, 6.9539794921875, 7.214111328125, 7.4742431640625, 7.734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 0.0, 4.0, 2.0, 5.0, 3.0, 16.0, 4.0, 13.0, 10.0, 23.0, 30.0, 29.0, 41.0, 36.0, 52.0, 48.0, 60.0, 56.0, 69.0, 61.0, 58.0, 63.0, 50.0, 47.0, 40.0, 40.0, 38.0, 14.0, 22.0, 14.0, 7.0, 13.0, 15.0, 5.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5, -7.296142578125, -7.09228515625, -6.888427734375, -6.6845703125, -6.480712890625, -6.27685546875, -6.072998046875, -5.869140625, -5.665283203125, -5.46142578125, -5.257568359375, -5.0537109375, -4.849853515625, -4.64599609375, -4.442138671875, -4.23828125, -4.034423828125, -3.83056640625, -3.626708984375, -3.4228515625, -3.218994140625, -3.01513671875, -2.811279296875, -2.607421875, -2.403564453125, -2.19970703125, -1.995849609375, -1.7919921875, -1.588134765625, -1.38427734375, -1.180419921875, -0.9765625, -0.772705078125, -0.56884765625, -0.364990234375, -0.1611328125, 0.042724609375, 0.24658203125, 0.450439453125, 0.654296875, 0.858154296875, 1.06201171875, 1.265869140625, 1.4697265625, 1.673583984375, 1.87744140625, 2.081298828125, 2.28515625, 2.489013671875, 2.69287109375, 2.896728515625, 3.1005859375, 3.304443359375, 3.50830078125, 3.712158203125, 3.916015625, 4.119873046875, 4.32373046875, 4.527587890625, 4.7314453125, 4.935302734375, 5.13916015625, 5.343017578125, 5.546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 4.0, 9.0, 8.0, 12.0, 15.0, 22.0, 32.0, 50.0, 71.0, 127.0, 191.0, 390.0, 758.0, 2071.0, 8619.0, 100205.0, 835462.0, 89129.0, 7737.0, 1993.0, 746.0, 326.0, 185.0, 126.0, 78.0, 55.0, 36.0, 23.0, 17.0, 9.0, 12.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.015625, -18.37060546875, -17.7255859375, -17.08056640625, -16.435546875, -15.79052734375, -15.1455078125, -14.50048828125, -13.85546875, -13.21044921875, -12.5654296875, -11.92041015625, -11.275390625, -10.63037109375, -9.9853515625, -9.34033203125, -8.6953125, -8.05029296875, -7.4052734375, -6.76025390625, -6.115234375, -5.47021484375, -4.8251953125, -4.18017578125, -3.53515625, -2.89013671875, -2.2451171875, -1.60009765625, -0.955078125, -0.31005859375, 0.3349609375, 0.97998046875, 1.625, 2.27001953125, 2.9150390625, 3.56005859375, 4.205078125, 4.85009765625, 5.4951171875, 6.14013671875, 6.78515625, 7.43017578125, 8.0751953125, 8.72021484375, 9.365234375, 10.01025390625, 10.6552734375, 11.30029296875, 11.9453125, 12.59033203125, 13.2353515625, 13.88037109375, 14.525390625, 15.17041015625, 15.8154296875, 16.46044921875, 17.10546875, 17.75048828125, 18.3955078125, 19.04052734375, 19.685546875, 20.33056640625, 20.9755859375, 21.62060546875, 22.265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 9.0, 19.0, 26.0, 28.0, 25.0, 32.0, 48.0, 50.0, 46.0, 62.0, 48.0, 59.0, 56.0, 61.0, 45.0, 67.0, 54.0, 51.0, 32.0, 35.0, 18.0, 18.0, 25.0, 12.0, 12.0, 10.0, 13.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.921875, -29.079345703125, -28.23681640625, -27.394287109375, -26.5517578125, -25.709228515625, -24.86669921875, -24.024169921875, -23.181640625, -22.339111328125, -21.49658203125, -20.654052734375, -19.8115234375, -18.968994140625, -18.12646484375, -17.283935546875, -16.44140625, -15.598876953125, -14.75634765625, -13.913818359375, -13.0712890625, -12.228759765625, -11.38623046875, -10.543701171875, -9.701171875, -8.858642578125, -8.01611328125, -7.173583984375, -6.3310546875, -5.488525390625, -4.64599609375, -3.803466796875, -2.9609375, -2.118408203125, -1.27587890625, -0.433349609375, 0.4091796875, 1.251708984375, 2.09423828125, 2.936767578125, 3.779296875, 4.621826171875, 5.46435546875, 6.306884765625, 7.1494140625, 7.991943359375, 8.83447265625, 9.677001953125, 10.51953125, 11.362060546875, 12.20458984375, 13.047119140625, 13.8896484375, 14.732177734375, 15.57470703125, 16.417236328125, 17.259765625, 18.102294921875, 18.94482421875, 19.787353515625, 20.6298828125, 21.472412109375, 22.31494140625, 23.157470703125, 24.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 6.0, 13.0, 19.0, 15.0, 46.0, 68.0, 158.0, 375.0, 1175.0, 6710.0, 181758.0, 836023.0, 19009.0, 2147.0, 548.0, 215.0, 94.0, 52.0, 35.0, 15.0, 19.0, 10.0, 3.0, 11.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.3203125, -10.96875, -10.6171875, -10.265625, -9.9140625, -9.5625, -9.2109375, -8.859375, -8.5078125, -8.15625, -7.8046875, -7.453125, -7.1015625, -6.75, -6.3984375, -6.046875, -5.6953125, -5.34375, -4.9921875, -4.640625, -4.2890625, -3.9375, -3.5859375, -3.234375, -2.8828125, -2.53125, -2.1796875, -1.828125, -1.4765625, -1.125, -0.7734375, -0.421875, -0.0703125, 0.28125, 0.6328125, 0.984375, 1.3359375, 1.6875, 2.0390625, 2.390625, 2.7421875, 3.09375, 3.4453125, 3.796875, 4.1484375, 4.5, 4.8515625, 5.203125, 5.5546875, 5.90625, 6.2578125, 6.609375, 6.9609375, 7.3125, 7.6640625, 8.015625, 8.3671875, 8.71875, 9.0703125, 9.421875, 9.7734375, 10.125, 10.4765625, 10.828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 6.0, 6.0, 4.0, 4.0, 12.0, 8.0, 23.0, 16.0, 30.0, 36.0, 44.0, 59.0, 80.0, 100.0, 117.0, 102.0, 70.0, 68.0, 49.0, 33.0, 37.0, 21.0, 18.0, 15.0, 6.0, 3.0, 4.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.001312255859375, -0.0012772083282470703, -0.0012421607971191406, -0.001207113265991211, -0.0011720657348632812, -0.0011370182037353516, -0.0011019706726074219, -0.0010669231414794922, -0.0010318756103515625, -0.0009968280792236328, -0.0009617805480957031, -0.0009267330169677734, -0.0008916854858398438, -0.0008566379547119141, -0.0008215904235839844, -0.0007865428924560547, -0.000751495361328125, -0.0007164478302001953, -0.0006814002990722656, -0.0006463527679443359, -0.0006113052368164062, -0.0005762577056884766, -0.0005412101745605469, -0.0005061626434326172, -0.0004711151123046875, -0.0004360675811767578, -0.0004010200500488281, -0.00036597251892089844, -0.00033092498779296875, -0.00029587745666503906, -0.0002608299255371094, -0.0002257823944091797, -0.00019073486328125, -0.0001556873321533203, -0.00012063980102539062, -8.559226989746094e-05, -5.054473876953125e-05, -1.5497207641601562e-05, 1.9550323486328125e-05, 5.459785461425781e-05, 8.96453857421875e-05, 0.0001246929168701172, 0.00015974044799804688, 0.00019478797912597656, 0.00022983551025390625, 0.00026488304138183594, 0.0002999305725097656, 0.0003349781036376953, 0.000370025634765625, 0.0004050731658935547, 0.0004401206970214844, 0.00047516822814941406, 0.0005102157592773438, 0.0005452632904052734, 0.0005803108215332031, 0.0006153583526611328, 0.0006504058837890625, 0.0006854534149169922, 0.0007205009460449219, 0.0007555484771728516, 0.0007905960083007812, 0.0008256435394287109, 0.0008606910705566406, 0.0008957386016845703, 0.0009307861328125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 9.0, 26.0, 42.0, 117.0, 264.0, 705.0, 4349.0, 344566.0, 691064.0, 6067.0, 837.0, 271.0, 119.0, 46.0, 34.0, 15.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.158447265625, -15.58251953125, -15.006591796875, -14.4306640625, -13.854736328125, -13.27880859375, -12.702880859375, -12.126953125, -11.551025390625, -10.97509765625, -10.399169921875, -9.8232421875, -9.247314453125, -8.67138671875, -8.095458984375, -7.51953125, -6.943603515625, -6.36767578125, -5.791748046875, -5.2158203125, -4.639892578125, -4.06396484375, -3.488037109375, -2.912109375, -2.336181640625, -1.76025390625, -1.184326171875, -0.6083984375, -0.032470703125, 0.54345703125, 1.119384765625, 1.6953125, 2.271240234375, 2.84716796875, 3.423095703125, 3.9990234375, 4.574951171875, 5.15087890625, 5.726806640625, 6.302734375, 6.878662109375, 7.45458984375, 8.030517578125, 8.6064453125, 9.182373046875, 9.75830078125, 10.334228515625, 10.91015625, 11.486083984375, 12.06201171875, 12.637939453125, 13.2138671875, 13.789794921875, 14.36572265625, 14.941650390625, 15.517578125, 16.093505859375, 16.66943359375, 17.245361328125, 17.8212890625, 18.397216796875, 18.97314453125, 19.549072265625, 20.125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 12.0, 10.0, 43.0, 155.0, 335.0, 286.0, 113.0, 37.0, 14.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890625, -19.1767578125, -18.462890625, -17.7490234375, -17.03515625, -16.3212890625, -15.607421875, -14.8935546875, -14.1796875, -13.4658203125, -12.751953125, -12.0380859375, -11.32421875, -10.6103515625, -9.896484375, -9.1826171875, -8.46875, -7.7548828125, -7.041015625, -6.3271484375, -5.61328125, -4.8994140625, -4.185546875, -3.4716796875, -2.7578125, -2.0439453125, -1.330078125, -0.6162109375, 0.09765625, 0.8115234375, 1.525390625, 2.2392578125, 2.953125, 3.6669921875, 4.380859375, 5.0947265625, 5.80859375, 6.5224609375, 7.236328125, 7.9501953125, 8.6640625, 9.3779296875, 10.091796875, 10.8056640625, 11.51953125, 12.2333984375, 12.947265625, 13.6611328125, 14.375, 15.0888671875, 15.802734375, 16.5166015625, 17.23046875, 17.9443359375, 18.658203125, 19.3720703125, 20.0859375, 20.7998046875, 21.513671875, 22.2275390625, 22.94140625, 23.6552734375, 24.369140625, 25.0830078125, 25.796875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 16.0, 19.0, 47.0, 90.0, 152.0, 203.0, 211.0, 115.0, 70.0, 33.0, 15.0, 8.0, 10.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.285888671875, -169.7859344482422, -165.2859649658203, -160.7860107421875, -156.28604125976562, -151.7860870361328, -147.2861328125, -142.78616333007812, -138.2862091064453, -133.7862548828125, -129.28628540039062, -124.78633117675781, -120.28636932373047, -115.78640747070312, -111.28645324707031, -106.78649139404297, -102.28652954101562, -97.78656768798828, -93.28660583496094, -88.78665161132812, -84.28668975830078, -79.78672790527344, -75.28677368164062, -70.78681182861328, -66.28684997558594, -61.786888122558594, -57.286930084228516, -52.78697204589844, -48.287010192871094, -43.78704833984375, -39.28709030151367, -34.787132263183594, -30.28717041015625, -25.78721046447754, -21.287250518798828, -16.787290573120117, -12.287330627441406, -7.787370681762695, -3.2874107360839844, 1.2125492095947266, 5.7125091552734375, 10.212469100952148, 14.71242904663086, 19.21238899230957, 23.71234893798828, 28.212308883666992, 32.7122688293457, 37.21222686767578, 41.712188720703125, 46.21215057373047, 50.71210861206055, 55.212066650390625, 59.71202850341797, 64.21199035644531, 68.71194458007812, 73.21190643310547, 77.71186828613281, 82.21183013916016, 86.7117919921875, 91.21174621582031, 95.71170806884766, 100.211669921875, 104.71162414550781, 109.21158599853516, 113.7115478515625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 0.0, 5.0, 11.0, 8.0, 12.0, 18.0, 25.0, 20.0, 19.0, 23.0, 43.0, 38.0, 34.0, 56.0, 47.0, 68.0, 56.0, 64.0, 47.0, 62.0, 45.0, 54.0, 40.0, 37.0, 21.0, 30.0, 27.0, 17.0, 23.0, 11.0, 6.0, 6.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.69227600097656, -105.95861053466797, -102.22493743896484, -98.49127197265625, -94.75760650634766, -91.02393341064453, -87.29026794433594, -83.55659484863281, -79.82292938232422, -76.08926391601562, -72.3555908203125, -68.6219253540039, -64.88825988769531, -61.15458679199219, -57.420921325683594, -53.687252044677734, -49.95358657836914, -46.21991729736328, -42.48625183105469, -38.75258255004883, -35.01891326904297, -31.285245895385742, -27.551578521728516, -23.817909240722656, -20.08424186706543, -16.350574493408203, -12.616905212402344, -8.883237838745117, -5.149569511413574, -1.4159011840820312, 2.3177661895751953, 6.051435470581055, 9.785102844238281, 13.518771171569824, 17.252439498901367, 20.986106872558594, 24.719776153564453, 28.45344352722168, 32.187110900878906, 35.920780181884766, 39.654449462890625, 43.388118743896484, 47.12178421020508, 50.85545349121094, 54.5891227722168, 58.322792053222656, 62.05645751953125, 65.79013061523438, 69.52378845214844, 73.25745391845703, 76.99112701416016, 80.72479248046875, 84.45845794677734, 88.19213104248047, 91.92579650878906, 95.65946960449219, 99.39313507080078, 103.12680053710938, 106.8604736328125, 110.5941390991211, 114.32780456542969, 118.06147766113281, 121.7951431274414, 125.52880859375, 129.26248168945312]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 4.0, 7.0, 9.0, 19.0, 24.0, 39.0, 61.0, 119.0, 199.0, 368.0, 635.0, 1314.0, 2826.0, 7158.0, 22599.0, 147180.0, 2919787.0, 1007230.0, 61262.0, 14128.0, 5019.0, 2096.0, 1013.0, 544.0, 260.0, 159.0, 89.0, 56.0, 26.0, 20.0, 9.0, 9.0, 7.0, 3.0, 2.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.34100341796875, -9.0726318359375, -8.80426025390625, -8.535888671875, -8.26751708984375, -7.9991455078125, -7.73077392578125, -7.46240234375, -7.19403076171875, -6.9256591796875, -6.65728759765625, -6.388916015625, -6.12054443359375, -5.8521728515625, -5.58380126953125, -5.3154296875, -5.04705810546875, -4.7786865234375, -4.51031494140625, -4.241943359375, -3.97357177734375, -3.7052001953125, -3.43682861328125, -3.16845703125, -2.90008544921875, -2.6317138671875, -2.36334228515625, -2.094970703125, -1.82659912109375, -1.5582275390625, -1.28985595703125, -1.021484375, -0.75311279296875, -0.4847412109375, -0.21636962890625, 0.052001953125, 0.32037353515625, 0.5887451171875, 0.85711669921875, 1.12548828125, 1.39385986328125, 1.6622314453125, 1.93060302734375, 2.198974609375, 2.46734619140625, 2.7357177734375, 3.00408935546875, 3.2724609375, 3.54083251953125, 3.8092041015625, 4.07757568359375, 4.345947265625, 4.61431884765625, 4.8826904296875, 5.15106201171875, 5.41943359375, 5.68780517578125, 5.9561767578125, 6.22454833984375, 6.492919921875, 6.76129150390625, 7.0296630859375, 7.29803466796875, 7.56640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 1.0, 10.0, 6.0, 12.0, 17.0, 16.0, 19.0, 17.0, 21.0, 47.0, 37.0, 34.0, 39.0, 60.0, 58.0, 48.0, 51.0, 48.0, 65.0, 56.0, 39.0, 38.0, 37.0, 37.0, 40.0, 28.0, 23.0, 27.0, 15.0, 17.0, 9.0, 6.0, 7.0, 8.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-5.64453125, -5.483154296875, -5.32177734375, -5.160400390625, -4.9990234375, -4.837646484375, -4.67626953125, -4.514892578125, -4.353515625, -4.192138671875, -4.03076171875, -3.869384765625, -3.7080078125, -3.546630859375, -3.38525390625, -3.223876953125, -3.0625, -2.901123046875, -2.73974609375, -2.578369140625, -2.4169921875, -2.255615234375, -2.09423828125, -1.932861328125, -1.771484375, -1.610107421875, -1.44873046875, -1.287353515625, -1.1259765625, -0.964599609375, -0.80322265625, -0.641845703125, -0.48046875, -0.319091796875, -0.15771484375, 0.003662109375, 0.1650390625, 0.326416015625, 0.48779296875, 0.649169921875, 0.810546875, 0.971923828125, 1.13330078125, 1.294677734375, 1.4560546875, 1.617431640625, 1.77880859375, 1.940185546875, 2.1015625, 2.262939453125, 2.42431640625, 2.585693359375, 2.7470703125, 2.908447265625, 3.06982421875, 3.231201171875, 3.392578125, 3.553955078125, 3.71533203125, 3.876708984375, 4.0380859375, 4.199462890625, 4.36083984375, 4.522216796875, 4.68359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 16.0, 14.0, 18.0, 23.0, 40.0, 62.0, 103.0, 182.0, 327.0, 650.0, 1552.0, 4005.0, 12067.0, 48019.0, 487735.0, 3435559.0, 162891.0, 27475.0, 8111.0, 2952.0, 1268.0, 555.0, 246.0, 128.0, 74.0, 64.0, 28.0, 19.0, 21.0, 15.0, 3.0, 11.0, 5.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.5579833984375, -10.209716796875, -9.8614501953125, -9.51318359375, -9.1649169921875, -8.816650390625, -8.4683837890625, -8.1201171875, -7.7718505859375, -7.423583984375, -7.0753173828125, -6.72705078125, -6.3787841796875, -6.030517578125, -5.6822509765625, -5.333984375, -4.9857177734375, -4.637451171875, -4.2891845703125, -3.94091796875, -3.5926513671875, -3.244384765625, -2.8961181640625, -2.5478515625, -2.1995849609375, -1.851318359375, -1.5030517578125, -1.15478515625, -0.8065185546875, -0.458251953125, -0.1099853515625, 0.23828125, 0.5865478515625, 0.934814453125, 1.2830810546875, 1.63134765625, 1.9796142578125, 2.327880859375, 2.6761474609375, 3.0244140625, 3.3726806640625, 3.720947265625, 4.0692138671875, 4.41748046875, 4.7657470703125, 5.114013671875, 5.4622802734375, 5.810546875, 6.1588134765625, 6.507080078125, 6.8553466796875, 7.20361328125, 7.5518798828125, 7.900146484375, 8.2484130859375, 8.5966796875, 8.9449462890625, 9.293212890625, 9.6414794921875, 9.98974609375, 10.3380126953125, 10.686279296875, 11.0345458984375, 11.3828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 4.0, 15.0, 24.0, 21.0, 46.0, 64.0, 86.0, 142.0, 232.0, 483.0, 842.0, 889.0, 516.0, 256.0, 151.0, 66.0, 47.0, 35.0, 31.0, 22.0, 20.0, 11.0, 9.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.1578369140625, -7.831298828125, -7.5047607421875, -7.17822265625, -6.8516845703125, -6.525146484375, -6.1986083984375, -5.8720703125, -5.5455322265625, -5.218994140625, -4.8924560546875, -4.56591796875, -4.2393798828125, -3.912841796875, -3.5863037109375, -3.259765625, -2.9332275390625, -2.606689453125, -2.2801513671875, -1.95361328125, -1.6270751953125, -1.300537109375, -0.9739990234375, -0.6474609375, -0.3209228515625, 0.005615234375, 0.3321533203125, 0.65869140625, 0.9852294921875, 1.311767578125, 1.6383056640625, 1.96484375, 2.2913818359375, 2.617919921875, 2.9444580078125, 3.27099609375, 3.5975341796875, 3.924072265625, 4.2506103515625, 4.5771484375, 4.9036865234375, 5.230224609375, 5.5567626953125, 5.88330078125, 6.2098388671875, 6.536376953125, 6.8629150390625, 7.189453125, 7.5159912109375, 7.842529296875, 8.1690673828125, 8.49560546875, 8.8221435546875, 9.148681640625, 9.4752197265625, 9.8017578125, 10.1282958984375, 10.454833984375, 10.7813720703125, 11.10791015625, 11.4344482421875, 11.760986328125, 12.0875244140625, 12.4140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 32.0, 125.0, 244.0, 333.0, 188.0, 39.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-301.28814697265625, -295.3007507324219, -289.3133850097656, -283.32598876953125, -277.338623046875, -271.3512268066406, -265.36383056640625, -259.37646484375, -253.38906860351562, -247.4016876220703, -241.414306640625, -235.42691040039062, -229.4395294189453, -223.4521484375, -217.46475219726562, -211.4773712158203, -205.489990234375, -199.5026092529297, -193.51522827148438, -187.52783203125, -181.5404510498047, -175.55307006835938, -169.565673828125, -163.5782928466797, -157.59091186523438, -151.60353088378906, -145.61614990234375, -139.62875366210938, -133.64137268066406, -127.65399169921875, -121.6666030883789, -115.67921447753906, -109.69182586669922, -103.70443725585938, -97.71705627441406, -91.72967529296875, -85.7422866821289, -79.75489807128906, -73.76751708984375, -67.78013610839844, -61.792747497558594, -55.805362701416016, -49.81797790527344, -43.83059310913086, -37.84320831298828, -31.855823516845703, -25.868438720703125, -19.881053924560547, -13.893669128417969, -7.906284332275391, -1.9188995361328125, 4.068485260009766, 10.055870056152344, 16.043254852294922, 22.0306396484375, 28.018024444580078, 34.005409240722656, 39.992794036865234, 45.98017883300781, 51.96756362915039, 57.95494842529297, 63.94233322143555, 69.92971801757812, 75.91709899902344, 81.90448760986328]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 8.0, 9.0, 13.0, 12.0, 11.0, 24.0, 27.0, 21.0, 28.0, 49.0, 28.0, 51.0, 35.0, 43.0, 51.0, 47.0, 32.0, 41.0, 63.0, 58.0, 40.0, 30.0, 33.0, 36.0, 38.0, 34.0, 25.0, 23.0, 19.0, 11.0, 10.0, 4.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.74684524536133, -46.208980560302734, -44.671119689941406, -43.13325500488281, -41.59539031982422, -40.057525634765625, -38.51966094970703, -36.9818000793457, -35.44393539428711, -33.906070709228516, -32.36820983886719, -30.830345153808594, -29.29248046875, -27.754615783691406, -26.216753005981445, -24.678890228271484, -23.14102554321289, -21.603160858154297, -20.065298080444336, -18.527435302734375, -16.98957061767578, -15.451706886291504, -13.913843154907227, -12.37597942352295, -10.838115692138672, -9.300251960754395, -7.762388229370117, -6.22452449798584, -4.6866607666015625, -3.148797035217285, -1.6109333038330078, -0.07306957244873047, 1.4647903442382812, 3.0026540756225586, 4.540517807006836, 6.078381538391113, 7.616245269775391, 9.154109001159668, 10.691972732543945, 12.229836463928223, 13.7677001953125, 15.305563926696777, 16.843427658081055, 18.381290435791016, 19.91915512084961, 21.457019805908203, 22.994882583618164, 24.532745361328125, 26.07061004638672, 27.608474731445312, 29.146337509155273, 30.684200286865234, 32.22206497192383, 33.75992965698242, 35.29779052734375, 36.835655212402344, 38.37351989746094, 39.91138458251953, 41.449249267578125, 42.98711013793945, 44.52497482299805, 46.06283950805664, 47.60070037841797, 49.13856506347656, 50.676429748535156]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 12.0, 6.0, 12.0, 19.0, 38.0, 51.0, 80.0, 106.0, 143.0, 239.0, 321.0, 531.0, 878.0, 1612.0, 2673.0, 4711.0, 8903.0, 17802.0, 35865.0, 73589.0, 151784.0, 272341.0, 237262.0, 121259.0, 58674.0, 28477.0, 14252.0, 7248.0, 3973.0, 2182.0, 1308.0, 762.0, 455.0, 345.0, 209.0, 151.0, 92.0, 52.0, 40.0, 29.0, 25.0, 11.0, 9.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.80078125, -4.65460205078125, -4.5084228515625, -4.36224365234375, -4.216064453125, -4.06988525390625, -3.9237060546875, -3.77752685546875, -3.63134765625, -3.48516845703125, -3.3389892578125, -3.19281005859375, -3.046630859375, -2.90045166015625, -2.7542724609375, -2.60809326171875, -2.4619140625, -2.31573486328125, -2.1695556640625, -2.02337646484375, -1.877197265625, -1.73101806640625, -1.5848388671875, -1.43865966796875, -1.29248046875, -1.14630126953125, -1.0001220703125, -0.85394287109375, -0.707763671875, -0.56158447265625, -0.4154052734375, -0.26922607421875, -0.123046875, 0.02313232421875, 0.1693115234375, 0.31549072265625, 0.461669921875, 0.60784912109375, 0.7540283203125, 0.90020751953125, 1.04638671875, 1.19256591796875, 1.3387451171875, 1.48492431640625, 1.631103515625, 1.77728271484375, 1.9234619140625, 2.06964111328125, 2.2158203125, 2.36199951171875, 2.5081787109375, 2.65435791015625, 2.800537109375, 2.94671630859375, 3.0928955078125, 3.23907470703125, 3.38525390625, 3.53143310546875, 3.6776123046875, 3.82379150390625, 3.969970703125, 4.11614990234375, 4.2623291015625, 4.40850830078125, 4.5546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 9.0, 6.0, 6.0, 15.0, 10.0, 16.0, 19.0, 21.0, 28.0, 24.0, 30.0, 30.0, 36.0, 33.0, 37.0, 52.0, 50.0, 43.0, 47.0, 45.0, 43.0, 51.0, 39.0, 41.0, 39.0, 24.0, 36.0, 23.0, 28.0, 18.0, 22.0, 24.0, 17.0, 9.0, 13.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.62109375, -4.4796142578125, -4.338134765625, -4.1966552734375, -4.05517578125, -3.9136962890625, -3.772216796875, -3.6307373046875, -3.4892578125, -3.3477783203125, -3.206298828125, -3.0648193359375, -2.92333984375, -2.7818603515625, -2.640380859375, -2.4989013671875, -2.357421875, -2.2159423828125, -2.074462890625, -1.9329833984375, -1.79150390625, -1.6500244140625, -1.508544921875, -1.3670654296875, -1.2255859375, -1.0841064453125, -0.942626953125, -0.8011474609375, -0.65966796875, -0.5181884765625, -0.376708984375, -0.2352294921875, -0.09375, 0.0477294921875, 0.189208984375, 0.3306884765625, 0.47216796875, 0.6136474609375, 0.755126953125, 0.8966064453125, 1.0380859375, 1.1795654296875, 1.321044921875, 1.4625244140625, 1.60400390625, 1.7454833984375, 1.886962890625, 2.0284423828125, 2.169921875, 2.3114013671875, 2.452880859375, 2.5943603515625, 2.73583984375, 2.8773193359375, 3.018798828125, 3.1602783203125, 3.3017578125, 3.4432373046875, 3.584716796875, 3.7261962890625, 3.86767578125, 4.0091552734375, 4.150634765625, 4.2921142578125, 4.43359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 6.0, 12.0, 11.0, 18.0, 49.0, 41.0, 91.0, 169.0, 282.0, 492.0, 1114.0, 3025.0, 19929.0, 469168.0, 527873.0, 20706.0, 3192.0, 1092.0, 518.0, 292.0, 162.0, 97.0, 59.0, 30.0, 25.0, 20.0, 19.0, 12.0, 14.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.078125, -21.428955078125, -20.77978515625, -20.130615234375, -19.4814453125, -18.832275390625, -18.18310546875, -17.533935546875, -16.884765625, -16.235595703125, -15.58642578125, -14.937255859375, -14.2880859375, -13.638916015625, -12.98974609375, -12.340576171875, -11.69140625, -11.042236328125, -10.39306640625, -9.743896484375, -9.0947265625, -8.445556640625, -7.79638671875, -7.147216796875, -6.498046875, -5.848876953125, -5.19970703125, -4.550537109375, -3.9013671875, -3.252197265625, -2.60302734375, -1.953857421875, -1.3046875, -0.655517578125, -0.00634765625, 0.642822265625, 1.2919921875, 1.941162109375, 2.59033203125, 3.239501953125, 3.888671875, 4.537841796875, 5.18701171875, 5.836181640625, 6.4853515625, 7.134521484375, 7.78369140625, 8.432861328125, 9.08203125, 9.731201171875, 10.38037109375, 11.029541015625, 11.6787109375, 12.327880859375, 12.97705078125, 13.626220703125, 14.275390625, 14.924560546875, 15.57373046875, 16.222900390625, 16.8720703125, 17.521240234375, 18.17041015625, 18.819580078125, 19.46875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 10.0, 4.0, 8.0, 14.0, 4.0, 14.0, 14.0, 19.0, 13.0, 23.0, 26.0, 36.0, 32.0, 44.0, 42.0, 52.0, 49.0, 50.0, 48.0, 47.0, 44.0, 56.0, 48.0, 51.0, 36.0, 39.0, 31.0, 27.0, 17.0, 18.0, 14.0, 17.0, 12.0, 10.0, 8.0, 4.0, 1.0, 4.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.734375, -21.07275390625, -20.4111328125, -19.74951171875, -19.087890625, -18.42626953125, -17.7646484375, -17.10302734375, -16.44140625, -15.77978515625, -15.1181640625, -14.45654296875, -13.794921875, -13.13330078125, -12.4716796875, -11.81005859375, -11.1484375, -10.48681640625, -9.8251953125, -9.16357421875, -8.501953125, -7.84033203125, -7.1787109375, -6.51708984375, -5.85546875, -5.19384765625, -4.5322265625, -3.87060546875, -3.208984375, -2.54736328125, -1.8857421875, -1.22412109375, -0.5625, 0.09912109375, 0.7607421875, 1.42236328125, 2.083984375, 2.74560546875, 3.4072265625, 4.06884765625, 4.73046875, 5.39208984375, 6.0537109375, 6.71533203125, 7.376953125, 8.03857421875, 8.7001953125, 9.36181640625, 10.0234375, 10.68505859375, 11.3466796875, 12.00830078125, 12.669921875, 13.33154296875, 13.9931640625, 14.65478515625, 15.31640625, 15.97802734375, 16.6396484375, 17.30126953125, 17.962890625, 18.62451171875, 19.2861328125, 19.94775390625, 20.609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 6.0, 12.0, 24.0, 26.0, 44.0, 81.0, 118.0, 255.0, 626.0, 2045.0, 12326.0, 279040.0, 729075.0, 20539.0, 2851.0, 808.0, 304.0, 152.0, 68.0, 47.0, 45.0, 11.0, 15.0, 10.0, 4.0, 5.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.256591796875, -8.92724609375, -8.597900390625, -8.2685546875, -7.939208984375, -7.60986328125, -7.280517578125, -6.951171875, -6.621826171875, -6.29248046875, -5.963134765625, -5.6337890625, -5.304443359375, -4.97509765625, -4.645751953125, -4.31640625, -3.987060546875, -3.65771484375, -3.328369140625, -2.9990234375, -2.669677734375, -2.34033203125, -2.010986328125, -1.681640625, -1.352294921875, -1.02294921875, -0.693603515625, -0.3642578125, -0.034912109375, 0.29443359375, 0.623779296875, 0.953125, 1.282470703125, 1.61181640625, 1.941162109375, 2.2705078125, 2.599853515625, 2.92919921875, 3.258544921875, 3.587890625, 3.917236328125, 4.24658203125, 4.575927734375, 4.9052734375, 5.234619140625, 5.56396484375, 5.893310546875, 6.22265625, 6.552001953125, 6.88134765625, 7.210693359375, 7.5400390625, 7.869384765625, 8.19873046875, 8.528076171875, 8.857421875, 9.186767578125, 9.51611328125, 9.845458984375, 10.1748046875, 10.504150390625, 10.83349609375, 11.162841796875, 11.4921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 7.0, 20.0, 12.0, 13.0, 32.0, 35.0, 46.0, 64.0, 103.0, 170.0, 148.0, 84.0, 64.0, 43.0, 33.0, 19.0, 18.0, 18.0, 13.0, 12.0, 8.0, 10.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016412734985351562, -0.001597866415977478, -0.0015544593334197998, -0.0015110522508621216, -0.0014676451683044434, -0.0014242380857467651, -0.001380831003189087, -0.0013374239206314087, -0.0012940168380737305, -0.0012506097555160522, -0.001207202672958374, -0.0011637955904006958, -0.0011203885078430176, -0.0010769814252853394, -0.0010335743427276611, -0.000990167260169983, -0.0009467601776123047, -0.0009033530950546265, -0.0008599460124969482, -0.00081653892993927, -0.0007731318473815918, -0.0007297247648239136, -0.0006863176822662354, -0.0006429105997085571, -0.0005995035171508789, -0.0005560964345932007, -0.0005126893520355225, -0.00046928226947784424, -0.000425875186920166, -0.0003824681043624878, -0.00033906102180480957, -0.00029565393924713135, -0.0002522468566894531, -0.0002088397741317749, -0.00016543269157409668, -0.00012202560901641846, -7.861852645874023e-05, -3.521144390106201e-05, 8.195638656616211e-06, 5.1602721214294434e-05, 9.500980377197266e-05, 0.00013841688632965088, 0.0001818239688873291, 0.00022523105144500732, 0.00026863813400268555, 0.00031204521656036377, 0.000355452299118042, 0.0003988593816757202, 0.00044226646423339844, 0.00048567354679107666, 0.0005290806293487549, 0.0005724877119064331, 0.0006158947944641113, 0.0006593018770217896, 0.0007027089595794678, 0.000746116042137146, 0.0007895231246948242, 0.0008329302072525024, 0.0008763372898101807, 0.0009197443723678589, 0.0009631514549255371, 0.0010065585374832153, 0.0010499656200408936, 0.0010933727025985718, 0.00113677978515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 16.0, 17.0, 43.0, 43.0, 73.0, 144.0, 225.0, 448.0, 945.0, 2598.0, 10818.0, 85530.0, 829588.0, 100775.0, 12385.0, 2791.0, 1022.0, 471.0, 259.0, 144.0, 76.0, 39.0, 28.0, 23.0, 17.0, 10.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1796875, -8.8790283203125, -8.578369140625, -8.2777099609375, -7.97705078125, -7.6763916015625, -7.375732421875, -7.0750732421875, -6.7744140625, -6.4737548828125, -6.173095703125, -5.8724365234375, -5.57177734375, -5.2711181640625, -4.970458984375, -4.6697998046875, -4.369140625, -4.0684814453125, -3.767822265625, -3.4671630859375, -3.16650390625, -2.8658447265625, -2.565185546875, -2.2645263671875, -1.9638671875, -1.6632080078125, -1.362548828125, -1.0618896484375, -0.76123046875, -0.4605712890625, -0.159912109375, 0.1407470703125, 0.44140625, 0.7420654296875, 1.042724609375, 1.3433837890625, 1.64404296875, 1.9447021484375, 2.245361328125, 2.5460205078125, 2.8466796875, 3.1473388671875, 3.447998046875, 3.7486572265625, 4.04931640625, 4.3499755859375, 4.650634765625, 4.9512939453125, 5.251953125, 5.5526123046875, 5.853271484375, 6.1539306640625, 6.45458984375, 6.7552490234375, 7.055908203125, 7.3565673828125, 7.6572265625, 7.9578857421875, 8.258544921875, 8.5592041015625, 8.85986328125, 9.1605224609375, 9.461181640625, 9.7618408203125, 10.0625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 12.0, 11.0, 19.0, 21.0, 37.0, 61.0, 69.0, 95.0, 124.0, 128.0, 103.0, 91.0, 58.0, 51.0, 32.0, 19.0, 20.0, 13.0, 12.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.75262451171875, -11.4739990234375, -11.19537353515625, -10.916748046875, -10.63812255859375, -10.3594970703125, -10.08087158203125, -9.80224609375, -9.52362060546875, -9.2449951171875, -8.96636962890625, -8.687744140625, -8.40911865234375, -8.1304931640625, -7.85186767578125, -7.5732421875, -7.29461669921875, -7.0159912109375, -6.73736572265625, -6.458740234375, -6.18011474609375, -5.9014892578125, -5.62286376953125, -5.34423828125, -5.06561279296875, -4.7869873046875, -4.50836181640625, -4.229736328125, -3.95111083984375, -3.6724853515625, -3.39385986328125, -3.115234375, -2.83660888671875, -2.5579833984375, -2.27935791015625, -2.000732421875, -1.72210693359375, -1.4434814453125, -1.16485595703125, -0.88623046875, -0.60760498046875, -0.3289794921875, -0.05035400390625, 0.228271484375, 0.50689697265625, 0.7855224609375, 1.06414794921875, 1.3427734375, 1.62139892578125, 1.9000244140625, 2.17864990234375, 2.457275390625, 2.73590087890625, 3.0145263671875, 3.29315185546875, 3.57177734375, 3.85040283203125, 4.1290283203125, 4.40765380859375, 4.686279296875, 4.96490478515625, 5.2435302734375, 5.52215576171875, 5.80078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 7.0, 7.0, 29.0, 69.0, 173.0, 286.0, 230.0, 123.0, 44.0, 17.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-263.8902282714844, -258.71234130859375, -253.5344696044922, -248.35658264160156, -243.17869567871094, -238.00082397460938, -232.82293701171875, -227.64505004882812, -222.4671630859375, -217.28927612304688, -212.1114044189453, -206.9335174560547, -201.75563049316406, -196.5777587890625, -191.39987182617188, -186.22198486328125, -181.0441131591797, -175.86622619628906, -170.6883544921875, -165.51046752929688, -160.33258056640625, -155.15469360351562, -149.97682189941406, -144.79893493652344, -139.62106323242188, -134.44317626953125, -129.2653045654297, -124.08741760253906, -118.90953063964844, -113.73165130615234, -108.55377197265625, -103.37588500976562, -98.19800567626953, -93.02012634277344, -87.84223937988281, -82.66436004638672, -77.48648071289062, -72.30859375, -67.1307144165039, -61.95283126831055, -56.77494812011719, -51.59706497192383, -46.41918182373047, -41.241302490234375, -36.063419342041016, -30.885536193847656, -25.70765495300293, -20.529773712158203, -15.351890563964844, -10.1740083694458, -4.996126174926758, 0.18175601959228516, 5.359638214111328, 10.537521362304688, 15.715402603149414, 20.89328384399414, 26.0711669921875, 31.24905014038086, 36.42693328857422, 41.60481262207031, 46.78269577026367, 51.96057891845703, 57.138458251953125, 62.316341400146484, 67.49422454833984]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 5.0, 4.0, 8.0, 9.0, 11.0, 16.0, 25.0, 19.0, 21.0, 24.0, 32.0, 28.0, 28.0, 42.0, 39.0, 44.0, 42.0, 42.0, 59.0, 44.0, 49.0, 44.0, 39.0, 37.0, 32.0, 35.0, 27.0, 32.0, 32.0, 20.0, 14.0, 19.0, 10.0, 10.0, 8.0, 6.0, 5.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-70.36729431152344, -68.22250366210938, -66.07771301269531, -63.93292236328125, -61.78813171386719, -59.643341064453125, -57.49855422973633, -55.353763580322266, -53.2089729309082, -51.06418228149414, -48.91939163208008, -46.774600982666016, -44.62981414794922, -42.485023498535156, -40.340232849121094, -38.19544219970703, -36.05065155029297, -33.905860900878906, -31.761070251464844, -29.616281509399414, -27.47149085998535, -25.32670021057129, -23.18191146850586, -21.037120819091797, -18.892330169677734, -16.747539520263672, -14.602749824523926, -12.45796012878418, -10.313169479370117, -8.168378829956055, -6.023589134216309, -3.8787994384765625, -1.7340087890625, 0.4107813835144043, 2.5555715560913086, 4.700361728668213, 6.845151901245117, 8.98994255065918, 11.134732246398926, 13.279521942138672, 15.424312591552734, 17.569103240966797, 19.71389389038086, 21.85868263244629, 24.00347328186035, 26.148263931274414, 28.293052673339844, 30.437843322753906, 32.58263397216797, 34.72742462158203, 36.872215270996094, 39.017005920410156, 41.16179656982422, 43.30658721923828, 45.45137405395508, 47.59616470336914, 49.7409553527832, 51.885746002197266, 54.03053665161133, 56.17532730102539, 58.32011413574219, 60.46490478515625, 62.60969543457031, 64.75448608398438, 66.89927673339844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 12.0, 6.0, 8.0, 13.0, 22.0, 35.0, 40.0, 57.0, 81.0, 129.0, 176.0, 502.0, 7916.0, 4156474.0, 27321.0, 785.0, 243.0, 146.0, 82.0, 59.0, 45.0, 24.0, 24.0, 18.0, 13.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-51.0, -49.607421875, -48.21484375, -46.822265625, -45.4296875, -44.037109375, -42.64453125, -41.251953125, -39.859375, -38.466796875, -37.07421875, -35.681640625, -34.2890625, -32.896484375, -31.50390625, -30.111328125, -28.71875, -27.326171875, -25.93359375, -24.541015625, -23.1484375, -21.755859375, -20.36328125, -18.970703125, -17.578125, -16.185546875, -14.79296875, -13.400390625, -12.0078125, -10.615234375, -9.22265625, -7.830078125, -6.4375, -5.044921875, -3.65234375, -2.259765625, -0.8671875, 0.525390625, 1.91796875, 3.310546875, 4.703125, 6.095703125, 7.48828125, 8.880859375, 10.2734375, 11.666015625, 13.05859375, 14.451171875, 15.84375, 17.236328125, 18.62890625, 20.021484375, 21.4140625, 22.806640625, 24.19921875, 25.591796875, 26.984375, 28.376953125, 29.76953125, 31.162109375, 32.5546875, 33.947265625, 35.33984375, 36.732421875, 38.125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 10.0, 16.0, 21.0, 29.0, 38.0, 49.0, 45.0, 68.0, 62.0, 81.0, 86.0, 82.0, 112.0, 77.0, 53.0, 53.0, 40.0, 30.0, 17.0, 12.0, 7.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.8763427734375, -7.627685546875, -7.3790283203125, -7.13037109375, -6.8817138671875, -6.633056640625, -6.3843994140625, -6.1357421875, -5.8870849609375, -5.638427734375, -5.3897705078125, -5.14111328125, -4.8924560546875, -4.643798828125, -4.3951416015625, -4.146484375, -3.8978271484375, -3.649169921875, -3.4005126953125, -3.15185546875, -2.9031982421875, -2.654541015625, -2.4058837890625, -2.1572265625, -1.9085693359375, -1.659912109375, -1.4112548828125, -1.16259765625, -0.9139404296875, -0.665283203125, -0.4166259765625, -0.16796875, 0.0806884765625, 0.329345703125, 0.5780029296875, 0.82666015625, 1.0753173828125, 1.323974609375, 1.5726318359375, 1.8212890625, 2.0699462890625, 2.318603515625, 2.5672607421875, 2.81591796875, 3.0645751953125, 3.313232421875, 3.5618896484375, 3.810546875, 4.0592041015625, 4.307861328125, 4.5565185546875, 4.80517578125, 5.0538330078125, 5.302490234375, 5.5511474609375, 5.7998046875, 6.0484619140625, 6.297119140625, 6.5457763671875, 6.79443359375, 7.0430908203125, 7.291748046875, 7.5404052734375, 7.7890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 15.0, 25.0, 26.0, 42.0, 86.0, 148.0, 251.0, 481.0, 882.0, 1862.0, 3928.0, 10466.0, 35082.0, 238416.0, 3240534.0, 579594.0, 57287.0, 15000.0, 5387.0, 2332.0, 1093.0, 599.0, 323.0, 169.0, 116.0, 48.0, 30.0, 20.0, 13.0, 5.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.8687744140625, -7.573486328125, -7.2781982421875, -6.98291015625, -6.6876220703125, -6.392333984375, -6.0970458984375, -5.8017578125, -5.5064697265625, -5.211181640625, -4.9158935546875, -4.62060546875, -4.3253173828125, -4.030029296875, -3.7347412109375, -3.439453125, -3.1441650390625, -2.848876953125, -2.5535888671875, -2.25830078125, -1.9630126953125, -1.667724609375, -1.3724365234375, -1.0771484375, -0.7818603515625, -0.486572265625, -0.1912841796875, 0.10400390625, 0.3992919921875, 0.694580078125, 0.9898681640625, 1.28515625, 1.5804443359375, 1.875732421875, 2.1710205078125, 2.46630859375, 2.7615966796875, 3.056884765625, 3.3521728515625, 3.6474609375, 3.9427490234375, 4.238037109375, 4.5333251953125, 4.82861328125, 5.1239013671875, 5.419189453125, 5.7144775390625, 6.009765625, 6.3050537109375, 6.600341796875, 6.8956298828125, 7.19091796875, 7.4862060546875, 7.781494140625, 8.0767822265625, 8.3720703125, 8.6673583984375, 8.962646484375, 9.2579345703125, 9.55322265625, 9.8485107421875, 10.143798828125, 10.4390869140625, 10.734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 7.0, 14.0, 8.0, 10.0, 13.0, 18.0, 28.0, 44.0, 85.0, 168.0, 331.0, 709.0, 1008.0, 782.0, 354.0, 194.0, 99.0, 74.0, 37.0, 31.0, 18.0, 13.0, 10.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-14.0859375, -13.7210693359375, -13.356201171875, -12.9913330078125, -12.62646484375, -12.2615966796875, -11.896728515625, -11.5318603515625, -11.1669921875, -10.8021240234375, -10.437255859375, -10.0723876953125, -9.70751953125, -9.3426513671875, -8.977783203125, -8.6129150390625, -8.248046875, -7.8831787109375, -7.518310546875, -7.1534423828125, -6.78857421875, -6.4237060546875, -6.058837890625, -5.6939697265625, -5.3291015625, -4.9642333984375, -4.599365234375, -4.2344970703125, -3.86962890625, -3.5047607421875, -3.139892578125, -2.7750244140625, -2.41015625, -2.0452880859375, -1.680419921875, -1.3155517578125, -0.95068359375, -0.5858154296875, -0.220947265625, 0.1439208984375, 0.5087890625, 0.8736572265625, 1.238525390625, 1.6033935546875, 1.96826171875, 2.3331298828125, 2.697998046875, 3.0628662109375, 3.427734375, 3.7926025390625, 4.157470703125, 4.5223388671875, 4.88720703125, 5.2520751953125, 5.616943359375, 5.9818115234375, 6.3466796875, 6.7115478515625, 7.076416015625, 7.4412841796875, 7.80615234375, 8.1710205078125, 8.535888671875, 8.9007568359375, 9.265625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 30.0, 58.0, 203.0, 311.0, 212.0, 100.0, 42.0, 16.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.87675476074219, -81.71676635742188, -77.55677795410156, -73.39678955078125, -69.23680877685547, -65.07682037353516, -60.916831970214844, -56.75684356689453, -52.596858978271484, -48.43687057495117, -44.276885986328125, -40.11689758300781, -35.9569091796875, -31.796924591064453, -27.63693618774414, -23.47694969177246, -19.31696319580078, -15.156976699829102, -10.996989250183105, -6.837001800537109, -2.6770153045654297, 1.48297119140625, 5.6429595947265625, 9.802946090698242, 13.962932586669922, 18.1229190826416, 22.28290557861328, 26.442893981933594, 30.602880477905273, 34.76286697387695, 38.922855377197266, 43.08283996582031, 47.242828369140625, 51.40281677246094, 55.562801361083984, 59.7227897644043, 63.882774353027344, 68.04276275634766, 72.20275115966797, 76.36273956298828, 80.52272033691406, 84.68270874023438, 88.84269714355469, 93.002685546875, 97.16266632080078, 101.3226547241211, 105.4826431274414, 109.64263153076172, 113.80261993408203, 117.96260833740234, 122.12259674072266, 126.28257751464844, 130.44256591796875, 134.60255432128906, 138.76254272460938, 142.9225311279297, 147.08251953125, 151.2425079345703, 155.40249633789062, 159.56248474121094, 163.72247314453125, 167.8824462890625, 172.04244995117188, 176.20242309570312, 180.36241149902344]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 10.0, 8.0, 12.0, 15.0, 19.0, 16.0, 18.0, 25.0, 39.0, 41.0, 47.0, 39.0, 55.0, 55.0, 36.0, 59.0, 67.0, 59.0, 54.0, 45.0, 50.0, 31.0, 44.0, 32.0, 29.0, 19.0, 17.0, 14.0, 4.0, 6.0, 11.0, 8.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.28738021850586, -47.83977508544922, -46.39216995239258, -44.94456481933594, -43.4969596862793, -42.049354553222656, -40.60174560546875, -39.154144287109375, -37.70653533935547, -36.25893020629883, -34.81132507324219, -33.36371994018555, -31.916114807128906, -30.468509674072266, -29.020902633666992, -27.57329750061035, -26.125694274902344, -24.678089141845703, -23.230484008789062, -21.782878875732422, -20.33527374267578, -18.88766860961914, -17.440061569213867, -15.992456436157227, -14.544851303100586, -13.097246170043945, -11.649641036987305, -10.202034950256348, -8.754429817199707, -7.306824684143066, -5.859218597412109, -4.411613464355469, -2.9640045166015625, -1.5163991451263428, -0.06879377365112305, 1.3788118362426758, 2.8264169692993164, 4.274022102355957, 5.721628189086914, 7.169233322143555, 8.616838455200195, 10.064443588256836, 11.512048721313477, 12.959654808044434, 14.407259941101074, 15.854865074157715, 17.302471160888672, 18.750076293945312, 20.197681427001953, 21.645286560058594, 23.092891693115234, 24.540496826171875, 25.988101959228516, 27.435707092285156, 28.88331413269043, 30.33091926574707, 31.77852439880371, 33.226131439208984, 34.673736572265625, 36.121341705322266, 37.568946838378906, 39.01655197143555, 40.46415710449219, 41.91176223754883, 43.35936737060547]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 22.0, 22.0, 46.0, 61.0, 108.0, 182.0, 288.0, 494.0, 855.0, 1591.0, 3016.0, 5524.0, 11425.0, 25043.0, 58091.0, 152241.0, 365459.0, 257978.0, 94021.0, 38071.0, 17006.0, 8055.0, 3989.0, 2148.0, 1166.0, 651.0, 388.0, 217.0, 142.0, 88.0, 52.0, 36.0, 15.0, 16.0, 10.0, 4.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.88671875, -5.70135498046875, -5.5159912109375, -5.33062744140625, -5.145263671875, -4.95989990234375, -4.7745361328125, -4.58917236328125, -4.40380859375, -4.21844482421875, -4.0330810546875, -3.84771728515625, -3.662353515625, -3.47698974609375, -3.2916259765625, -3.10626220703125, -2.9208984375, -2.73553466796875, -2.5501708984375, -2.36480712890625, -2.179443359375, -1.99407958984375, -1.8087158203125, -1.62335205078125, -1.43798828125, -1.25262451171875, -1.0672607421875, -0.88189697265625, -0.696533203125, -0.51116943359375, -0.3258056640625, -0.14044189453125, 0.044921875, 0.23028564453125, 0.4156494140625, 0.60101318359375, 0.786376953125, 0.97174072265625, 1.1571044921875, 1.34246826171875, 1.52783203125, 1.71319580078125, 1.8985595703125, 2.08392333984375, 2.269287109375, 2.45465087890625, 2.6400146484375, 2.82537841796875, 3.0107421875, 3.19610595703125, 3.3814697265625, 3.56683349609375, 3.752197265625, 3.93756103515625, 4.1229248046875, 4.30828857421875, 4.49365234375, 4.67901611328125, 4.8643798828125, 5.04974365234375, 5.235107421875, 5.42047119140625, 5.6058349609375, 5.79119873046875, 5.9765625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 6.0, 8.0, 5.0, 16.0, 17.0, 15.0, 20.0, 19.0, 22.0, 26.0, 26.0, 22.0, 48.0, 51.0, 40.0, 45.0, 63.0, 47.0, 51.0, 55.0, 63.0, 45.0, 40.0, 29.0, 28.0, 30.0, 34.0, 29.0, 19.0, 19.0, 15.0, 9.0, 11.0, 10.0, 10.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.706329345703125, -3.55914306640625, -3.411956787109375, -3.2647705078125, -3.117584228515625, -2.97039794921875, -2.823211669921875, -2.676025390625, -2.528839111328125, -2.38165283203125, -2.234466552734375, -2.0872802734375, -1.940093994140625, -1.79290771484375, -1.645721435546875, -1.49853515625, -1.351348876953125, -1.20416259765625, -1.056976318359375, -0.9097900390625, -0.762603759765625, -0.61541748046875, -0.468231201171875, -0.321044921875, -0.173858642578125, -0.02667236328125, 0.120513916015625, 0.2677001953125, 0.414886474609375, 0.56207275390625, 0.709259033203125, 0.8564453125, 1.003631591796875, 1.15081787109375, 1.298004150390625, 1.4451904296875, 1.592376708984375, 1.73956298828125, 1.886749267578125, 2.033935546875, 2.181121826171875, 2.32830810546875, 2.475494384765625, 2.6226806640625, 2.769866943359375, 2.91705322265625, 3.064239501953125, 3.21142578125, 3.358612060546875, 3.50579833984375, 3.652984619140625, 3.8001708984375, 3.947357177734375, 4.09454345703125, 4.241729736328125, 4.388916015625, 4.536102294921875, 4.68328857421875, 4.830474853515625, 4.9776611328125, 5.124847412109375, 5.27203369140625, 5.419219970703125, 5.56640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 6.0, 5.0, 10.0, 6.0, 7.0, 9.0, 26.0, 27.0, 51.0, 76.0, 107.0, 145.0, 287.0, 540.0, 1058.0, 3041.0, 11865.0, 77104.0, 724426.0, 198187.0, 23594.0, 4813.0, 1567.0, 721.0, 337.0, 192.0, 109.0, 68.0, 43.0, 32.0, 30.0, 13.0, 14.0, 6.0, 15.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.546875, -16.0833740234375, -15.619873046875, -15.1563720703125, -14.69287109375, -14.2293701171875, -13.765869140625, -13.3023681640625, -12.8388671875, -12.3753662109375, -11.911865234375, -11.4483642578125, -10.98486328125, -10.5213623046875, -10.057861328125, -9.5943603515625, -9.130859375, -8.6673583984375, -8.203857421875, -7.7403564453125, -7.27685546875, -6.8133544921875, -6.349853515625, -5.8863525390625, -5.4228515625, -4.9593505859375, -4.495849609375, -4.0323486328125, -3.56884765625, -3.1053466796875, -2.641845703125, -2.1783447265625, -1.71484375, -1.2513427734375, -0.787841796875, -0.3243408203125, 0.13916015625, 0.6026611328125, 1.066162109375, 1.5296630859375, 1.9931640625, 2.4566650390625, 2.920166015625, 3.3836669921875, 3.84716796875, 4.3106689453125, 4.774169921875, 5.2376708984375, 5.701171875, 6.1646728515625, 6.628173828125, 7.0916748046875, 7.55517578125, 8.0186767578125, 8.482177734375, 8.9456787109375, 9.4091796875, 9.8726806640625, 10.336181640625, 10.7996826171875, 11.26318359375, 11.7266845703125, 12.190185546875, 12.6536865234375, 13.1171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 7.0, 9.0, 8.0, 17.0, 11.0, 15.0, 17.0, 27.0, 37.0, 32.0, 37.0, 36.0, 59.0, 52.0, 60.0, 58.0, 45.0, 61.0, 56.0, 48.0, 54.0, 47.0, 38.0, 25.0, 23.0, 20.0, 18.0, 16.0, 12.0, 13.0, 5.0, 10.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.078125, -21.457275390625, -20.83642578125, -20.215576171875, -19.5947265625, -18.973876953125, -18.35302734375, -17.732177734375, -17.111328125, -16.490478515625, -15.86962890625, -15.248779296875, -14.6279296875, -14.007080078125, -13.38623046875, -12.765380859375, -12.14453125, -11.523681640625, -10.90283203125, -10.281982421875, -9.6611328125, -9.040283203125, -8.41943359375, -7.798583984375, -7.177734375, -6.556884765625, -5.93603515625, -5.315185546875, -4.6943359375, -4.073486328125, -3.45263671875, -2.831787109375, -2.2109375, -1.590087890625, -0.96923828125, -0.348388671875, 0.2724609375, 0.893310546875, 1.51416015625, 2.135009765625, 2.755859375, 3.376708984375, 3.99755859375, 4.618408203125, 5.2392578125, 5.860107421875, 6.48095703125, 7.101806640625, 7.72265625, 8.343505859375, 8.96435546875, 9.585205078125, 10.2060546875, 10.826904296875, 11.44775390625, 12.068603515625, 12.689453125, 13.310302734375, 13.93115234375, 14.552001953125, 15.1728515625, 15.793701171875, 16.41455078125, 17.035400390625, 17.65625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 3.0, 5.0, 7.0, 7.0, 21.0, 25.0, 49.0, 106.0, 253.0, 756.0, 3149.0, 30383.0, 877432.0, 127014.0, 7278.0, 1318.0, 366.0, 175.0, 83.0, 37.0, 18.0, 16.0, 14.0, 12.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.91796875, -10.5625, -10.20703125, -9.8515625, -9.49609375, -9.140625, -8.78515625, -8.4296875, -8.07421875, -7.71875, -7.36328125, -7.0078125, -6.65234375, -6.296875, -5.94140625, -5.5859375, -5.23046875, -4.875, -4.51953125, -4.1640625, -3.80859375, -3.453125, -3.09765625, -2.7421875, -2.38671875, -2.03125, -1.67578125, -1.3203125, -0.96484375, -0.609375, -0.25390625, 0.1015625, 0.45703125, 0.8125, 1.16796875, 1.5234375, 1.87890625, 2.234375, 2.58984375, 2.9453125, 3.30078125, 3.65625, 4.01171875, 4.3671875, 4.72265625, 5.078125, 5.43359375, 5.7890625, 6.14453125, 6.5, 6.85546875, 7.2109375, 7.56640625, 7.921875, 8.27734375, 8.6328125, 8.98828125, 9.34375, 9.69921875, 10.0546875, 10.41015625, 10.765625, 11.12109375, 11.4765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 9.0, 6.0, 6.0, 15.0, 15.0, 29.0, 37.0, 57.0, 61.0, 94.0, 116.0, 125.0, 118.0, 86.0, 63.0, 35.0, 18.0, 15.0, 21.0, 9.0, 9.0, 8.0, 8.0, 4.0, 6.0, 5.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012149810791015625, -0.0011805295944213867, -0.001146078109741211, -0.0011116266250610352, -0.0010771751403808594, -0.0010427236557006836, -0.0010082721710205078, -0.000973820686340332, -0.0009393692016601562, -0.0009049177169799805, -0.0008704662322998047, -0.0008360147476196289, -0.0008015632629394531, -0.0007671117782592773, -0.0007326602935791016, -0.0006982088088989258, -0.00066375732421875, -0.0006293058395385742, -0.0005948543548583984, -0.0005604028701782227, -0.0005259513854980469, -0.0004914999008178711, -0.0004570484161376953, -0.00042259693145751953, -0.00038814544677734375, -0.00035369396209716797, -0.0003192424774169922, -0.0002847909927368164, -0.0002503395080566406, -0.00021588802337646484, -0.00018143653869628906, -0.00014698505401611328, -0.0001125335693359375, -7.808208465576172e-05, -4.363059997558594e-05, -9.179115295410156e-06, 2.5272369384765625e-05, 5.9723854064941406e-05, 9.417533874511719e-05, 0.00012862682342529297, 0.00016307830810546875, 0.00019752979278564453, 0.0002319812774658203, 0.0002664327621459961, 0.0003008842468261719, 0.00033533573150634766, 0.00036978721618652344, 0.0004042387008666992, 0.000438690185546875, 0.0004731416702270508, 0.0005075931549072266, 0.0005420446395874023, 0.0005764961242675781, 0.0006109476089477539, 0.0006453990936279297, 0.0006798505783081055, 0.0007143020629882812, 0.000748753547668457, 0.0007832050323486328, 0.0008176565170288086, 0.0008521080017089844, 0.0008865594863891602, 0.0009210109710693359, 0.0009554624557495117, 0.0009899139404296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 8.0, 8.0, 17.0, 34.0, 52.0, 92.0, 155.0, 366.0, 777.0, 2161.0, 8029.0, 44676.0, 646346.0, 309173.0, 27889.0, 5784.0, 1685.0, 641.0, 295.0, 137.0, 83.0, 52.0, 25.0, 18.0, 13.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.66510009765625, -5.4278564453125, -5.19061279296875, -4.953369140625, -4.71612548828125, -4.4788818359375, -4.24163818359375, -4.00439453125, -3.76715087890625, -3.5299072265625, -3.29266357421875, -3.055419921875, -2.81817626953125, -2.5809326171875, -2.34368896484375, -2.1064453125, -1.86920166015625, -1.6319580078125, -1.39471435546875, -1.157470703125, -0.92022705078125, -0.6829833984375, -0.44573974609375, -0.20849609375, 0.02874755859375, 0.2659912109375, 0.50323486328125, 0.740478515625, 0.97772216796875, 1.2149658203125, 1.45220947265625, 1.689453125, 1.92669677734375, 2.1639404296875, 2.40118408203125, 2.638427734375, 2.87567138671875, 3.1129150390625, 3.35015869140625, 3.58740234375, 3.82464599609375, 4.0618896484375, 4.29913330078125, 4.536376953125, 4.77362060546875, 5.0108642578125, 5.24810791015625, 5.4853515625, 5.72259521484375, 5.9598388671875, 6.19708251953125, 6.434326171875, 6.67156982421875, 6.9088134765625, 7.14605712890625, 7.38330078125, 7.62054443359375, 7.8577880859375, 8.09503173828125, 8.332275390625, 8.56951904296875, 8.8067626953125, 9.04400634765625, 9.28125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 6.0, 11.0, 6.0, 15.0, 13.0, 19.0, 27.0, 26.0, 37.0, 46.0, 59.0, 86.0, 91.0, 94.0, 73.0, 65.0, 85.0, 50.0, 41.0, 25.0, 18.0, 16.0, 19.0, 12.0, 12.0, 9.0, 9.0, 9.0, 4.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.96343994140625, -4.8057861328125, -4.64813232421875, -4.490478515625, -4.33282470703125, -4.1751708984375, -4.01751708984375, -3.85986328125, -3.70220947265625, -3.5445556640625, -3.38690185546875, -3.229248046875, -3.07159423828125, -2.9139404296875, -2.75628662109375, -2.5986328125, -2.44097900390625, -2.2833251953125, -2.12567138671875, -1.968017578125, -1.81036376953125, -1.6527099609375, -1.49505615234375, -1.33740234375, -1.17974853515625, -1.0220947265625, -0.86444091796875, -0.706787109375, -0.54913330078125, -0.3914794921875, -0.23382568359375, -0.076171875, 0.08148193359375, 0.2391357421875, 0.39678955078125, 0.554443359375, 0.71209716796875, 0.8697509765625, 1.02740478515625, 1.18505859375, 1.34271240234375, 1.5003662109375, 1.65802001953125, 1.815673828125, 1.97332763671875, 2.1309814453125, 2.28863525390625, 2.4462890625, 2.60394287109375, 2.7615966796875, 2.91925048828125, 3.076904296875, 3.23455810546875, 3.3922119140625, 3.54986572265625, 3.70751953125, 3.86517333984375, 4.0228271484375, 4.18048095703125, 4.338134765625, 4.49578857421875, 4.6534423828125, 4.81109619140625, 4.96875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 9.0, 33.0, 92.0, 314.0, 373.0, 127.0, 23.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.34764099121094, -122.90054321289062, -116.45343780517578, -110.00634002685547, -103.55923461914062, -97.11213684082031, -90.6650390625, -84.21794128417969, -77.77083587646484, -71.32373809814453, -64.87663269042969, -58.429534912109375, -51.9824333190918, -45.53533172607422, -39.088233947753906, -32.64113235473633, -26.19403076171875, -19.746929168701172, -13.299829483032227, -6.852729797363281, -0.4056282043457031, 6.041473388671875, 12.488571166992188, 18.935672760009766, 25.382774353027344, 31.829875946044922, 38.2769775390625, 44.72407531738281, 51.17117691040039, 57.61827850341797, 64.06537628173828, 70.51248168945312, 76.9595947265625, 83.40669250488281, 89.85379791259766, 96.30089569091797, 102.74800109863281, 109.19509887695312, 115.64219665527344, 122.08929443359375, 128.53640747070312, 134.98350524902344, 141.43060302734375, 147.87771606445312, 154.32481384277344, 160.77191162109375, 167.21900939941406, 173.66610717773438, 180.1132049560547, 186.560302734375, 193.0074005126953, 199.45449829101562, 205.901611328125, 212.3487091064453, 218.79580688476562, 225.24290466308594, 231.69000244140625, 238.13710021972656, 244.58419799804688, 251.03131103515625, 257.4783935546875, 263.9255065917969, 270.37261962890625, 276.8197021484375, 283.2668151855469]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 10.0, 8.0, 9.0, 23.0, 15.0, 15.0, 23.0, 22.0, 36.0, 28.0, 48.0, 36.0, 50.0, 62.0, 57.0, 57.0, 69.0, 46.0, 52.0, 39.0, 38.0, 35.0, 38.0, 27.0, 18.0, 22.0, 19.0, 15.0, 15.0, 11.0, 13.0, 4.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.213623046875, -72.89950561523438, -70.58538818359375, -68.27127075195312, -65.9571533203125, -63.643035888671875, -61.328914642333984, -59.01479721069336, -56.700679779052734, -54.38656234741211, -52.072444915771484, -49.75832748413086, -47.44420623779297, -45.130088806152344, -42.81597137451172, -40.501853942871094, -38.18773651123047, -35.873619079589844, -33.55950164794922, -31.24538230895996, -28.931264877319336, -26.61714744567871, -24.303028106689453, -21.988910675048828, -19.674793243408203, -17.360675811767578, -15.046557426452637, -12.732439041137695, -10.41832160949707, -8.104204177856445, -5.790085792541504, -3.4759674072265625, -1.1618499755859375, 1.1522679328918457, 3.466385841369629, 5.780503749847412, 8.094621658325195, 10.40873908996582, 12.722857475280762, 15.036975860595703, 17.351093292236328, 19.665210723876953, 21.979328155517578, 24.293447494506836, 26.60756492614746, 28.921682357788086, 31.235801696777344, 33.54991912841797, 35.864036560058594, 38.17815399169922, 40.492271423339844, 42.80638885498047, 45.120506286621094, 47.43462371826172, 49.74874496459961, 52.062862396240234, 54.37697982788086, 56.691097259521484, 59.00521469116211, 61.319332122802734, 63.633453369140625, 65.94757080078125, 68.26168823242188, 70.5758056640625, 72.88992309570312]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 16.0, 9.0, 21.0, 29.0, 35.0, 55.0, 104.0, 155.0, 284.0, 493.0, 889.0, 1682.0, 3440.0, 7669.0, 19620.0, 70516.0, 494427.0, 2579530.0, 864646.0, 106542.0, 25816.0, 9611.0, 4223.0, 1982.0, 1056.0, 608.0, 308.0, 179.0, 113.0, 64.0, 51.0, 33.0, 23.0, 14.0, 14.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-6.98828125, -6.7974853515625, -6.606689453125, -6.4158935546875, -6.22509765625, -6.0343017578125, -5.843505859375, -5.6527099609375, -5.4619140625, -5.2711181640625, -5.080322265625, -4.8895263671875, -4.69873046875, -4.5079345703125, -4.317138671875, -4.1263427734375, -3.935546875, -3.7447509765625, -3.553955078125, -3.3631591796875, -3.17236328125, -2.9815673828125, -2.790771484375, -2.5999755859375, -2.4091796875, -2.2183837890625, -2.027587890625, -1.8367919921875, -1.64599609375, -1.4552001953125, -1.264404296875, -1.0736083984375, -0.8828125, -0.6920166015625, -0.501220703125, -0.3104248046875, -0.11962890625, 0.0711669921875, 0.261962890625, 0.4527587890625, 0.6435546875, 0.8343505859375, 1.025146484375, 1.2159423828125, 1.40673828125, 1.5975341796875, 1.788330078125, 1.9791259765625, 2.169921875, 2.3607177734375, 2.551513671875, 2.7423095703125, 2.93310546875, 3.1239013671875, 3.314697265625, 3.5054931640625, 3.6962890625, 3.8870849609375, 4.077880859375, 4.2686767578125, 4.45947265625, 4.6502685546875, 4.841064453125, 5.0318603515625, 5.22265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 13.0, 14.0, 16.0, 23.0, 27.0, 37.0, 35.0, 27.0, 28.0, 43.0, 45.0, 46.0, 53.0, 34.0, 62.0, 67.0, 42.0, 42.0, 47.0, 37.0, 37.0, 40.0, 23.0, 21.0, 21.0, 18.0, 22.0, 9.0, 8.0, 11.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.539825439453125, -3.40972900390625, -3.279632568359375, -3.1495361328125, -3.019439697265625, -2.88934326171875, -2.759246826171875, -2.629150390625, -2.499053955078125, -2.36895751953125, -2.238861083984375, -2.1087646484375, -1.978668212890625, -1.84857177734375, -1.718475341796875, -1.58837890625, -1.458282470703125, -1.32818603515625, -1.198089599609375, -1.0679931640625, -0.937896728515625, -0.80780029296875, -0.677703857421875, -0.547607421875, -0.417510986328125, -0.28741455078125, -0.157318115234375, -0.0272216796875, 0.102874755859375, 0.23297119140625, 0.363067626953125, 0.4931640625, 0.623260498046875, 0.75335693359375, 0.883453369140625, 1.0135498046875, 1.143646240234375, 1.27374267578125, 1.403839111328125, 1.533935546875, 1.664031982421875, 1.79412841796875, 1.924224853515625, 2.0543212890625, 2.184417724609375, 2.31451416015625, 2.444610595703125, 2.57470703125, 2.704803466796875, 2.83489990234375, 2.964996337890625, 3.0950927734375, 3.225189208984375, 3.35528564453125, 3.485382080078125, 3.615478515625, 3.745574951171875, 3.87567138671875, 4.005767822265625, 4.1358642578125, 4.265960693359375, 4.39605712890625, 4.526153564453125, 4.65625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 15.0, 25.0, 15.0, 29.0, 32.0, 59.0, 87.0, 132.0, 244.0, 517.0, 979.0, 2215.0, 5011.0, 14441.0, 48753.0, 289734.0, 2954984.0, 752150.0, 89316.0, 22695.0, 7467.0, 2818.0, 1163.0, 575.0, 306.0, 175.0, 97.0, 46.0, 46.0, 35.0, 17.0, 20.0, 14.0, 7.0, 7.0, 6.0, 2.0, 2.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40625, -7.138671875, -6.87109375, -6.603515625, -6.3359375, -6.068359375, -5.80078125, -5.533203125, -5.265625, -4.998046875, -4.73046875, -4.462890625, -4.1953125, -3.927734375, -3.66015625, -3.392578125, -3.125, -2.857421875, -2.58984375, -2.322265625, -2.0546875, -1.787109375, -1.51953125, -1.251953125, -0.984375, -0.716796875, -0.44921875, -0.181640625, 0.0859375, 0.353515625, 0.62109375, 0.888671875, 1.15625, 1.423828125, 1.69140625, 1.958984375, 2.2265625, 2.494140625, 2.76171875, 3.029296875, 3.296875, 3.564453125, 3.83203125, 4.099609375, 4.3671875, 4.634765625, 4.90234375, 5.169921875, 5.4375, 5.705078125, 5.97265625, 6.240234375, 6.5078125, 6.775390625, 7.04296875, 7.310546875, 7.578125, 7.845703125, 8.11328125, 8.380859375, 8.6484375, 8.916015625, 9.18359375, 9.451171875, 9.71875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 11.0, 16.0, 25.0, 19.0, 39.0, 40.0, 82.0, 124.0, 230.0, 376.0, 577.0, 722.0, 639.0, 384.0, 247.0, 181.0, 105.0, 70.0, 43.0, 38.0, 21.0, 16.0, 15.0, 6.0, 10.0, 6.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3828125, -10.0443115234375, -9.705810546875, -9.3673095703125, -9.02880859375, -8.6903076171875, -8.351806640625, -8.0133056640625, -7.6748046875, -7.3363037109375, -6.997802734375, -6.6593017578125, -6.32080078125, -5.9822998046875, -5.643798828125, -5.3052978515625, -4.966796875, -4.6282958984375, -4.289794921875, -3.9512939453125, -3.61279296875, -3.2742919921875, -2.935791015625, -2.5972900390625, -2.2587890625, -1.9202880859375, -1.581787109375, -1.2432861328125, -0.90478515625, -0.5662841796875, -0.227783203125, 0.1107177734375, 0.44921875, 0.7877197265625, 1.126220703125, 1.4647216796875, 1.80322265625, 2.1417236328125, 2.480224609375, 2.8187255859375, 3.1572265625, 3.4957275390625, 3.834228515625, 4.1727294921875, 4.51123046875, 4.8497314453125, 5.188232421875, 5.5267333984375, 5.865234375, 6.2037353515625, 6.542236328125, 6.8807373046875, 7.21923828125, 7.5577392578125, 7.896240234375, 8.2347412109375, 8.5732421875, 8.9117431640625, 9.250244140625, 9.5887451171875, 9.92724609375, 10.2657470703125, 10.604248046875, 10.9427490234375, 11.28125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 22.0, 94.0, 279.0, 332.0, 176.0, 54.0, 15.0, 10.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.1763916015625, -186.99813842773438, -180.81988525390625, -174.64163208007812, -168.46337890625, -162.28512573242188, -156.10687255859375, -149.92861938476562, -143.7503662109375, -137.57211303710938, -131.39385986328125, -125.21560668945312, -119.037353515625, -112.85910034179688, -106.68084716796875, -100.50259399414062, -94.32433319091797, -88.14608001708984, -81.96782684326172, -75.7895736694336, -69.61132049560547, -63.433067321777344, -57.25481033325195, -51.07655715942383, -44.8983039855957, -38.72005081176758, -32.54179763793945, -26.363542556762695, -20.18528938293457, -14.007036209106445, -7.8287811279296875, -1.6505279541015625, 4.5277252197265625, 10.705978393554688, 16.884231567382812, 23.06248664855957, 29.240739822387695, 35.41899108886719, 41.59724807739258, 47.7755012512207, 53.95375442504883, 60.13200759887695, 66.31026458740234, 72.48851776123047, 78.6667709350586, 84.84502410888672, 91.02327728271484, 97.20153045654297, 103.3797836303711, 109.55803680419922, 115.73628997802734, 121.91454315185547, 128.09280395507812, 134.27105712890625, 140.44931030273438, 146.6275634765625, 152.80581665039062, 158.98406982421875, 165.16232299804688, 171.340576171875, 177.51882934570312, 183.69708251953125, 189.87533569335938, 196.0535888671875, 202.23184204101562]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 9.0, 9.0, 10.0, 15.0, 16.0, 15.0, 17.0, 31.0, 29.0, 27.0, 40.0, 21.0, 24.0, 38.0, 37.0, 55.0, 53.0, 51.0, 42.0, 40.0, 48.0, 46.0, 35.0, 34.0, 39.0, 25.0, 32.0, 25.0, 28.0, 14.0, 13.0, 14.0, 13.0, 11.0, 8.0, 8.0, 3.0, 5.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.9694709777832, -44.469940185546875, -42.97040939331055, -41.47087860107422, -39.97134780883789, -38.47181701660156, -36.9722900390625, -35.472755432128906, -33.973228454589844, -32.473697662353516, -30.974166870117188, -29.47463607788086, -27.97510528564453, -26.475574493408203, -24.976045608520508, -23.47651481628418, -21.97698211669922, -20.47745132446289, -18.977920532226562, -17.478389739990234, -15.978859901428223, -14.479329109191895, -12.979799270629883, -11.480268478393555, -9.980737686157227, -8.481206893920898, -6.9816765785217285, -5.482146263122559, -3.9826154708862305, -2.4830846786499023, -0.9835548400878906, 0.5159759521484375, 2.0155105590820312, 3.5150411128997803, 5.014571666717529, 6.514101982116699, 8.013632774353027, 9.513163566589355, 11.012693405151367, 12.512224197387695, 14.011754989624023, 15.511285781860352, 17.01081657409668, 18.510345458984375, 20.009876251220703, 21.50940704345703, 23.00893783569336, 24.508468627929688, 26.007999420166016, 27.507530212402344, 29.007061004638672, 30.506591796875, 32.00612258911133, 33.505653381347656, 35.00518035888672, 36.50471496582031, 38.004241943359375, 39.5037727355957, 41.00330352783203, 42.50283432006836, 44.00236511230469, 45.501895904541016, 47.001426696777344, 48.500953674316406, 50.00048828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 11.0, 12.0, 17.0, 20.0, 26.0, 46.0, 72.0, 92.0, 172.0, 243.0, 416.0, 783.0, 1375.0, 2686.0, 5485.0, 11499.0, 24417.0, 53221.0, 115245.0, 240214.0, 294375.0, 159680.0, 73638.0, 34049.0, 15720.0, 7213.0, 3615.0, 1810.0, 972.0, 543.0, 319.0, 202.0, 116.0, 73.0, 63.0, 39.0, 17.0, 19.0, 9.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.36480712890625, -4.2100830078125, -4.05535888671875, -3.900634765625, -3.74591064453125, -3.5911865234375, -3.43646240234375, -3.28173828125, -3.12701416015625, -2.9722900390625, -2.81756591796875, -2.662841796875, -2.50811767578125, -2.3533935546875, -2.19866943359375, -2.0439453125, -1.88922119140625, -1.7344970703125, -1.57977294921875, -1.425048828125, -1.27032470703125, -1.1156005859375, -0.96087646484375, -0.80615234375, -0.65142822265625, -0.4967041015625, -0.34197998046875, -0.187255859375, -0.03253173828125, 0.1221923828125, 0.27691650390625, 0.431640625, 0.58636474609375, 0.7410888671875, 0.89581298828125, 1.050537109375, 1.20526123046875, 1.3599853515625, 1.51470947265625, 1.66943359375, 1.82415771484375, 1.9788818359375, 2.13360595703125, 2.288330078125, 2.44305419921875, 2.5977783203125, 2.75250244140625, 2.9072265625, 3.06195068359375, 3.2166748046875, 3.37139892578125, 3.526123046875, 3.68084716796875, 3.8355712890625, 3.99029541015625, 4.14501953125, 4.29974365234375, 4.4544677734375, 4.60919189453125, 4.763916015625, 4.91864013671875, 5.0733642578125, 5.22808837890625, 5.3828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 4.0, 7.0, 8.0, 6.0, 15.0, 12.0, 14.0, 22.0, 23.0, 33.0, 45.0, 32.0, 39.0, 57.0, 37.0, 36.0, 49.0, 48.0, 47.0, 56.0, 42.0, 42.0, 42.0, 43.0, 36.0, 34.0, 33.0, 20.0, 20.0, 24.0, 13.0, 12.0, 14.0, 12.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.564453125, -3.437103271484375, -3.30975341796875, -3.182403564453125, -3.0550537109375, -2.927703857421875, -2.80035400390625, -2.673004150390625, -2.545654296875, -2.418304443359375, -2.29095458984375, -2.163604736328125, -2.0362548828125, -1.908905029296875, -1.78155517578125, -1.654205322265625, -1.52685546875, -1.399505615234375, -1.27215576171875, -1.144805908203125, -1.0174560546875, -0.890106201171875, -0.76275634765625, -0.635406494140625, -0.508056640625, -0.380706787109375, -0.25335693359375, -0.126007080078125, 0.0013427734375, 0.128692626953125, 0.25604248046875, 0.383392333984375, 0.5107421875, 0.638092041015625, 0.76544189453125, 0.892791748046875, 1.0201416015625, 1.147491455078125, 1.27484130859375, 1.402191162109375, 1.529541015625, 1.656890869140625, 1.78424072265625, 1.911590576171875, 2.0389404296875, 2.166290283203125, 2.29364013671875, 2.420989990234375, 2.54833984375, 2.675689697265625, 2.80303955078125, 2.930389404296875, 3.0577392578125, 3.185089111328125, 3.31243896484375, 3.439788818359375, 3.567138671875, 3.694488525390625, 3.82183837890625, 3.949188232421875, 4.0765380859375, 4.203887939453125, 4.33123779296875, 4.458587646484375, 4.5859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 2.0, 7.0, 6.0, 3.0, 14.0, 20.0, 18.0, 34.0, 43.0, 80.0, 89.0, 143.0, 252.0, 400.0, 621.0, 1206.0, 2482.0, 7750.0, 45632.0, 649921.0, 301866.0, 27685.0, 5735.0, 1992.0, 1014.0, 521.0, 335.0, 218.0, 152.0, 92.0, 70.0, 45.0, 28.0, 18.0, 23.0, 7.0, 6.0, 3.0, 12.0, 8.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-17.234375, -16.7540283203125, -16.273681640625, -15.7933349609375, -15.31298828125, -14.8326416015625, -14.352294921875, -13.8719482421875, -13.3916015625, -12.9112548828125, -12.430908203125, -11.9505615234375, -11.47021484375, -10.9898681640625, -10.509521484375, -10.0291748046875, -9.548828125, -9.0684814453125, -8.588134765625, -8.1077880859375, -7.62744140625, -7.1470947265625, -6.666748046875, -6.1864013671875, -5.7060546875, -5.2257080078125, -4.745361328125, -4.2650146484375, -3.78466796875, -3.3043212890625, -2.823974609375, -2.3436279296875, -1.86328125, -1.3829345703125, -0.902587890625, -0.4222412109375, 0.05810546875, 0.5384521484375, 1.018798828125, 1.4991455078125, 1.9794921875, 2.4598388671875, 2.940185546875, 3.4205322265625, 3.90087890625, 4.3812255859375, 4.861572265625, 5.3419189453125, 5.822265625, 6.3026123046875, 6.782958984375, 7.2633056640625, 7.74365234375, 8.2239990234375, 8.704345703125, 9.1846923828125, 9.6650390625, 10.1453857421875, 10.625732421875, 11.1060791015625, 11.58642578125, 12.0667724609375, 12.547119140625, 13.0274658203125, 13.5078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 3.0, 6.0, 6.0, 7.0, 4.0, 7.0, 17.0, 11.0, 20.0, 11.0, 34.0, 34.0, 36.0, 44.0, 37.0, 33.0, 41.0, 52.0, 54.0, 56.0, 52.0, 41.0, 53.0, 37.0, 44.0, 41.0, 26.0, 37.0, 20.0, 28.0, 21.0, 23.0, 13.0, 7.0, 6.0, 11.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.578125, -16.022216796875, -15.46630859375, -14.910400390625, -14.3544921875, -13.798583984375, -13.24267578125, -12.686767578125, -12.130859375, -11.574951171875, -11.01904296875, -10.463134765625, -9.9072265625, -9.351318359375, -8.79541015625, -8.239501953125, -7.68359375, -7.127685546875, -6.57177734375, -6.015869140625, -5.4599609375, -4.904052734375, -4.34814453125, -3.792236328125, -3.236328125, -2.680419921875, -2.12451171875, -1.568603515625, -1.0126953125, -0.456787109375, 0.09912109375, 0.655029296875, 1.2109375, 1.766845703125, 2.32275390625, 2.878662109375, 3.4345703125, 3.990478515625, 4.54638671875, 5.102294921875, 5.658203125, 6.214111328125, 6.77001953125, 7.325927734375, 7.8818359375, 8.437744140625, 8.99365234375, 9.549560546875, 10.10546875, 10.661376953125, 11.21728515625, 11.773193359375, 12.3291015625, 12.885009765625, 13.44091796875, 13.996826171875, 14.552734375, 15.108642578125, 15.66455078125, 16.220458984375, 16.7763671875, 17.332275390625, 17.88818359375, 18.444091796875, 19.0]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 16.0, 18.0, 27.0, 41.0, 62.0, 113.0, 154.0, 266.0, 425.0, 835.0, 1901.0, 5364.0, 23170.0, 138958.0, 737189.0, 112293.0, 19288.0, 4881.0, 1745.0, 769.0, 426.0, 233.0, 145.0, 79.0, 37.0, 37.0, 29.0, 19.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.8359375, -6.65338134765625, -6.4708251953125, -6.28826904296875, -6.105712890625, -5.92315673828125, -5.7406005859375, -5.55804443359375, -5.37548828125, -5.19293212890625, -5.0103759765625, -4.82781982421875, -4.645263671875, -4.46270751953125, -4.2801513671875, -4.09759521484375, -3.9150390625, -3.73248291015625, -3.5499267578125, -3.36737060546875, -3.184814453125, -3.00225830078125, -2.8197021484375, -2.63714599609375, -2.45458984375, -2.27203369140625, -2.0894775390625, -1.90692138671875, -1.724365234375, -1.54180908203125, -1.3592529296875, -1.17669677734375, -0.994140625, -0.81158447265625, -0.6290283203125, -0.44647216796875, -0.263916015625, -0.08135986328125, 0.1011962890625, 0.28375244140625, 0.46630859375, 0.64886474609375, 0.8314208984375, 1.01397705078125, 1.196533203125, 1.37908935546875, 1.5616455078125, 1.74420166015625, 1.9267578125, 2.10931396484375, 2.2918701171875, 2.47442626953125, 2.656982421875, 2.83953857421875, 3.0220947265625, 3.20465087890625, 3.38720703125, 3.56976318359375, 3.7523193359375, 3.93487548828125, 4.117431640625, 4.29998779296875, 4.4825439453125, 4.66510009765625, 4.84765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 11.0, 12.0, 12.0, 18.0, 14.0, 14.0, 23.0, 29.0, 28.0, 31.0, 39.0, 64.0, 90.0, 116.0, 108.0, 73.0, 47.0, 35.0, 32.0, 34.0, 20.0, 28.0, 17.0, 11.0, 10.0, 11.0, 8.0, 7.0, 5.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0011053085327148438, -0.001072719693183899, -0.001040130853652954, -0.0010075420141220093, -0.0009749531745910645, -0.0009423643350601196, -0.0009097754955291748, -0.00087718665599823, -0.0008445978164672852, -0.0008120089769363403, -0.0007794201374053955, -0.0007468312978744507, -0.0007142424583435059, -0.000681653618812561, -0.0006490647792816162, -0.0006164759397506714, -0.0005838871002197266, -0.0005512982606887817, -0.0005187094211578369, -0.0004861205816268921, -0.00045353174209594727, -0.00042094290256500244, -0.0003883540630340576, -0.0003557652235031128, -0.00032317638397216797, -0.00029058754444122314, -0.0002579987049102783, -0.0002254098653793335, -0.00019282102584838867, -0.00016023218631744385, -0.00012764334678649902, -9.50545072555542e-05, -6.246566772460938e-05, -2.987682819366455e-05, 2.7120113372802734e-06, 3.53008508682251e-05, 6.788969039916992e-05, 0.00010047852993011475, 0.00013306736946105957, 0.0001656562089920044, 0.00019824504852294922, 0.00023083388805389404, 0.00026342272758483887, 0.0002960115671157837, 0.0003286004066467285, 0.00036118924617767334, 0.00039377808570861816, 0.000426366925239563, 0.0004589557647705078, 0.0004915446043014526, 0.0005241334438323975, 0.0005567222833633423, 0.0005893111228942871, 0.0006218999624252319, 0.0006544888019561768, 0.0006870776414871216, 0.0007196664810180664, 0.0007522553205490112, 0.0007848441600799561, 0.0008174329996109009, 0.0008500218391418457, 0.0008826106786727905, 0.0009151995182037354, 0.0009477883577346802, 0.000980377197265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 0.0, 3.0, 5.0, 7.0, 22.0, 29.0, 35.0, 35.0, 65.0, 68.0, 110.0, 133.0, 198.0, 310.0, 527.0, 945.0, 1786.0, 3914.0, 10468.0, 37252.0, 184946.0, 666731.0, 103724.0, 23334.0, 7413.0, 2975.0, 1403.0, 786.0, 438.0, 268.0, 175.0, 122.0, 104.0, 48.0, 46.0, 24.0, 29.0, 22.0, 8.0, 14.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.6171875, -5.44866943359375, -5.2801513671875, -5.11163330078125, -4.943115234375, -4.77459716796875, -4.6060791015625, -4.43756103515625, -4.26904296875, -4.10052490234375, -3.9320068359375, -3.76348876953125, -3.594970703125, -3.42645263671875, -3.2579345703125, -3.08941650390625, -2.9208984375, -2.75238037109375, -2.5838623046875, -2.41534423828125, -2.246826171875, -2.07830810546875, -1.9097900390625, -1.74127197265625, -1.57275390625, -1.40423583984375, -1.2357177734375, -1.06719970703125, -0.898681640625, -0.73016357421875, -0.5616455078125, -0.39312744140625, -0.224609375, -0.05609130859375, 0.1124267578125, 0.28094482421875, 0.449462890625, 0.61798095703125, 0.7864990234375, 0.95501708984375, 1.12353515625, 1.29205322265625, 1.4605712890625, 1.62908935546875, 1.797607421875, 1.96612548828125, 2.1346435546875, 2.30316162109375, 2.4716796875, 2.64019775390625, 2.8087158203125, 2.97723388671875, 3.145751953125, 3.31427001953125, 3.4827880859375, 3.65130615234375, 3.81982421875, 3.98834228515625, 4.1568603515625, 4.32537841796875, 4.493896484375, 4.66241455078125, 4.8309326171875, 4.99945068359375, 5.16796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 7.0, 13.0, 14.0, 11.0, 14.0, 22.0, 21.0, 27.0, 35.0, 30.0, 45.0, 57.0, 78.0, 89.0, 73.0, 87.0, 54.0, 56.0, 47.0, 31.0, 32.0, 26.0, 20.0, 24.0, 12.0, 8.0, 8.0, 11.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.8046875, -4.66387939453125, -4.5230712890625, -4.38226318359375, -4.241455078125, -4.10064697265625, -3.9598388671875, -3.81903076171875, -3.67822265625, -3.53741455078125, -3.3966064453125, -3.25579833984375, -3.114990234375, -2.97418212890625, -2.8333740234375, -2.69256591796875, -2.5517578125, -2.41094970703125, -2.2701416015625, -2.12933349609375, -1.988525390625, -1.84771728515625, -1.7069091796875, -1.56610107421875, -1.42529296875, -1.28448486328125, -1.1436767578125, -1.00286865234375, -0.862060546875, -0.72125244140625, -0.5804443359375, -0.43963623046875, -0.298828125, -0.15802001953125, -0.0172119140625, 0.12359619140625, 0.264404296875, 0.40521240234375, 0.5460205078125, 0.68682861328125, 0.82763671875, 0.96844482421875, 1.1092529296875, 1.25006103515625, 1.390869140625, 1.53167724609375, 1.6724853515625, 1.81329345703125, 1.9541015625, 2.09490966796875, 2.2357177734375, 2.37652587890625, 2.517333984375, 2.65814208984375, 2.7989501953125, 2.93975830078125, 3.08056640625, 3.22137451171875, 3.3621826171875, 3.50299072265625, 3.643798828125, 3.78460693359375, 3.9254150390625, 4.06622314453125, 4.20703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 10.0, 11.0, 27.0, 193.0, 510.0, 200.0, 34.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.8846435546875, -288.7700500488281, -280.6554870605469, -272.5408935546875, -264.42633056640625, -256.3117370605469, -248.1971435546875, -240.0825653076172, -231.96798706054688, -223.85340881347656, -215.73883056640625, -207.62423706054688, -199.50965881347656, -191.39508056640625, -183.28048706054688, -175.16590881347656, -167.05133056640625, -158.93675231933594, -150.82217407226562, -142.70758056640625, -134.59300231933594, -126.47842407226562, -118.36383819580078, -110.24925231933594, -102.13467407226562, -94.02009582519531, -85.90550994873047, -77.79092407226562, -69.67634582519531, -61.561763763427734, -53.447181701660156, -45.33259963989258, -37.217987060546875, -29.103404998779297, -20.98882293701172, -12.87424087524414, -4.7596588134765625, 3.3549232482910156, 11.469505310058594, 19.584087371826172, 27.69866943359375, 35.81325149536133, 43.927833557128906, 52.042415618896484, 60.15699768066406, 68.27157592773438, 76.38616180419922, 84.50074768066406, 92.61532592773438, 100.72990417480469, 108.84449005126953, 116.95907592773438, 125.07365417480469, 133.188232421875, 141.30282592773438, 149.4174041748047, 157.531982421875, 165.6465606689453, 173.76113891601562, 181.875732421875, 189.9903106689453, 198.10488891601562, 206.219482421875, 214.3340606689453, 222.44863891601562]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 16.0, 10.0, 9.0, 16.0, 28.0, 20.0, 30.0, 33.0, 48.0, 46.0, 50.0, 57.0, 90.0, 102.0, 84.0, 60.0, 50.0, 44.0, 33.0, 50.0, 23.0, 32.0, 21.0, 18.0, 7.0, 8.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.2222900390625, -68.44380950927734, -65.66533660888672, -62.88685607910156, -60.10837936401367, -57.32990264892578, -54.55142593383789, -51.77294921875, -48.994468688964844, -46.21599197387695, -43.43751525878906, -40.659034729003906, -37.880558013916016, -35.102081298828125, -32.323604583740234, -29.54512596130371, -26.766651153564453, -23.988174438476562, -21.20969581604004, -18.43121910095215, -15.652741432189941, -12.874263763427734, -10.095787048339844, -7.31730842590332, -4.53883171081543, -1.7603542804718018, 1.0181231498718262, 3.796600341796875, 6.575078010559082, 9.353555679321289, 12.13203239440918, 14.910511016845703, 17.688987731933594, 20.467464447021484, 23.245943069458008, 26.0244197845459, 28.802898406982422, 31.581375122070312, 34.3598518371582, 37.138328552246094, 39.91680908203125, 42.69528579711914, 45.47376251220703, 48.25224304199219, 51.03071975708008, 53.80919647216797, 56.58767318725586, 59.36614990234375, 62.14462661743164, 64.92310333251953, 67.70158386230469, 70.48005676269531, 73.25853729248047, 76.03701782226562, 78.81549072265625, 81.5939712524414, 84.37244415283203, 87.15092468261719, 89.92939758300781, 92.70787811279297, 95.4863510131836, 98.26483154296875, 101.04330444335938, 103.82178497314453, 106.60026550292969]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 15.0, 17.0, 23.0, 35.0, 39.0, 71.0, 124.0, 213.0, 289.0, 631.0, 1159.0, 2235.0, 5046.0, 12384.0, 39241.0, 271947.0, 2616698.0, 1112624.0, 96135.0, 21296.0, 7436.0, 3221.0, 1444.0, 718.0, 425.0, 270.0, 156.0, 112.0, 61.0, 60.0, 35.0, 22.0, 24.0, 12.0, 9.0, 6.0, 7.0, 6.0, 7.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.171875, -5.9495849609375, -5.727294921875, -5.5050048828125, -5.28271484375, -5.0604248046875, -4.838134765625, -4.6158447265625, -4.3935546875, -4.1712646484375, -3.948974609375, -3.7266845703125, -3.50439453125, -3.2821044921875, -3.059814453125, -2.8375244140625, -2.615234375, -2.3929443359375, -2.170654296875, -1.9483642578125, -1.72607421875, -1.5037841796875, -1.281494140625, -1.0592041015625, -0.8369140625, -0.6146240234375, -0.392333984375, -0.1700439453125, 0.05224609375, 0.2745361328125, 0.496826171875, 0.7191162109375, 0.94140625, 1.1636962890625, 1.385986328125, 1.6082763671875, 1.83056640625, 2.0528564453125, 2.275146484375, 2.4974365234375, 2.7197265625, 2.9420166015625, 3.164306640625, 3.3865966796875, 3.60888671875, 3.8311767578125, 4.053466796875, 4.2757568359375, 4.498046875, 4.7203369140625, 4.942626953125, 5.1649169921875, 5.38720703125, 5.6094970703125, 5.831787109375, 6.0540771484375, 6.2763671875, 6.4986572265625, 6.720947265625, 6.9432373046875, 7.16552734375, 7.3878173828125, 7.610107421875, 7.8323974609375, 8.0546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 14.0, 7.0, 12.0, 24.0, 22.0, 36.0, 39.0, 42.0, 71.0, 70.0, 84.0, 71.0, 71.0, 87.0, 76.0, 58.0, 44.0, 39.0, 35.0, 33.0, 22.0, 17.0, 15.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7109375, -3.515869140625, -3.32080078125, -3.125732421875, -2.9306640625, -2.735595703125, -2.54052734375, -2.345458984375, -2.150390625, -1.955322265625, -1.76025390625, -1.565185546875, -1.3701171875, -1.175048828125, -0.97998046875, -0.784912109375, -0.58984375, -0.394775390625, -0.19970703125, -0.004638671875, 0.1904296875, 0.385498046875, 0.58056640625, 0.775634765625, 0.970703125, 1.165771484375, 1.36083984375, 1.555908203125, 1.7509765625, 1.946044921875, 2.14111328125, 2.336181640625, 2.53125, 2.726318359375, 2.92138671875, 3.116455078125, 3.3115234375, 3.506591796875, 3.70166015625, 3.896728515625, 4.091796875, 4.286865234375, 4.48193359375, 4.677001953125, 4.8720703125, 5.067138671875, 5.26220703125, 5.457275390625, 5.65234375, 5.847412109375, 6.04248046875, 6.237548828125, 6.4326171875, 6.627685546875, 6.82275390625, 7.017822265625, 7.212890625, 7.407958984375, 7.60302734375, 7.798095703125, 7.9931640625, 8.188232421875, 8.38330078125, 8.578369140625, 8.7734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 9.0, 10.0, 18.0, 23.0, 43.0, 71.0, 110.0, 152.0, 252.0, 506.0, 1066.0, 2947.0, 11935.0, 96999.0, 3437162.0, 602955.0, 31475.0, 5639.0, 1592.0, 611.0, 301.0, 156.0, 96.0, 61.0, 34.0, 15.0, 15.0, 5.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.390625, -11.9595947265625, -11.528564453125, -11.0975341796875, -10.66650390625, -10.2354736328125, -9.804443359375, -9.3734130859375, -8.9423828125, -8.5113525390625, -8.080322265625, -7.6492919921875, -7.21826171875, -6.7872314453125, -6.356201171875, -5.9251708984375, -5.494140625, -5.0631103515625, -4.632080078125, -4.2010498046875, -3.77001953125, -3.3389892578125, -2.907958984375, -2.4769287109375, -2.0458984375, -1.6148681640625, -1.183837890625, -0.7528076171875, -0.32177734375, 0.1092529296875, 0.540283203125, 0.9713134765625, 1.40234375, 1.8333740234375, 2.264404296875, 2.6954345703125, 3.12646484375, 3.5574951171875, 3.988525390625, 4.4195556640625, 4.8505859375, 5.2816162109375, 5.712646484375, 6.1436767578125, 6.57470703125, 7.0057373046875, 7.436767578125, 7.8677978515625, 8.298828125, 8.7298583984375, 9.160888671875, 9.5919189453125, 10.02294921875, 10.4539794921875, 10.885009765625, 11.3160400390625, 11.7470703125, 12.1781005859375, 12.609130859375, 13.0401611328125, 13.47119140625, 13.9022216796875, 14.333251953125, 14.7642822265625, 15.1953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 11.0, 9.0, 10.0, 15.0, 28.0, 24.0, 64.0, 85.0, 202.0, 362.0, 693.0, 949.0, 725.0, 369.0, 211.0, 136.0, 72.0, 30.0, 28.0, 17.0, 8.0, 6.0, 6.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-17.25, -16.8624267578125, -16.474853515625, -16.0872802734375, -15.69970703125, -15.3121337890625, -14.924560546875, -14.5369873046875, -14.1494140625, -13.7618408203125, -13.374267578125, -12.9866943359375, -12.59912109375, -12.2115478515625, -11.823974609375, -11.4364013671875, -11.048828125, -10.6612548828125, -10.273681640625, -9.8861083984375, -9.49853515625, -9.1109619140625, -8.723388671875, -8.3358154296875, -7.9482421875, -7.5606689453125, -7.173095703125, -6.7855224609375, -6.39794921875, -6.0103759765625, -5.622802734375, -5.2352294921875, -4.84765625, -4.4600830078125, -4.072509765625, -3.6849365234375, -3.29736328125, -2.9097900390625, -2.522216796875, -2.1346435546875, -1.7470703125, -1.3594970703125, -0.971923828125, -0.5843505859375, -0.19677734375, 0.1907958984375, 0.578369140625, 0.9659423828125, 1.353515625, 1.7410888671875, 2.128662109375, 2.5162353515625, 2.90380859375, 3.2913818359375, 3.678955078125, 4.0665283203125, 4.4541015625, 4.8416748046875, 5.229248046875, 5.6168212890625, 6.00439453125, 6.3919677734375, 6.779541015625, 7.1671142578125, 7.5546875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 20.0, 36.0, 75.0, 140.0, 205.0, 195.0, 150.0, 77.0, 44.0, 21.0, 6.0, 4.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-131.5286102294922, -127.94721984863281, -124.3658218383789, -120.78443145751953, -117.20304107666016, -113.62164306640625, -110.04025268554688, -106.4588623046875, -102.8774642944336, -99.29607391357422, -95.71467590332031, -92.13328552246094, -88.55189514160156, -84.97049713134766, -81.38910675048828, -77.80770874023438, -74.226318359375, -70.64492797851562, -67.06352996826172, -63.482139587402344, -59.9007453918457, -56.31935119628906, -52.73796081542969, -49.15656661987305, -45.57518005371094, -41.9937858581543, -38.41239547729492, -34.83100128173828, -31.24960708618164, -27.668214797973633, -24.086822509765625, -20.505428314208984, -16.924034118652344, -13.34264087677002, -9.761247634887695, -6.1798553466796875, -2.5984621047973633, 0.9829311370849609, 4.564323425292969, 8.14571762084961, 11.727109909057617, 15.308503150939941, 18.889896392822266, 22.471288681030273, 26.05268096923828, 29.634075164794922, 33.21546936035156, 36.79685974121094, 40.37825393676758, 43.95964813232422, 47.541038513183594, 51.122432708740234, 54.703826904296875, 58.28521728515625, 61.86661148071289, 65.44800567626953, 69.0293960571289, 72.61078643798828, 76.19218444824219, 79.77357482910156, 83.35496520996094, 86.93636322021484, 90.51775360107422, 94.09915161132812, 97.6805419921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 12.0, 15.0, 19.0, 21.0, 37.0, 49.0, 81.0, 71.0, 82.0, 76.0, 72.0, 71.0, 69.0, 81.0, 66.0, 51.0, 34.0, 32.0, 15.0, 14.0, 18.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.54129028320312, -91.36346435546875, -89.1856460571289, -87.00782012939453, -84.83000183105469, -82.65217590332031, -80.47435760498047, -78.2965316772461, -76.11871337890625, -73.94088745117188, -71.76306915283203, -69.58524322509766, -67.40742492675781, -65.22959899902344, -63.051780700683594, -60.87395477294922, -58.69613265991211, -56.518310546875, -54.34048843383789, -52.16266632080078, -49.98484420776367, -47.80702209472656, -45.62919616699219, -43.451377868652344, -41.27355194091797, -39.09572982788086, -36.91790771484375, -34.74008560180664, -32.56226348876953, -30.384441375732422, -28.20661735534668, -26.02879524230957, -23.850975036621094, -21.673152923583984, -19.495330810546875, -17.317508697509766, -15.13968563079834, -12.96186351776123, -10.784040451049805, -8.606218338012695, -6.428396224975586, -4.250574111938477, -2.072751522064209, 0.1050710678100586, 2.282893180847168, 4.460715293884277, 6.638538360595703, 8.816360473632812, 10.994182586669922, 13.172004699707031, 15.34982681274414, 17.52764892578125, 19.70547103881836, 21.88329315185547, 24.06111717224121, 26.23893928527832, 28.41676139831543, 30.59458351135254, 32.77240753173828, 34.95022964477539, 37.1280517578125, 39.30587387084961, 41.48369598388672, 43.66151809692383, 45.83934020996094]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 12.0, 15.0, 17.0, 22.0, 21.0, 57.0, 87.0, 142.0, 293.0, 503.0, 1203.0, 2567.0, 6556.0, 19558.0, 66666.0, 251319.0, 467590.0, 164503.0, 44865.0, 13971.0, 4909.0, 1870.0, 849.0, 389.0, 223.0, 126.0, 69.0, 42.0, 39.0, 25.0, 10.0, 14.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1171875, -8.84375, -8.5703125, -8.296875, -8.0234375, -7.75, -7.4765625, -7.203125, -6.9296875, -6.65625, -6.3828125, -6.109375, -5.8359375, -5.5625, -5.2890625, -5.015625, -4.7421875, -4.46875, -4.1953125, -3.921875, -3.6484375, -3.375, -3.1015625, -2.828125, -2.5546875, -2.28125, -2.0078125, -1.734375, -1.4609375, -1.1875, -0.9140625, -0.640625, -0.3671875, -0.09375, 0.1796875, 0.453125, 0.7265625, 1.0, 1.2734375, 1.546875, 1.8203125, 2.09375, 2.3671875, 2.640625, 2.9140625, 3.1875, 3.4609375, 3.734375, 4.0078125, 4.28125, 4.5546875, 4.828125, 5.1015625, 5.375, 5.6484375, 5.921875, 6.1953125, 6.46875, 6.7421875, 7.015625, 7.2890625, 7.5625, 7.8359375, 8.109375, 8.3828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 10.0, 14.0, 12.0, 11.0, 18.0, 17.0, 26.0, 34.0, 24.0, 27.0, 46.0, 48.0, 34.0, 63.0, 51.0, 48.0, 42.0, 52.0, 44.0, 50.0, 59.0, 51.0, 32.0, 33.0, 35.0, 22.0, 21.0, 14.0, 14.0, 9.0, 13.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.96929931640625, -3.8370361328125, -3.70477294921875, -3.572509765625, -3.44024658203125, -3.3079833984375, -3.17572021484375, -3.04345703125, -2.91119384765625, -2.7789306640625, -2.64666748046875, -2.514404296875, -2.38214111328125, -2.2498779296875, -2.11761474609375, -1.9853515625, -1.85308837890625, -1.7208251953125, -1.58856201171875, -1.456298828125, -1.32403564453125, -1.1917724609375, -1.05950927734375, -0.92724609375, -0.79498291015625, -0.6627197265625, -0.53045654296875, -0.398193359375, -0.26593017578125, -0.1336669921875, -0.00140380859375, 0.130859375, 0.26312255859375, 0.3953857421875, 0.52764892578125, 0.659912109375, 0.79217529296875, 0.9244384765625, 1.05670166015625, 1.18896484375, 1.32122802734375, 1.4534912109375, 1.58575439453125, 1.718017578125, 1.85028076171875, 1.9825439453125, 2.11480712890625, 2.2470703125, 2.37933349609375, 2.5115966796875, 2.64385986328125, 2.776123046875, 2.90838623046875, 3.0406494140625, 3.17291259765625, 3.30517578125, 3.43743896484375, 3.5697021484375, 3.70196533203125, 3.834228515625, 3.96649169921875, 4.0987548828125, 4.23101806640625, 4.36328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 8.0, 14.0, 19.0, 17.0, 31.0, 43.0, 82.0, 102.0, 171.0, 273.0, 576.0, 1107.0, 3429.0, 17172.0, 259679.0, 724554.0, 33278.0, 4953.0, 1533.0, 625.0, 324.0, 178.0, 127.0, 89.0, 46.0, 33.0, 23.0, 20.0, 10.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.9375, -19.25341796875, -18.5693359375, -17.88525390625, -17.201171875, -16.51708984375, -15.8330078125, -15.14892578125, -14.46484375, -13.78076171875, -13.0966796875, -12.41259765625, -11.728515625, -11.04443359375, -10.3603515625, -9.67626953125, -8.9921875, -8.30810546875, -7.6240234375, -6.93994140625, -6.255859375, -5.57177734375, -4.8876953125, -4.20361328125, -3.51953125, -2.83544921875, -2.1513671875, -1.46728515625, -0.783203125, -0.09912109375, 0.5849609375, 1.26904296875, 1.953125, 2.63720703125, 3.3212890625, 4.00537109375, 4.689453125, 5.37353515625, 6.0576171875, 6.74169921875, 7.42578125, 8.10986328125, 8.7939453125, 9.47802734375, 10.162109375, 10.84619140625, 11.5302734375, 12.21435546875, 12.8984375, 13.58251953125, 14.2666015625, 14.95068359375, 15.634765625, 16.31884765625, 17.0029296875, 17.68701171875, 18.37109375, 19.05517578125, 19.7392578125, 20.42333984375, 21.107421875, 21.79150390625, 22.4755859375, 23.15966796875, 23.84375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 6.0, 8.0, 9.0, 10.0, 25.0, 10.0, 20.0, 19.0, 30.0, 23.0, 37.0, 32.0, 40.0, 16.0, 49.0, 41.0, 48.0, 39.0, 53.0, 40.0, 64.0, 37.0, 46.0, 45.0, 30.0, 27.0, 29.0, 19.0, 24.0, 21.0, 13.0, 14.0, 14.0, 12.0, 7.0, 4.0, 8.0, 4.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8515625, -13.3984375, -12.9453125, -12.4921875, -12.0390625, -11.5859375, -11.1328125, -10.6796875, -10.2265625, -9.7734375, -9.3203125, -8.8671875, -8.4140625, -7.9609375, -7.5078125, -7.0546875, -6.6015625, -6.1484375, -5.6953125, -5.2421875, -4.7890625, -4.3359375, -3.8828125, -3.4296875, -2.9765625, -2.5234375, -2.0703125, -1.6171875, -1.1640625, -0.7109375, -0.2578125, 0.1953125, 0.6484375, 1.1015625, 1.5546875, 2.0078125, 2.4609375, 2.9140625, 3.3671875, 3.8203125, 4.2734375, 4.7265625, 5.1796875, 5.6328125, 6.0859375, 6.5390625, 6.9921875, 7.4453125, 7.8984375, 8.3515625, 8.8046875, 9.2578125, 9.7109375, 10.1640625, 10.6171875, 11.0703125, 11.5234375, 11.9765625, 12.4296875, 12.8828125, 13.3359375, 13.7890625, 14.2421875, 14.6953125, 15.1484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 6.0, 8.0, 11.0, 12.0, 13.0, 20.0, 39.0, 41.0, 72.0, 81.0, 135.0, 193.0, 358.0, 590.0, 1106.0, 2416.0, 6742.0, 23272.0, 106854.0, 725231.0, 138921.0, 28648.0, 7937.0, 2857.0, 1217.0, 639.0, 383.0, 209.0, 178.0, 103.0, 70.0, 58.0, 34.0, 19.0, 16.0, 15.0, 16.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-7.33984375, -7.114501953125, -6.88916015625, -6.663818359375, -6.4384765625, -6.213134765625, -5.98779296875, -5.762451171875, -5.537109375, -5.311767578125, -5.08642578125, -4.861083984375, -4.6357421875, -4.410400390625, -4.18505859375, -3.959716796875, -3.734375, -3.509033203125, -3.28369140625, -3.058349609375, -2.8330078125, -2.607666015625, -2.38232421875, -2.156982421875, -1.931640625, -1.706298828125, -1.48095703125, -1.255615234375, -1.0302734375, -0.804931640625, -0.57958984375, -0.354248046875, -0.12890625, 0.096435546875, 0.32177734375, 0.547119140625, 0.7724609375, 0.997802734375, 1.22314453125, 1.448486328125, 1.673828125, 1.899169921875, 2.12451171875, 2.349853515625, 2.5751953125, 2.800537109375, 3.02587890625, 3.251220703125, 3.4765625, 3.701904296875, 3.92724609375, 4.152587890625, 4.3779296875, 4.603271484375, 4.82861328125, 5.053955078125, 5.279296875, 5.504638671875, 5.72998046875, 5.955322265625, 6.1806640625, 6.406005859375, 6.63134765625, 6.856689453125, 7.08203125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 1.0, 5.0, 6.0, 5.0, 7.0, 15.0, 18.0, 9.0, 16.0, 23.0, 36.0, 39.0, 57.0, 96.0, 168.0, 152.0, 106.0, 51.0, 50.0, 36.0, 21.0, 17.0, 11.0, 14.0, 8.0, 14.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018329620361328125, -0.0017670989036560059, -0.0017012357711791992, -0.0016353726387023926, -0.001569509506225586, -0.0015036463737487793, -0.0014377832412719727, -0.001371920108795166, -0.0013060569763183594, -0.0012401938438415527, -0.001174330711364746, -0.0011084675788879395, -0.0010426044464111328, -0.0009767413139343262, -0.0009108781814575195, -0.0008450150489807129, -0.0007791519165039062, -0.0007132887840270996, -0.000647425651550293, -0.0005815625190734863, -0.0005156993865966797, -0.00044983625411987305, -0.0003839731216430664, -0.00031810998916625977, -0.0002522468566894531, -0.00018638372421264648, -0.00012052059173583984, -5.46574592590332e-05, 1.1205673217773438e-05, 7.706880569458008e-05, 0.00014293193817138672, 0.00020879507064819336, 0.000274658203125, 0.00034052133560180664, 0.0004063844680786133, 0.0004722476005554199, 0.0005381107330322266, 0.0006039738655090332, 0.0006698369979858398, 0.0007357001304626465, 0.0008015632629394531, 0.0008674263954162598, 0.0009332895278930664, 0.000999152660369873, 0.0010650157928466797, 0.0011308789253234863, 0.001196742057800293, 0.0012626051902770996, 0.0013284683227539062, 0.0013943314552307129, 0.0014601945877075195, 0.0015260577201843262, 0.0015919208526611328, 0.0016577839851379395, 0.001723647117614746, 0.0017895102500915527, 0.0018553733825683594, 0.001921236515045166, 0.0019870996475219727, 0.0020529627799987793, 0.002118825912475586, 0.0021846890449523926, 0.0022505521774291992, 0.002316415309906006, 0.0023822784423828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 4.0, 13.0, 20.0, 28.0, 47.0, 63.0, 92.0, 146.0, 262.0, 514.0, 1073.0, 2538.0, 8136.0, 39307.0, 523327.0, 421825.0, 38345.0, 8012.0, 2566.0, 1041.0, 526.0, 256.0, 136.0, 95.0, 71.0, 32.0, 21.0, 21.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.984375, -9.6817626953125, -9.379150390625, -9.0765380859375, -8.77392578125, -8.4713134765625, -8.168701171875, -7.8660888671875, -7.5634765625, -7.2608642578125, -6.958251953125, -6.6556396484375, -6.35302734375, -6.0504150390625, -5.747802734375, -5.4451904296875, -5.142578125, -4.8399658203125, -4.537353515625, -4.2347412109375, -3.93212890625, -3.6295166015625, -3.326904296875, -3.0242919921875, -2.7216796875, -2.4190673828125, -2.116455078125, -1.8138427734375, -1.51123046875, -1.2086181640625, -0.906005859375, -0.6033935546875, -0.30078125, 0.0018310546875, 0.304443359375, 0.6070556640625, 0.90966796875, 1.2122802734375, 1.514892578125, 1.8175048828125, 2.1201171875, 2.4227294921875, 2.725341796875, 3.0279541015625, 3.33056640625, 3.6331787109375, 3.935791015625, 4.2384033203125, 4.541015625, 4.8436279296875, 5.146240234375, 5.4488525390625, 5.75146484375, 6.0540771484375, 6.356689453125, 6.6593017578125, 6.9619140625, 7.2645263671875, 7.567138671875, 7.8697509765625, 8.17236328125, 8.4749755859375, 8.777587890625, 9.0802001953125, 9.3828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 5.0, 8.0, 6.0, 8.0, 5.0, 13.0, 13.0, 17.0, 22.0, 25.0, 35.0, 42.0, 56.0, 75.0, 111.0, 131.0, 101.0, 82.0, 61.0, 35.0, 26.0, 27.0, 18.0, 8.0, 11.0, 4.0, 10.0, 10.0, 8.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0, -5.8016357421875, -5.603271484375, -5.4049072265625, -5.20654296875, -5.0081787109375, -4.809814453125, -4.6114501953125, -4.4130859375, -4.2147216796875, -4.016357421875, -3.8179931640625, -3.61962890625, -3.4212646484375, -3.222900390625, -3.0245361328125, -2.826171875, -2.6278076171875, -2.429443359375, -2.2310791015625, -2.03271484375, -1.8343505859375, -1.635986328125, -1.4376220703125, -1.2392578125, -1.0408935546875, -0.842529296875, -0.6441650390625, -0.44580078125, -0.2474365234375, -0.049072265625, 0.1492919921875, 0.34765625, 0.5460205078125, 0.744384765625, 0.9427490234375, 1.14111328125, 1.3394775390625, 1.537841796875, 1.7362060546875, 1.9345703125, 2.1329345703125, 2.331298828125, 2.5296630859375, 2.72802734375, 2.9263916015625, 3.124755859375, 3.3231201171875, 3.521484375, 3.7198486328125, 3.918212890625, 4.1165771484375, 4.31494140625, 4.5133056640625, 4.711669921875, 4.9100341796875, 5.1083984375, 5.3067626953125, 5.505126953125, 5.7034912109375, 5.90185546875, 6.1002197265625, 6.298583984375, 6.4969482421875, 6.6953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 18.0, 53.0, 181.0, 407.0, 193.0, 78.0, 31.0, 19.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.91183471679688, -199.8923797607422, -192.87294006347656, -185.85348510742188, -178.83404541015625, -171.81459045410156, -164.79513549804688, -157.77569580078125, -150.75625610351562, -143.73680114746094, -136.7173614501953, -129.69790649414062, -122.678466796875, -115.65901184082031, -108.63956451416016, -101.6201171875, -94.60066223144531, -87.58121490478516, -80.561767578125, -73.54231262207031, -66.52287292480469, -59.503421783447266, -52.483970642089844, -45.46452331542969, -38.44507598876953, -31.425628662109375, -24.406179428100586, -17.386730194091797, -10.36728286743164, -3.3478355407714844, 3.6716156005859375, 10.691062927246094, 17.710525512695312, 24.72997283935547, 31.749422073364258, 38.76887130737305, 45.7883186340332, 52.80776596069336, 59.82721710205078, 66.84666442871094, 73.8661117553711, 80.88555908203125, 87.9050064086914, 94.92445373535156, 101.94390869140625, 108.96334838867188, 115.98280334472656, 123.00225067138672, 130.02169799804688, 137.04115295410156, 144.0605926513672, 151.08004760742188, 158.0994873046875, 165.1189422607422, 172.13839721679688, 179.1578369140625, 186.17727661132812, 193.1967315673828, 200.21617126464844, 207.23562622070312, 214.25506591796875, 221.27452087402344, 228.29397583007812, 235.31341552734375, 242.33287048339844]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 7.0, 7.0, 11.0, 8.0, 17.0, 11.0, 19.0, 19.0, 25.0, 21.0, 17.0, 25.0, 23.0, 29.0, 35.0, 41.0, 27.0, 57.0, 56.0, 89.0, 55.0, 50.0, 34.0, 32.0, 30.0, 24.0, 36.0, 30.0, 17.0, 16.0, 17.0, 15.0, 22.0, 16.0, 10.0, 9.0, 11.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.49586868286133, -51.54290771484375, -49.58994674682617, -47.636985778808594, -45.684024810791016, -43.73106384277344, -41.778106689453125, -39.82514190673828, -37.87218475341797, -35.91922378540039, -33.96626281738281, -32.013301849365234, -30.060340881347656, -28.107379913330078, -26.154420852661133, -24.201459884643555, -22.248497009277344, -20.295536041259766, -18.342575073242188, -16.38961410522461, -14.436654090881348, -12.48369312286377, -10.530733108520508, -8.57777214050293, -6.624811172485352, -4.671850204467773, -2.7188897132873535, -0.7659292221069336, 1.1870317459106445, 3.1399927139282227, 5.092952728271484, 7.0459136962890625, 8.998870849609375, 10.951831817626953, 12.904792785644531, 14.857752799987793, 16.810714721679688, 18.763675689697266, 20.71663475036621, 22.66959571838379, 24.622556686401367, 26.575517654418945, 28.528478622436523, 30.48143768310547, 32.43439865112305, 34.387359619140625, 36.3403205871582, 38.29328155517578, 40.24624252319336, 42.19920349121094, 44.152164459228516, 46.105125427246094, 48.05808639526367, 50.01104736328125, 51.96400451660156, 53.916969299316406, 55.86992645263672, 57.8228874206543, 59.775848388671875, 61.72880935668945, 63.68177032470703, 65.63472747802734, 67.58769226074219, 69.5406494140625, 71.49361419677734]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 5.0, 10.0, 17.0, 26.0, 31.0, 43.0, 76.0, 100.0, 159.0, 282.0, 616.0, 1257.0, 3316.0, 11619.0, 85372.0, 2980998.0, 1062461.0, 36733.0, 6848.0, 2244.0, 932.0, 454.0, 241.0, 139.0, 94.0, 53.0, 34.0, 32.0, 23.0, 15.0, 16.0, 9.0, 3.0, 1.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.28662109375, -9.9169921875, -9.54736328125, -9.177734375, -8.80810546875, -8.4384765625, -8.06884765625, -7.69921875, -7.32958984375, -6.9599609375, -6.59033203125, -6.220703125, -5.85107421875, -5.4814453125, -5.11181640625, -4.7421875, -4.37255859375, -4.0029296875, -3.63330078125, -3.263671875, -2.89404296875, -2.5244140625, -2.15478515625, -1.78515625, -1.41552734375, -1.0458984375, -0.67626953125, -0.306640625, 0.06298828125, 0.4326171875, 0.80224609375, 1.171875, 1.54150390625, 1.9111328125, 2.28076171875, 2.650390625, 3.02001953125, 3.3896484375, 3.75927734375, 4.12890625, 4.49853515625, 4.8681640625, 5.23779296875, 5.607421875, 5.97705078125, 6.3466796875, 6.71630859375, 7.0859375, 7.45556640625, 7.8251953125, 8.19482421875, 8.564453125, 8.93408203125, 9.3037109375, 9.67333984375, 10.04296875, 10.41259765625, 10.7822265625, 11.15185546875, 11.521484375, 11.89111328125, 12.2607421875, 12.63037109375, 13.0]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 9.0, 10.0, 19.0, 16.0, 20.0, 27.0, 41.0, 28.0, 46.0, 41.0, 54.0, 44.0, 50.0, 51.0, 44.0, 57.0, 55.0, 46.0, 52.0, 37.0, 37.0, 41.0, 23.0, 33.0, 27.0, 19.0, 11.0, 13.0, 5.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.0718994140625, -3.932861328125, -3.7938232421875, -3.65478515625, -3.5157470703125, -3.376708984375, -3.2376708984375, -3.0986328125, -2.9595947265625, -2.820556640625, -2.6815185546875, -2.54248046875, -2.4034423828125, -2.264404296875, -2.1253662109375, -1.986328125, -1.8472900390625, -1.708251953125, -1.5692138671875, -1.43017578125, -1.2911376953125, -1.152099609375, -1.0130615234375, -0.8740234375, -0.7349853515625, -0.595947265625, -0.4569091796875, -0.31787109375, -0.1788330078125, -0.039794921875, 0.0992431640625, 0.23828125, 0.3773193359375, 0.516357421875, 0.6553955078125, 0.79443359375, 0.9334716796875, 1.072509765625, 1.2115478515625, 1.3505859375, 1.4896240234375, 1.628662109375, 1.7677001953125, 1.90673828125, 2.0457763671875, 2.184814453125, 2.3238525390625, 2.462890625, 2.6019287109375, 2.740966796875, 2.8800048828125, 3.01904296875, 3.1580810546875, 3.297119140625, 3.4361572265625, 3.5751953125, 3.7142333984375, 3.853271484375, 3.9923095703125, 4.13134765625, 4.2703857421875, 4.409423828125, 4.5484619140625, 4.6875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 12.0, 9.0, 18.0, 28.0, 54.0, 84.0, 118.0, 223.0, 420.0, 748.0, 1633.0, 5670.0, 75600.0, 4028576.0, 72808.0, 5540.0, 1471.0, 591.0, 291.0, 155.0, 97.0, 43.0, 28.0, 27.0, 10.0, 13.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -27.09716796875, -26.2880859375, -25.47900390625, -24.669921875, -23.86083984375, -23.0517578125, -22.24267578125, -21.43359375, -20.62451171875, -19.8154296875, -19.00634765625, -18.197265625, -17.38818359375, -16.5791015625, -15.77001953125, -14.9609375, -14.15185546875, -13.3427734375, -12.53369140625, -11.724609375, -10.91552734375, -10.1064453125, -9.29736328125, -8.48828125, -7.67919921875, -6.8701171875, -6.06103515625, -5.251953125, -4.44287109375, -3.6337890625, -2.82470703125, -2.015625, -1.20654296875, -0.3974609375, 0.41162109375, 1.220703125, 2.02978515625, 2.8388671875, 3.64794921875, 4.45703125, 5.26611328125, 6.0751953125, 6.88427734375, 7.693359375, 8.50244140625, 9.3115234375, 10.12060546875, 10.9296875, 11.73876953125, 12.5478515625, 13.35693359375, 14.166015625, 14.97509765625, 15.7841796875, 16.59326171875, 17.40234375, 18.21142578125, 19.0205078125, 19.82958984375, 20.638671875, 21.44775390625, 22.2568359375, 23.06591796875, 23.875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 10.0, 16.0, 27.0, 43.0, 137.0, 332.0, 1022.0, 1432.0, 650.0, 224.0, 69.0, 46.0, 22.0, 22.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.15625, -24.51611328125, -23.8759765625, -23.23583984375, -22.595703125, -21.95556640625, -21.3154296875, -20.67529296875, -20.03515625, -19.39501953125, -18.7548828125, -18.11474609375, -17.474609375, -16.83447265625, -16.1943359375, -15.55419921875, -14.9140625, -14.27392578125, -13.6337890625, -12.99365234375, -12.353515625, -11.71337890625, -11.0732421875, -10.43310546875, -9.79296875, -9.15283203125, -8.5126953125, -7.87255859375, -7.232421875, -6.59228515625, -5.9521484375, -5.31201171875, -4.671875, -4.03173828125, -3.3916015625, -2.75146484375, -2.111328125, -1.47119140625, -0.8310546875, -0.19091796875, 0.44921875, 1.08935546875, 1.7294921875, 2.36962890625, 3.009765625, 3.64990234375, 4.2900390625, 4.93017578125, 5.5703125, 6.21044921875, 6.8505859375, 7.49072265625, 8.130859375, 8.77099609375, 9.4111328125, 10.05126953125, 10.69140625, 11.33154296875, 11.9716796875, 12.61181640625, 13.251953125, 13.89208984375, 14.5322265625, 15.17236328125, 15.8125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 34.0, 94.0, 349.0, 345.0, 113.0, 37.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.16969299316406, -132.783203125, -125.3967056274414, -118.01021575927734, -110.62371826171875, -103.23722839355469, -95.85073852539062, -88.46424865722656, -81.07775115966797, -73.6912612915039, -66.30476379394531, -58.91827392578125, -51.53178024291992, -44.145286560058594, -36.75879669189453, -29.372303009033203, -21.985809326171875, -14.599316596984863, -7.212823867797852, 0.17366790771484375, 7.560161590576172, 14.9466552734375, 22.333145141601562, 29.71963882446289, 37.10613250732422, 44.49262619018555, 51.879119873046875, 59.26560974121094, 66.652099609375, 74.0385971069336, 81.42508697509766, 88.81158447265625, 96.19808959960938, 103.58457946777344, 110.97107696533203, 118.3575668334961, 125.74406433105469, 133.13055419921875, 140.5170440673828, 147.90353393554688, 155.2900390625, 162.67652893066406, 170.06301879882812, 177.44952392578125, 184.8360137939453, 192.22250366210938, 199.60899353027344, 206.9954833984375, 214.38197326660156, 221.76846313476562, 229.1549530029297, 236.54144287109375, 243.92794799804688, 251.31443786621094, 258.700927734375, 266.0874328613281, 273.4739074707031, 280.86041259765625, 288.24688720703125, 295.6333923339844, 303.0198669433594, 310.4063720703125, 317.7928466796875, 325.1793518066406, 332.56585693359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 22.0, 28.0, 36.0, 64.0, 85.0, 134.0, 156.0, 132.0, 100.0, 81.0, 60.0, 39.0, 27.0, 12.0, 8.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.11483764648438, -122.36213684082031, -118.60943603515625, -114.85672760009766, -111.1040267944336, -107.35132598876953, -103.59862518310547, -99.84591674804688, -96.09321594238281, -92.34051513671875, -88.58781433105469, -84.8351058959961, -81.08240509033203, -77.32970428466797, -73.5770034790039, -69.82429504394531, -66.07159423828125, -62.31889343261719, -58.56618881225586, -54.8134880065918, -51.06078338623047, -47.308082580566406, -43.555381774902344, -39.802677154541016, -36.04998016357422, -32.297279357910156, -28.544574737548828, -24.791873931884766, -21.039169311523438, -17.286468505859375, -13.53376579284668, -9.781063079833984, -6.028358459472656, -2.27565598487854, 1.4770464897155762, 5.229748725891113, 8.982451438903809, 12.735153198242188, 16.487855911254883, 20.240558624267578, 23.993261337280273, 27.74596405029297, 31.498666763305664, 35.25136947631836, 39.00407028198242, 42.75677490234375, 46.50947570800781, 50.262176513671875, 54.0148811340332, 57.767581939697266, 61.520286560058594, 65.27298736572266, 69.02568817138672, 72.77839660644531, 76.53109741210938, 80.28379821777344, 84.0364990234375, 87.78919982910156, 91.54190063476562, 95.29460906982422, 99.04730987548828, 102.80001068115234, 106.5527114868164, 110.305419921875, 114.05812072753906]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 8.0, 4.0, 4.0, 17.0, 17.0, 27.0, 30.0, 40.0, 74.0, 116.0, 268.0, 479.0, 1116.0, 3078.0, 9866.0, 39643.0, 200317.0, 549616.0, 191064.0, 37857.0, 9599.0, 3081.0, 1184.0, 461.0, 227.0, 132.0, 71.0, 52.0, 31.0, 23.0, 13.0, 14.0, 9.0, 8.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.1627197265625, -8.841064453125, -8.5194091796875, -8.19775390625, -7.8760986328125, -7.554443359375, -7.2327880859375, -6.9111328125, -6.5894775390625, -6.267822265625, -5.9461669921875, -5.62451171875, -5.3028564453125, -4.981201171875, -4.6595458984375, -4.337890625, -4.0162353515625, -3.694580078125, -3.3729248046875, -3.05126953125, -2.7296142578125, -2.407958984375, -2.0863037109375, -1.7646484375, -1.4429931640625, -1.121337890625, -0.7996826171875, -0.47802734375, -0.1563720703125, 0.165283203125, 0.4869384765625, 0.80859375, 1.1302490234375, 1.451904296875, 1.7735595703125, 2.09521484375, 2.4168701171875, 2.738525390625, 3.0601806640625, 3.3818359375, 3.7034912109375, 4.025146484375, 4.3468017578125, 4.66845703125, 4.9901123046875, 5.311767578125, 5.6334228515625, 5.955078125, 6.2767333984375, 6.598388671875, 6.9200439453125, 7.24169921875, 7.5633544921875, 7.885009765625, 8.2066650390625, 8.5283203125, 8.8499755859375, 9.171630859375, 9.4932861328125, 9.81494140625, 10.1365966796875, 10.458251953125, 10.7799072265625, 11.1015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 18.0, 22.0, 21.0, 24.0, 39.0, 52.0, 63.0, 49.0, 80.0, 64.0, 82.0, 83.0, 79.0, 80.0, 55.0, 57.0, 33.0, 28.0, 24.0, 14.0, 13.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.765625, -7.54058837890625, -7.3155517578125, -7.09051513671875, -6.865478515625, -6.64044189453125, -6.4154052734375, -6.19036865234375, -5.96533203125, -5.74029541015625, -5.5152587890625, -5.29022216796875, -5.065185546875, -4.84014892578125, -4.6151123046875, -4.39007568359375, -4.1650390625, -3.94000244140625, -3.7149658203125, -3.48992919921875, -3.264892578125, -3.03985595703125, -2.8148193359375, -2.58978271484375, -2.36474609375, -2.13970947265625, -1.9146728515625, -1.68963623046875, -1.464599609375, -1.23956298828125, -1.0145263671875, -0.78948974609375, -0.564453125, -0.33941650390625, -0.1143798828125, 0.11065673828125, 0.335693359375, 0.56072998046875, 0.7857666015625, 1.01080322265625, 1.23583984375, 1.46087646484375, 1.6859130859375, 1.91094970703125, 2.135986328125, 2.36102294921875, 2.5860595703125, 2.81109619140625, 3.0361328125, 3.26116943359375, 3.4862060546875, 3.71124267578125, 3.936279296875, 4.16131591796875, 4.3863525390625, 4.61138916015625, 4.83642578125, 5.06146240234375, 5.2864990234375, 5.51153564453125, 5.736572265625, 5.96160888671875, 6.1866455078125, 6.41168212890625, 6.63671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 5.0, 6.0, 10.0, 14.0, 20.0, 31.0, 28.0, 49.0, 56.0, 64.0, 131.0, 173.0, 312.0, 706.0, 2141.0, 8751.0, 52893.0, 532824.0, 389990.0, 48339.0, 8315.0, 2042.0, 704.0, 351.0, 192.0, 115.0, 74.0, 56.0, 38.0, 32.0, 19.0, 20.0, 12.0, 9.0, 8.0, 5.0, 3.0, 0.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.942626953125, -11.55712890625, -11.171630859375, -10.7861328125, -10.400634765625, -10.01513671875, -9.629638671875, -9.244140625, -8.858642578125, -8.47314453125, -8.087646484375, -7.7021484375, -7.316650390625, -6.93115234375, -6.545654296875, -6.16015625, -5.774658203125, -5.38916015625, -5.003662109375, -4.6181640625, -4.232666015625, -3.84716796875, -3.461669921875, -3.076171875, -2.690673828125, -2.30517578125, -1.919677734375, -1.5341796875, -1.148681640625, -0.76318359375, -0.377685546875, 0.0078125, 0.393310546875, 0.77880859375, 1.164306640625, 1.5498046875, 1.935302734375, 2.32080078125, 2.706298828125, 3.091796875, 3.477294921875, 3.86279296875, 4.248291015625, 4.6337890625, 5.019287109375, 5.40478515625, 5.790283203125, 6.17578125, 6.561279296875, 6.94677734375, 7.332275390625, 7.7177734375, 8.103271484375, 8.48876953125, 8.874267578125, 9.259765625, 9.645263671875, 10.03076171875, 10.416259765625, 10.8017578125, 11.187255859375, 11.57275390625, 11.958251953125, 12.34375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 11.0, 16.0, 17.0, 11.0, 22.0, 17.0, 29.0, 41.0, 28.0, 47.0, 56.0, 48.0, 60.0, 64.0, 69.0, 49.0, 59.0, 35.0, 44.0, 40.0, 44.0, 43.0, 24.0, 24.0, 17.0, 24.0, 11.0, 18.0, 10.0, 5.0, 4.0, 6.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8671875, -14.2974853515625, -13.727783203125, -13.1580810546875, -12.58837890625, -12.0186767578125, -11.448974609375, -10.8792724609375, -10.3095703125, -9.7398681640625, -9.170166015625, -8.6004638671875, -8.03076171875, -7.4610595703125, -6.891357421875, -6.3216552734375, -5.751953125, -5.1822509765625, -4.612548828125, -4.0428466796875, -3.47314453125, -2.9034423828125, -2.333740234375, -1.7640380859375, -1.1943359375, -0.6246337890625, -0.054931640625, 0.5147705078125, 1.08447265625, 1.6541748046875, 2.223876953125, 2.7935791015625, 3.36328125, 3.9329833984375, 4.502685546875, 5.0723876953125, 5.64208984375, 6.2117919921875, 6.781494140625, 7.3511962890625, 7.9208984375, 8.4906005859375, 9.060302734375, 9.6300048828125, 10.19970703125, 10.7694091796875, 11.339111328125, 11.9088134765625, 12.478515625, 13.0482177734375, 13.617919921875, 14.1876220703125, 14.75732421875, 15.3270263671875, 15.896728515625, 16.4664306640625, 17.0361328125, 17.6058349609375, 18.175537109375, 18.7452392578125, 19.31494140625, 19.8846435546875, 20.454345703125, 21.0240478515625, 21.59375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 7.0, 11.0, 22.0, 23.0, 33.0, 66.0, 114.0, 190.0, 314.0, 621.0, 1198.0, 2557.0, 6322.0, 19009.0, 74269.0, 512086.0, 334012.0, 68863.0, 17731.0, 6056.0, 2510.0, 1168.0, 601.0, 316.0, 161.0, 102.0, 82.0, 29.0, 28.0, 17.0, 8.0, 9.0, 10.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875, -3.077484130859375, -2.96746826171875, -2.857452392578125, -2.7474365234375, -2.637420654296875, -2.52740478515625, -2.417388916015625, -2.307373046875, -2.197357177734375, -2.08734130859375, -1.977325439453125, -1.8673095703125, -1.757293701171875, -1.64727783203125, -1.537261962890625, -1.42724609375, -1.317230224609375, -1.20721435546875, -1.097198486328125, -0.9871826171875, -0.877166748046875, -0.76715087890625, -0.657135009765625, -0.547119140625, -0.437103271484375, -0.32708740234375, -0.217071533203125, -0.1070556640625, 0.002960205078125, 0.11297607421875, 0.222991943359375, 0.3330078125, 0.443023681640625, 0.55303955078125, 0.663055419921875, 0.7730712890625, 0.883087158203125, 0.99310302734375, 1.103118896484375, 1.213134765625, 1.323150634765625, 1.43316650390625, 1.543182373046875, 1.6531982421875, 1.763214111328125, 1.87322998046875, 1.983245849609375, 2.09326171875, 2.203277587890625, 2.31329345703125, 2.423309326171875, 2.5333251953125, 2.643341064453125, 2.75335693359375, 2.863372802734375, 2.973388671875, 3.083404541015625, 3.19342041015625, 3.303436279296875, 3.4134521484375, 3.523468017578125, 3.63348388671875, 3.743499755859375, 3.853515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 6.0, 12.0, 29.0, 26.0, 48.0, 58.0, 78.0, 117.0, 110.0, 103.0, 104.0, 82.0, 55.0, 42.0, 31.0, 19.0, 14.0, 10.0, 13.0, 5.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012664794921875, -0.0012311935424804688, -0.0011959075927734375, -0.0011606216430664062, -0.001125335693359375, -0.0010900497436523438, -0.0010547637939453125, -0.0010194778442382812, -0.00098419189453125, -0.0009489059448242188, -0.0009136199951171875, -0.0008783340454101562, -0.000843048095703125, -0.0008077621459960938, -0.0007724761962890625, -0.0007371902465820312, -0.000701904296875, -0.0006666183471679688, -0.0006313323974609375, -0.0005960464477539062, -0.000560760498046875, -0.0005254745483398438, -0.0004901885986328125, -0.00045490264892578125, -0.00041961669921875, -0.00038433074951171875, -0.0003490447998046875, -0.00031375885009765625, -0.000278472900390625, -0.00024318695068359375, -0.0002079010009765625, -0.00017261505126953125, -0.0001373291015625, -0.00010204315185546875, -6.67572021484375e-05, -3.147125244140625e-05, 3.814697265625e-06, 3.910064697265625e-05, 7.43865966796875e-05, 0.00010967254638671875, 0.00014495849609375, 0.00018024444580078125, 0.0002155303955078125, 0.00025081634521484375, 0.000286102294921875, 0.00032138824462890625, 0.0003566741943359375, 0.00039196014404296875, 0.00042724609375, 0.00046253204345703125, 0.0004978179931640625, 0.0005331039428710938, 0.000568389892578125, 0.0006036758422851562, 0.0006389617919921875, 0.0006742477416992188, 0.00070953369140625, 0.0007448196411132812, 0.0007801055908203125, 0.0008153915405273438, 0.000850677490234375, 0.0008859634399414062, 0.0009212493896484375, 0.0009565353393554688, 0.0009918212890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 13.0, 22.0, 24.0, 43.0, 44.0, 92.0, 153.0, 290.0, 552.0, 1234.0, 2568.0, 6464.0, 18455.0, 64486.0, 268754.0, 546672.0, 97176.0, 26126.0, 8826.0, 3595.0, 1476.0, 652.0, 340.0, 195.0, 92.0, 64.0, 33.0, 25.0, 20.0, 16.0, 14.0, 9.0, 4.0, 7.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0078125, -3.896942138671875, -3.78607177734375, -3.675201416015625, -3.5643310546875, -3.453460693359375, -3.34259033203125, -3.231719970703125, -3.120849609375, -3.009979248046875, -2.89910888671875, -2.788238525390625, -2.6773681640625, -2.566497802734375, -2.45562744140625, -2.344757080078125, -2.23388671875, -2.123016357421875, -2.01214599609375, -1.901275634765625, -1.7904052734375, -1.679534912109375, -1.56866455078125, -1.457794189453125, -1.346923828125, -1.236053466796875, -1.12518310546875, -1.014312744140625, -0.9034423828125, -0.792572021484375, -0.68170166015625, -0.570831298828125, -0.4599609375, -0.349090576171875, -0.23822021484375, -0.127349853515625, -0.0164794921875, 0.094390869140625, 0.20526123046875, 0.316131591796875, 0.427001953125, 0.537872314453125, 0.64874267578125, 0.759613037109375, 0.8704833984375, 0.981353759765625, 1.09222412109375, 1.203094482421875, 1.31396484375, 1.424835205078125, 1.53570556640625, 1.646575927734375, 1.7574462890625, 1.868316650390625, 1.97918701171875, 2.090057373046875, 2.200927734375, 2.311798095703125, 2.42266845703125, 2.533538818359375, 2.6444091796875, 2.755279541015625, 2.86614990234375, 2.977020263671875, 3.087890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 12.0, 11.0, 16.0, 17.0, 13.0, 17.0, 37.0, 50.0, 58.0, 67.0, 62.0, 88.0, 62.0, 70.0, 61.0, 69.0, 51.0, 51.0, 26.0, 27.0, 25.0, 23.0, 18.0, 12.0, 12.0, 5.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.640625, -3.54388427734375, -3.4471435546875, -3.35040283203125, -3.253662109375, -3.15692138671875, -3.0601806640625, -2.96343994140625, -2.86669921875, -2.76995849609375, -2.6732177734375, -2.57647705078125, -2.479736328125, -2.38299560546875, -2.2862548828125, -2.18951416015625, -2.0927734375, -1.99603271484375, -1.8992919921875, -1.80255126953125, -1.705810546875, -1.60906982421875, -1.5123291015625, -1.41558837890625, -1.31884765625, -1.22210693359375, -1.1253662109375, -1.02862548828125, -0.931884765625, -0.83514404296875, -0.7384033203125, -0.64166259765625, -0.544921875, -0.44818115234375, -0.3514404296875, -0.25469970703125, -0.157958984375, -0.06121826171875, 0.0355224609375, 0.13226318359375, 0.22900390625, 0.32574462890625, 0.4224853515625, 0.51922607421875, 0.615966796875, 0.71270751953125, 0.8094482421875, 0.90618896484375, 1.0029296875, 1.09967041015625, 1.1964111328125, 1.29315185546875, 1.389892578125, 1.48663330078125, 1.5833740234375, 1.68011474609375, 1.77685546875, 1.87359619140625, 1.9703369140625, 2.06707763671875, 2.163818359375, 2.26055908203125, 2.3572998046875, 2.45404052734375, 2.55078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 23.0, 35.0, 64.0, 99.0, 213.0, 234.0, 148.0, 78.0, 39.0, 15.0, 11.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.12248992919922, -60.266807556152344, -57.41112518310547, -54.555442810058594, -51.69976043701172, -48.844078063964844, -45.98839569091797, -43.132713317871094, -40.27703094482422, -37.421348571777344, -34.56566619873047, -31.709983825683594, -28.85430145263672, -25.998619079589844, -23.14293670654297, -20.287254333496094, -17.43157196044922, -14.575889587402344, -11.720207214355469, -8.864524841308594, -6.008842468261719, -3.1531600952148438, -0.29747772216796875, 2.5582046508789062, 5.413887023925781, 8.269569396972656, 11.125251770019531, 13.980934143066406, 16.83661651611328, 19.692298889160156, 22.54798126220703, 25.403663635253906, 28.25933837890625, 31.115020751953125, 33.970703125, 36.826385498046875, 39.68206787109375, 42.537750244140625, 45.3934326171875, 48.249114990234375, 51.10479736328125, 53.960479736328125, 56.816162109375, 59.671844482421875, 62.52752685546875, 65.38320922851562, 68.2388916015625, 71.09457397460938, 73.95025634765625, 76.80593872070312, 79.66162109375, 82.51730346679688, 85.37298583984375, 88.22866821289062, 91.0843505859375, 93.94003295898438, 96.79571533203125, 99.65139770507812, 102.507080078125, 105.36276245117188, 108.21844482421875, 111.07412719726562, 113.9298095703125, 116.78549194335938, 119.64117431640625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 6.0, 5.0, 9.0, 7.0, 11.0, 18.0, 17.0, 18.0, 16.0, 20.0, 27.0, 31.0, 39.0, 37.0, 51.0, 65.0, 72.0, 83.0, 74.0, 48.0, 47.0, 39.0, 35.0, 31.0, 19.0, 25.0, 19.0, 21.0, 15.0, 15.0, 8.0, 12.0, 6.0, 15.0, 8.0, 5.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.111228942871094, -57.178802490234375, -55.24637222290039, -53.31394577026367, -51.38151550292969, -49.44908905029297, -47.51666259765625, -45.584232330322266, -43.65180587768555, -41.71937942504883, -39.786949157714844, -37.854522705078125, -35.92209243774414, -33.98966598510742, -32.05723571777344, -30.12480926513672, -28.192380905151367, -26.259952545166016, -24.327524185180664, -22.395095825195312, -20.462669372558594, -18.530241012573242, -16.59781265258789, -14.665385246276855, -12.732956886291504, -10.800528526306152, -8.868101119995117, -6.935672760009766, -5.003244876861572, -3.070816993713379, -1.1383886337280273, 0.7940387725830078, 2.7264671325683594, 4.658895015716553, 6.591322898864746, 8.523751258850098, 10.456178665161133, 12.388607025146484, 14.321035385131836, 16.253463745117188, 18.185890197753906, 20.118318557739258, 22.05074691772461, 23.983173370361328, 25.91560173034668, 27.84803009033203, 29.780458450317383, 31.712886810302734, 33.64531707763672, 35.57774353027344, 37.51017379760742, 39.44260025024414, 41.375030517578125, 43.307456970214844, 45.23988342285156, 47.17231369018555, 49.104740142822266, 51.037166595458984, 52.96959686279297, 54.90202331542969, 56.83445358276367, 58.76688003540039, 60.699310302734375, 62.631736755371094, 64.56416320800781]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 10.0, 16.0, 27.0, 35.0, 49.0, 102.0, 171.0, 349.0, 733.0, 1785.0, 5224.0, 21369.0, 263109.0, 3478944.0, 389039.0, 24667.0, 5404.0, 1759.0, 703.0, 317.0, 184.0, 99.0, 68.0, 43.0, 25.0, 16.0, 11.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.484375, -12.123046875, -11.76171875, -11.400390625, -11.0390625, -10.677734375, -10.31640625, -9.955078125, -9.59375, -9.232421875, -8.87109375, -8.509765625, -8.1484375, -7.787109375, -7.42578125, -7.064453125, -6.703125, -6.341796875, -5.98046875, -5.619140625, -5.2578125, -4.896484375, -4.53515625, -4.173828125, -3.8125, -3.451171875, -3.08984375, -2.728515625, -2.3671875, -2.005859375, -1.64453125, -1.283203125, -0.921875, -0.560546875, -0.19921875, 0.162109375, 0.5234375, 0.884765625, 1.24609375, 1.607421875, 1.96875, 2.330078125, 2.69140625, 3.052734375, 3.4140625, 3.775390625, 4.13671875, 4.498046875, 4.859375, 5.220703125, 5.58203125, 5.943359375, 6.3046875, 6.666015625, 7.02734375, 7.388671875, 7.75, 8.111328125, 8.47265625, 8.833984375, 9.1953125, 9.556640625, 9.91796875, 10.279296875, 10.640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 11.0, 14.0, 15.0, 30.0, 29.0, 26.0, 46.0, 40.0, 38.0, 39.0, 53.0, 42.0, 60.0, 63.0, 55.0, 46.0, 40.0, 62.0, 35.0, 60.0, 27.0, 38.0, 26.0, 23.0, 18.0, 12.0, 13.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.595703125, -3.443511962890625, -3.29132080078125, -3.139129638671875, -2.9869384765625, -2.834747314453125, -2.68255615234375, -2.530364990234375, -2.378173828125, -2.225982666015625, -2.07379150390625, -1.921600341796875, -1.7694091796875, -1.617218017578125, -1.46502685546875, -1.312835693359375, -1.16064453125, -1.008453369140625, -0.85626220703125, -0.704071044921875, -0.5518798828125, -0.399688720703125, -0.24749755859375, -0.095306396484375, 0.056884765625, 0.209075927734375, 0.36126708984375, 0.513458251953125, 0.6656494140625, 0.817840576171875, 0.97003173828125, 1.122222900390625, 1.2744140625, 1.426605224609375, 1.57879638671875, 1.730987548828125, 1.8831787109375, 2.035369873046875, 2.18756103515625, 2.339752197265625, 2.491943359375, 2.644134521484375, 2.79632568359375, 2.948516845703125, 3.1007080078125, 3.252899169921875, 3.40509033203125, 3.557281494140625, 3.70947265625, 3.861663818359375, 4.01385498046875, 4.166046142578125, 4.3182373046875, 4.470428466796875, 4.62261962890625, 4.774810791015625, 4.927001953125, 5.079193115234375, 5.23138427734375, 5.383575439453125, 5.5357666015625, 5.687957763671875, 5.84014892578125, 5.992340087890625, 6.14453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 15.0, 19.0, 41.0, 68.0, 176.0, 470.0, 2039.0, 31543.0, 4088515.0, 67474.0, 2952.0, 575.0, 182.0, 88.0, 51.0, 27.0, 20.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.46875, -32.4091796875, -31.349609375, -30.2900390625, -29.23046875, -28.1708984375, -27.111328125, -26.0517578125, -24.9921875, -23.9326171875, -22.873046875, -21.8134765625, -20.75390625, -19.6943359375, -18.634765625, -17.5751953125, -16.515625, -15.4560546875, -14.396484375, -13.3369140625, -12.27734375, -11.2177734375, -10.158203125, -9.0986328125, -8.0390625, -6.9794921875, -5.919921875, -4.8603515625, -3.80078125, -2.7412109375, -1.681640625, -0.6220703125, 0.4375, 1.4970703125, 2.556640625, 3.6162109375, 4.67578125, 5.7353515625, 6.794921875, 7.8544921875, 8.9140625, 9.9736328125, 11.033203125, 12.0927734375, 13.15234375, 14.2119140625, 15.271484375, 16.3310546875, 17.390625, 18.4501953125, 19.509765625, 20.5693359375, 21.62890625, 22.6884765625, 23.748046875, 24.8076171875, 25.8671875, 26.9267578125, 27.986328125, 29.0458984375, 30.10546875, 31.1650390625, 32.224609375, 33.2841796875, 34.34375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 12.0, 10.0, 15.0, 26.0, 38.0, 52.0, 76.0, 159.0, 316.0, 581.0, 841.0, 771.0, 530.0, 250.0, 146.0, 73.0, 59.0, 34.0, 13.0, 12.0, 9.0, 12.0, 9.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.2371826171875, -8.864990234375, -8.4927978515625, -8.12060546875, -7.7484130859375, -7.376220703125, -7.0040283203125, -6.6318359375, -6.2596435546875, -5.887451171875, -5.5152587890625, -5.14306640625, -4.7708740234375, -4.398681640625, -4.0264892578125, -3.654296875, -3.2821044921875, -2.909912109375, -2.5377197265625, -2.16552734375, -1.7933349609375, -1.421142578125, -1.0489501953125, -0.6767578125, -0.3045654296875, 0.067626953125, 0.4398193359375, 0.81201171875, 1.1842041015625, 1.556396484375, 1.9285888671875, 2.30078125, 2.6729736328125, 3.045166015625, 3.4173583984375, 3.78955078125, 4.1617431640625, 4.533935546875, 4.9061279296875, 5.2783203125, 5.6505126953125, 6.022705078125, 6.3948974609375, 6.76708984375, 7.1392822265625, 7.511474609375, 7.8836669921875, 8.255859375, 8.6280517578125, 9.000244140625, 9.3724365234375, 9.74462890625, 10.1168212890625, 10.489013671875, 10.8612060546875, 11.2333984375, 11.6055908203125, 11.977783203125, 12.3499755859375, 12.72216796875, 13.0943603515625, 13.466552734375, 13.8387451171875, 14.2109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 11.0, 32.0, 47.0, 110.0, 211.0, 231.0, 165.0, 91.0, 44.0, 20.0, 15.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-178.6913604736328, -174.558837890625, -170.42630004882812, -166.2937774658203, -162.1612548828125, -158.02871704101562, -153.8961944580078, -149.763671875, -145.63113403320312, -141.4986114501953, -137.36607360839844, -133.23355102539062, -129.1010284423828, -124.96849822998047, -120.83596801757812, -116.70344543457031, -112.5709228515625, -108.43839263916016, -104.30587005615234, -100.17333984375, -96.04081726074219, -91.90828704833984, -87.7757568359375, -83.64323425292969, -79.51070404052734, -75.378173828125, -71.24565124511719, -67.11312103271484, -62.980594635009766, -58.84806823730469, -54.715538024902344, -50.583011627197266, -46.45048522949219, -42.31795883178711, -38.18543243408203, -34.05290222167969, -29.92037582397461, -25.78784942626953, -21.65532112121582, -17.52279281616211, -13.390266418457031, -9.257739067077637, -5.125211715698242, -0.9926843643188477, 3.139842987060547, 7.272369384765625, 11.404897689819336, 15.537425994873047, 19.669952392578125, 23.802478790283203, 27.935007095336914, 32.067535400390625, 36.2000617980957, 40.33258819580078, 44.465118408203125, 48.5976448059082, 52.73017120361328, 56.86269760131836, 60.99522399902344, 65.12775421142578, 69.26028442382812, 73.39280700683594, 77.52533721923828, 81.65786743164062, 85.79039001464844]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 10.0, 12.0, 11.0, 26.0, 18.0, 18.0, 31.0, 25.0, 34.0, 42.0, 48.0, 44.0, 48.0, 58.0, 59.0, 58.0, 37.0, 50.0, 55.0, 49.0, 34.0, 35.0, 36.0, 27.0, 30.0, 26.0, 17.0, 8.0, 6.0, 9.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.94472885131836, -46.5534553527832, -45.16218566894531, -43.770912170410156, -42.379642486572266, -40.98836898803711, -39.59709930419922, -38.20582580566406, -36.81455612182617, -35.423282623291016, -34.032012939453125, -32.64073944091797, -31.249469757080078, -29.858198165893555, -28.46692657470703, -27.075653076171875, -25.68438148498535, -24.293109893798828, -22.901838302612305, -21.51056671142578, -20.119295120239258, -18.728023529052734, -17.336750030517578, -15.945479393005371, -14.554207801818848, -13.162936210632324, -11.7716646194458, -10.380392074584961, -8.989120483398438, -7.597849369049072, -6.206577301025391, -4.815305709838867, -3.4240341186523438, -2.0327625274658203, -0.6414906978607178, 0.7497811317443848, 2.141052722930908, 3.5323243141174316, 4.923596382141113, 6.314867973327637, 7.70613956451416, 9.097411155700684, 10.488682746887207, 11.879955291748047, 13.27122688293457, 14.662498474121094, 16.053770065307617, 17.44504165649414, 18.836313247680664, 20.227584838867188, 21.61885643005371, 23.010128021240234, 24.401399612426758, 25.79267120361328, 27.183944702148438, 28.575214385986328, 29.966487884521484, 31.357759475708008, 32.74903106689453, 34.14030456542969, 35.53157424926758, 36.922847747802734, 38.314117431640625, 39.70539093017578, 41.09666061401367]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 4.0, 11.0, 17.0, 21.0, 27.0, 49.0, 71.0, 131.0, 228.0, 427.0, 858.0, 1868.0, 4477.0, 12150.0, 39552.0, 160371.0, 532359.0, 219814.0, 50894.0, 15423.0, 5439.0, 2205.0, 998.0, 482.0, 252.0, 163.0, 88.0, 58.0, 30.0, 17.0, 21.0, 6.0, 10.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.3885498046875, -7.120849609375, -6.8531494140625, -6.58544921875, -6.3177490234375, -6.050048828125, -5.7823486328125, -5.5146484375, -5.2469482421875, -4.979248046875, -4.7115478515625, -4.44384765625, -4.1761474609375, -3.908447265625, -3.6407470703125, -3.373046875, -3.1053466796875, -2.837646484375, -2.5699462890625, -2.30224609375, -2.0345458984375, -1.766845703125, -1.4991455078125, -1.2314453125, -0.9637451171875, -0.696044921875, -0.4283447265625, -0.16064453125, 0.1070556640625, 0.374755859375, 0.6424560546875, 0.91015625, 1.1778564453125, 1.445556640625, 1.7132568359375, 1.98095703125, 2.2486572265625, 2.516357421875, 2.7840576171875, 3.0517578125, 3.3194580078125, 3.587158203125, 3.8548583984375, 4.12255859375, 4.3902587890625, 4.657958984375, 4.9256591796875, 5.193359375, 5.4610595703125, 5.728759765625, 5.9964599609375, 6.26416015625, 6.5318603515625, 6.799560546875, 7.0672607421875, 7.3349609375, 7.6026611328125, 7.870361328125, 8.1380615234375, 8.40576171875, 8.6734619140625, 8.941162109375, 9.2088623046875, 9.4765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 5.0, 12.0, 18.0, 32.0, 14.0, 22.0, 29.0, 27.0, 42.0, 49.0, 31.0, 50.0, 55.0, 57.0, 43.0, 60.0, 43.0, 49.0, 46.0, 48.0, 36.0, 45.0, 20.0, 30.0, 19.0, 21.0, 19.0, 22.0, 15.0, 6.0, 9.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8671875, -4.71954345703125, -4.5718994140625, -4.42425537109375, -4.276611328125, -4.12896728515625, -3.9813232421875, -3.83367919921875, -3.68603515625, -3.53839111328125, -3.3907470703125, -3.24310302734375, -3.095458984375, -2.94781494140625, -2.8001708984375, -2.65252685546875, -2.5048828125, -2.35723876953125, -2.2095947265625, -2.06195068359375, -1.914306640625, -1.76666259765625, -1.6190185546875, -1.47137451171875, -1.32373046875, -1.17608642578125, -1.0284423828125, -0.88079833984375, -0.733154296875, -0.58551025390625, -0.4378662109375, -0.29022216796875, -0.142578125, 0.00506591796875, 0.1527099609375, 0.30035400390625, 0.447998046875, 0.59564208984375, 0.7432861328125, 0.89093017578125, 1.03857421875, 1.18621826171875, 1.3338623046875, 1.48150634765625, 1.629150390625, 1.77679443359375, 1.9244384765625, 2.07208251953125, 2.2197265625, 2.36737060546875, 2.5150146484375, 2.66265869140625, 2.810302734375, 2.95794677734375, 3.1055908203125, 3.25323486328125, 3.40087890625, 3.54852294921875, 3.6961669921875, 3.84381103515625, 3.991455078125, 4.13909912109375, 4.2867431640625, 4.43438720703125, 4.58203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 8.0, 5.0, 9.0, 12.0, 27.0, 22.0, 44.0, 39.0, 56.0, 75.0, 144.0, 205.0, 366.0, 638.0, 1092.0, 2668.0, 8387.0, 44567.0, 620313.0, 322978.0, 34926.0, 7133.0, 2395.0, 1024.0, 491.0, 300.0, 196.0, 138.0, 87.0, 54.0, 41.0, 32.0, 26.0, 11.0, 10.0, 5.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.8515625, -10.463134765625, -10.07470703125, -9.686279296875, -9.2978515625, -8.909423828125, -8.52099609375, -8.132568359375, -7.744140625, -7.355712890625, -6.96728515625, -6.578857421875, -6.1904296875, -5.802001953125, -5.41357421875, -5.025146484375, -4.63671875, -4.248291015625, -3.85986328125, -3.471435546875, -3.0830078125, -2.694580078125, -2.30615234375, -1.917724609375, -1.529296875, -1.140869140625, -0.75244140625, -0.364013671875, 0.0244140625, 0.412841796875, 0.80126953125, 1.189697265625, 1.578125, 1.966552734375, 2.35498046875, 2.743408203125, 3.1318359375, 3.520263671875, 3.90869140625, 4.297119140625, 4.685546875, 5.073974609375, 5.46240234375, 5.850830078125, 6.2392578125, 6.627685546875, 7.01611328125, 7.404541015625, 7.79296875, 8.181396484375, 8.56982421875, 8.958251953125, 9.3466796875, 9.735107421875, 10.12353515625, 10.511962890625, 10.900390625, 11.288818359375, 11.67724609375, 12.065673828125, 12.4541015625, 12.842529296875, 13.23095703125, 13.619384765625, 14.0078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 17.0, 15.0, 14.0, 14.0, 29.0, 35.0, 31.0, 28.0, 47.0, 43.0, 56.0, 61.0, 67.0, 49.0, 57.0, 44.0, 48.0, 48.0, 34.0, 36.0, 33.0, 30.0, 22.0, 31.0, 14.0, 19.0, 11.0, 11.0, 6.0, 3.0, 4.0, 1.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-21.5, -20.9466552734375, -20.393310546875, -19.8399658203125, -19.28662109375, -18.7332763671875, -18.179931640625, -17.6265869140625, -17.0732421875, -16.5198974609375, -15.966552734375, -15.4132080078125, -14.85986328125, -14.3065185546875, -13.753173828125, -13.1998291015625, -12.646484375, -12.0931396484375, -11.539794921875, -10.9864501953125, -10.43310546875, -9.8797607421875, -9.326416015625, -8.7730712890625, -8.2197265625, -7.6663818359375, -7.113037109375, -6.5596923828125, -6.00634765625, -5.4530029296875, -4.899658203125, -4.3463134765625, -3.79296875, -3.2396240234375, -2.686279296875, -2.1329345703125, -1.57958984375, -1.0262451171875, -0.472900390625, 0.0804443359375, 0.6337890625, 1.1871337890625, 1.740478515625, 2.2938232421875, 2.84716796875, 3.4005126953125, 3.953857421875, 4.5072021484375, 5.060546875, 5.6138916015625, 6.167236328125, 6.7205810546875, 7.27392578125, 7.8272705078125, 8.380615234375, 8.9339599609375, 9.4873046875, 10.0406494140625, 10.593994140625, 11.1473388671875, 11.70068359375, 12.2540283203125, 12.807373046875, 13.3607177734375, 13.9140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 4.0, 7.0, 3.0, 5.0, 13.0, 17.0, 28.0, 27.0, 40.0, 52.0, 100.0, 154.0, 270.0, 468.0, 810.0, 1656.0, 3153.0, 7342.0, 18179.0, 54425.0, 276918.0, 580713.0, 66832.0, 21279.0, 8349.0, 3807.0, 1683.0, 948.0, 455.0, 293.0, 164.0, 90.0, 64.0, 45.0, 37.0, 30.0, 25.0, 17.0, 8.0, 11.0, 8.0, 4.0, 6.0, 2.0, 1.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.282440185546875, -3.18011474609375, -3.077789306640625, -2.9754638671875, -2.873138427734375, -2.77081298828125, -2.668487548828125, -2.566162109375, -2.463836669921875, -2.36151123046875, -2.259185791015625, -2.1568603515625, -2.054534912109375, -1.95220947265625, -1.849884033203125, -1.74755859375, -1.645233154296875, -1.54290771484375, -1.440582275390625, -1.3382568359375, -1.235931396484375, -1.13360595703125, -1.031280517578125, -0.928955078125, -0.826629638671875, -0.72430419921875, -0.621978759765625, -0.5196533203125, -0.417327880859375, -0.31500244140625, -0.212677001953125, -0.1103515625, -0.008026123046875, 0.09429931640625, 0.196624755859375, 0.2989501953125, 0.401275634765625, 0.50360107421875, 0.605926513671875, 0.708251953125, 0.810577392578125, 0.91290283203125, 1.015228271484375, 1.1175537109375, 1.219879150390625, 1.32220458984375, 1.424530029296875, 1.52685546875, 1.629180908203125, 1.73150634765625, 1.833831787109375, 1.9361572265625, 2.038482666015625, 2.14080810546875, 2.243133544921875, 2.345458984375, 2.447784423828125, 2.55010986328125, 2.652435302734375, 2.7547607421875, 2.857086181640625, 2.95941162109375, 3.061737060546875, 3.1640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 10.0, 4.0, 7.0, 8.0, 18.0, 15.0, 18.0, 38.0, 41.0, 66.0, 96.0, 117.0, 116.0, 90.0, 66.0, 59.0, 40.0, 33.0, 31.0, 15.0, 17.0, 12.0, 10.0, 6.0, 11.0, 4.0, 8.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0009512901306152344, -0.0009226873517036438, -0.0008940845727920532, -0.0008654817938804626, -0.0008368790149688721, -0.0008082762360572815, -0.0007796734571456909, -0.0007510706782341003, -0.0007224678993225098, -0.0006938651204109192, -0.0006652623414993286, -0.000636659562587738, -0.0006080567836761475, -0.0005794540047645569, -0.0005508512258529663, -0.0005222484469413757, -0.0004936456680297852, -0.0004650428891181946, -0.000436440110206604, -0.00040783733129501343, -0.00037923455238342285, -0.0003506317734718323, -0.0003220289945602417, -0.0002934262156486511, -0.00026482343673706055, -0.00023622065782546997, -0.0002076178789138794, -0.00017901510000228882, -0.00015041232109069824, -0.00012180954217910767, -9.320676326751709e-05, -6.460398435592651e-05, -3.600120544433594e-05, -7.398426532745361e-06, 2.1204352378845215e-05, 4.980713129043579e-05, 7.840991020202637e-05, 0.00010701268911361694, 0.00013561546802520752, 0.0001642182469367981, 0.00019282102584838867, 0.00022142380475997925, 0.0002500265836715698, 0.0002786293625831604, 0.000307232141494751, 0.00033583492040634155, 0.00036443769931793213, 0.0003930404782295227, 0.0004216432571411133, 0.00045024603605270386, 0.00047884881496429443, 0.000507451593875885, 0.0005360543727874756, 0.0005646571516990662, 0.0005932599306106567, 0.0006218627095222473, 0.0006504654884338379, 0.0006790682673454285, 0.000707671046257019, 0.0007362738251686096, 0.0007648766040802002, 0.0007934793829917908, 0.0008220821619033813, 0.0008506849408149719, 0.0008792877197265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 7.0, 6.0, 21.0, 12.0, 25.0, 39.0, 68.0, 122.0, 186.0, 436.0, 856.0, 2082.0, 6174.0, 23047.0, 133069.0, 770712.0, 86435.0, 17031.0, 4988.0, 1742.0, 717.0, 329.0, 184.0, 93.0, 70.0, 39.0, 28.0, 14.0, 6.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.490631103515625, -3.33477783203125, -3.178924560546875, -3.0230712890625, -2.867218017578125, -2.71136474609375, -2.555511474609375, -2.399658203125, -2.243804931640625, -2.08795166015625, -1.932098388671875, -1.7762451171875, -1.620391845703125, -1.46453857421875, -1.308685302734375, -1.15283203125, -0.996978759765625, -0.84112548828125, -0.685272216796875, -0.5294189453125, -0.373565673828125, -0.21771240234375, -0.061859130859375, 0.093994140625, 0.249847412109375, 0.40570068359375, 0.561553955078125, 0.7174072265625, 0.873260498046875, 1.02911376953125, 1.184967041015625, 1.3408203125, 1.496673583984375, 1.65252685546875, 1.808380126953125, 1.9642333984375, 2.120086669921875, 2.27593994140625, 2.431793212890625, 2.587646484375, 2.743499755859375, 2.89935302734375, 3.055206298828125, 3.2110595703125, 3.366912841796875, 3.52276611328125, 3.678619384765625, 3.83447265625, 3.990325927734375, 4.14617919921875, 4.302032470703125, 4.4578857421875, 4.613739013671875, 4.76959228515625, 4.925445556640625, 5.081298828125, 5.237152099609375, 5.39300537109375, 5.548858642578125, 5.7047119140625, 5.860565185546875, 6.01641845703125, 6.172271728515625, 6.328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 10.0, 7.0, 3.0, 9.0, 11.0, 14.0, 24.0, 30.0, 42.0, 34.0, 47.0, 94.0, 123.0, 140.0, 116.0, 82.0, 53.0, 35.0, 23.0, 27.0, 25.0, 11.0, 15.0, 5.0, 5.0, 7.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7421875, -3.61041259765625, -3.4786376953125, -3.34686279296875, -3.215087890625, -3.08331298828125, -2.9515380859375, -2.81976318359375, -2.68798828125, -2.55621337890625, -2.4244384765625, -2.29266357421875, -2.160888671875, -2.02911376953125, -1.8973388671875, -1.76556396484375, -1.6337890625, -1.50201416015625, -1.3702392578125, -1.23846435546875, -1.106689453125, -0.97491455078125, -0.8431396484375, -0.71136474609375, -0.57958984375, -0.44781494140625, -0.3160400390625, -0.18426513671875, -0.052490234375, 0.07928466796875, 0.2110595703125, 0.34283447265625, 0.474609375, 0.60638427734375, 0.7381591796875, 0.86993408203125, 1.001708984375, 1.13348388671875, 1.2652587890625, 1.39703369140625, 1.52880859375, 1.66058349609375, 1.7923583984375, 1.92413330078125, 2.055908203125, 2.18768310546875, 2.3194580078125, 2.45123291015625, 2.5830078125, 2.71478271484375, 2.8465576171875, 2.97833251953125, 3.110107421875, 3.24188232421875, 3.3736572265625, 3.50543212890625, 3.63720703125, 3.76898193359375, 3.9007568359375, 4.03253173828125, 4.164306640625, 4.29608154296875, 4.4278564453125, 4.55963134765625, 4.69140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 8.0, 38.0, 66.0, 128.0, 326.0, 202.0, 95.0, 51.0, 25.0, 20.0, 11.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.0772933959961, -72.72566223144531, -69.37403106689453, -66.02239990234375, -62.6707763671875, -59.31914520263672, -55.96751403808594, -52.615882873535156, -49.26425552368164, -45.91262435913086, -42.560997009277344, -39.20936584472656, -35.85773468017578, -32.506107330322266, -29.154476165771484, -25.802846908569336, -22.451217651367188, -19.09958839416504, -15.747958183288574, -12.39632797241211, -9.044698715209961, -5.6930694580078125, -2.3414382934570312, 1.0101909637451172, 4.361820220947266, 7.713449954986572, 11.065079689025879, 14.416709899902344, 17.768339157104492, 21.11996841430664, 24.471599578857422, 27.82322883605957, 31.17486572265625, 34.52649688720703, 37.87812423706055, 41.22975540161133, 44.581382751464844, 47.933013916015625, 51.284645080566406, 54.63627624511719, 57.9879035949707, 61.339534759521484, 64.691162109375, 68.04279327392578, 71.39442443847656, 74.74604797363281, 78.09768676757812, 81.44931030273438, 84.80094146728516, 88.15257263183594, 91.50420379638672, 94.8558349609375, 98.20745849609375, 101.55908966064453, 104.91072082519531, 108.2623519897461, 111.61398315429688, 114.96561431884766, 118.31724548339844, 121.66886901855469, 125.02050018310547, 128.37213134765625, 131.7237548828125, 135.0753936767578, 138.42701721191406]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 10.0, 7.0, 7.0, 21.0, 16.0, 26.0, 21.0, 23.0, 31.0, 33.0, 29.0, 40.0, 47.0, 104.0, 142.0, 101.0, 52.0, 42.0, 37.0, 35.0, 28.0, 21.0, 26.0, 21.0, 14.0, 16.0, 10.0, 11.0, 5.0, 6.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-109.59367370605469, -106.89695739746094, -104.20023345947266, -101.5035171508789, -98.80680084228516, -96.1100845336914, -93.41336059570312, -90.71664428710938, -88.01992797851562, -85.32321166992188, -82.6264877319336, -79.92977142333984, -77.2330551147461, -74.53633880615234, -71.83961486816406, -69.14289855957031, -66.44618225097656, -63.74946212768555, -61.0527458190918, -58.35602569580078, -55.65930938720703, -52.962589263916016, -50.265869140625, -47.56915283203125, -44.87242889404297, -42.17570877075195, -39.4789924621582, -36.78227233886719, -34.08555603027344, -31.388835906982422, -28.69211769104004, -25.995399475097656, -23.298683166503906, -20.601964950561523, -17.90524673461914, -15.208527565002441, -12.511809349060059, -9.815091133117676, -7.118371963500977, -4.421653747558594, -1.724935531616211, 0.971782922744751, 3.668501377105713, 6.365220069885254, 9.061938285827637, 11.75865650177002, 14.455375671386719, 17.1520938873291, 19.848812103271484, 22.545530319213867, 25.24224853515625, 27.938968658447266, 30.635684967041016, 33.33240509033203, 36.02912139892578, 38.7258415222168, 41.42256164550781, 44.11928176879883, 46.81599807739258, 49.512718200683594, 52.209434509277344, 54.90615463256836, 57.602874755859375, 60.299591064453125, 62.996307373046875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 5.0, 13.0, 13.0, 21.0, 41.0, 54.0, 94.0, 136.0, 219.0, 416.0, 800.0, 1540.0, 3409.0, 9770.0, 50205.0, 866719.0, 2967832.0, 256902.0, 24542.0, 6435.0, 2507.0, 1143.0, 648.0, 328.0, 183.0, 108.0, 74.0, 40.0, 25.0, 25.0, 10.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.5048828125, -10.189453125, -9.8740234375, -9.55859375, -9.2431640625, -8.927734375, -8.6123046875, -8.296875, -7.9814453125, -7.666015625, -7.3505859375, -7.03515625, -6.7197265625, -6.404296875, -6.0888671875, -5.7734375, -5.4580078125, -5.142578125, -4.8271484375, -4.51171875, -4.1962890625, -3.880859375, -3.5654296875, -3.25, -2.9345703125, -2.619140625, -2.3037109375, -1.98828125, -1.6728515625, -1.357421875, -1.0419921875, -0.7265625, -0.4111328125, -0.095703125, 0.2197265625, 0.53515625, 0.8505859375, 1.166015625, 1.4814453125, 1.796875, 2.1123046875, 2.427734375, 2.7431640625, 3.05859375, 3.3740234375, 3.689453125, 4.0048828125, 4.3203125, 4.6357421875, 4.951171875, 5.2666015625, 5.58203125, 5.8974609375, 6.212890625, 6.5283203125, 6.84375, 7.1591796875, 7.474609375, 7.7900390625, 8.10546875, 8.4208984375, 8.736328125, 9.0517578125, 9.3671875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 4.0, 12.0, 11.0, 15.0, 20.0, 38.0, 32.0, 46.0, 46.0, 57.0, 52.0, 59.0, 74.0, 68.0, 71.0, 69.0, 49.0, 60.0, 50.0, 31.0, 22.0, 32.0, 21.0, 15.0, 14.0, 12.0, 7.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.74609375, -6.5494384765625, -6.352783203125, -6.1561279296875, -5.95947265625, -5.7628173828125, -5.566162109375, -5.3695068359375, -5.1728515625, -4.9761962890625, -4.779541015625, -4.5828857421875, -4.38623046875, -4.1895751953125, -3.992919921875, -3.7962646484375, -3.599609375, -3.4029541015625, -3.206298828125, -3.0096435546875, -2.81298828125, -2.6163330078125, -2.419677734375, -2.2230224609375, -2.0263671875, -1.8297119140625, -1.633056640625, -1.4364013671875, -1.23974609375, -1.0430908203125, -0.846435546875, -0.6497802734375, -0.453125, -0.2564697265625, -0.059814453125, 0.1368408203125, 0.33349609375, 0.5301513671875, 0.726806640625, 0.9234619140625, 1.1201171875, 1.3167724609375, 1.513427734375, 1.7100830078125, 1.90673828125, 2.1033935546875, 2.300048828125, 2.4967041015625, 2.693359375, 2.8900146484375, 3.086669921875, 3.2833251953125, 3.47998046875, 3.6766357421875, 3.873291015625, 4.0699462890625, 4.2666015625, 4.4632568359375, 4.659912109375, 4.8565673828125, 5.05322265625, 5.2498779296875, 5.446533203125, 5.6431884765625, 5.83984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 14.0, 20.0, 23.0, 53.0, 116.0, 289.0, 943.0, 5010.0, 89740.0, 4011573.0, 79852.0, 5126.0, 960.0, 275.0, 111.0, 65.0, 30.0, 12.0, 16.0, 13.0, 6.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.3125, -22.5478515625, -21.783203125, -21.0185546875, -20.25390625, -19.4892578125, -18.724609375, -17.9599609375, -17.1953125, -16.4306640625, -15.666015625, -14.9013671875, -14.13671875, -13.3720703125, -12.607421875, -11.8427734375, -11.078125, -10.3134765625, -9.548828125, -8.7841796875, -8.01953125, -7.2548828125, -6.490234375, -5.7255859375, -4.9609375, -4.1962890625, -3.431640625, -2.6669921875, -1.90234375, -1.1376953125, -0.373046875, 0.3916015625, 1.15625, 1.9208984375, 2.685546875, 3.4501953125, 4.21484375, 4.9794921875, 5.744140625, 6.5087890625, 7.2734375, 8.0380859375, 8.802734375, 9.5673828125, 10.33203125, 11.0966796875, 11.861328125, 12.6259765625, 13.390625, 14.1552734375, 14.919921875, 15.6845703125, 16.44921875, 17.2138671875, 17.978515625, 18.7431640625, 19.5078125, 20.2724609375, 21.037109375, 21.8017578125, 22.56640625, 23.3310546875, 24.095703125, 24.8603515625, 25.625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 13.0, 12.0, 14.0, 21.0, 31.0, 45.0, 62.0, 71.0, 155.0, 230.0, 388.0, 546.0, 687.0, 576.0, 431.0, 288.0, 176.0, 91.0, 79.0, 49.0, 29.0, 17.0, 15.0, 9.0, 9.0, 6.0, 7.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.287841796875, -7.95068359375, -7.613525390625, -7.2763671875, -6.939208984375, -6.60205078125, -6.264892578125, -5.927734375, -5.590576171875, -5.25341796875, -4.916259765625, -4.5791015625, -4.241943359375, -3.90478515625, -3.567626953125, -3.23046875, -2.893310546875, -2.55615234375, -2.218994140625, -1.8818359375, -1.544677734375, -1.20751953125, -0.870361328125, -0.533203125, -0.196044921875, 0.14111328125, 0.478271484375, 0.8154296875, 1.152587890625, 1.48974609375, 1.826904296875, 2.1640625, 2.501220703125, 2.83837890625, 3.175537109375, 3.5126953125, 3.849853515625, 4.18701171875, 4.524169921875, 4.861328125, 5.198486328125, 5.53564453125, 5.872802734375, 6.2099609375, 6.547119140625, 6.88427734375, 7.221435546875, 7.55859375, 7.895751953125, 8.23291015625, 8.570068359375, 8.9072265625, 9.244384765625, 9.58154296875, 9.918701171875, 10.255859375, 10.593017578125, 10.93017578125, 11.267333984375, 11.6044921875, 11.941650390625, 12.27880859375, 12.615966796875, 12.953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 20.0, 82.0, 243.0, 374.0, 179.0, 67.0, 22.0, 9.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.60047912597656, -192.05999755859375, -185.51951599121094, -178.97903442382812, -172.4385528564453, -165.8980712890625, -159.35760498046875, -152.81710815429688, -146.27664184570312, -139.7361602783203, -133.1956787109375, -126.65519714355469, -120.11471557617188, -113.57423400878906, -107.03376007080078, -100.49327850341797, -93.95278930664062, -87.41230773925781, -80.871826171875, -74.33134460449219, -67.79086303710938, -61.25038528442383, -54.70990753173828, -48.16942596435547, -41.628944396972656, -35.088462829589844, -28.547983169555664, -22.007503509521484, -15.467021942138672, -8.92654037475586, -2.3860626220703125, 4.1544189453125, 10.694915771484375, 17.235397338867188, 23.775876998901367, 30.316356658935547, 36.85683822631836, 43.39731979370117, 49.93779754638672, 56.47827911376953, 63.018760681152344, 69.55924224853516, 76.09972381591797, 82.64019775390625, 89.18067932128906, 95.72116088867188, 102.26164245605469, 108.8021240234375, 115.34260559082031, 121.88308715820312, 128.42356872558594, 134.96405029296875, 141.50453186035156, 148.04501342773438, 154.58547973632812, 161.1259765625, 167.66644287109375, 174.20692443847656, 180.74740600585938, 187.2878875732422, 193.828369140625, 200.3688507080078, 206.90933227539062, 213.44979858398438, 219.99029541015625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 9.0, 3.0, 5.0, 8.0, 10.0, 11.0, 16.0, 9.0, 20.0, 16.0, 20.0, 30.0, 28.0, 33.0, 38.0, 42.0, 47.0, 43.0, 51.0, 41.0, 38.0, 41.0, 46.0, 41.0, 36.0, 39.0, 33.0, 37.0, 33.0, 20.0, 25.0, 24.0, 23.0, 17.0, 12.0, 12.0, 6.0, 14.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-47.3223876953125, -45.875431060791016, -44.428470611572266, -42.98151397705078, -41.5345573425293, -40.08760070800781, -38.64064025878906, -37.19368362426758, -35.746726989746094, -34.29977035522461, -32.85280990600586, -31.405853271484375, -29.95889663696289, -28.511938095092773, -27.064979553222656, -25.618022918701172, -24.171064376831055, -22.724105834960938, -21.277149200439453, -19.830190658569336, -18.38323402404785, -16.936275482177734, -15.489317893981934, -14.042360305786133, -12.595402717590332, -11.148445129394531, -9.70148754119873, -8.25452995300293, -6.807571887969971, -5.36061429977417, -3.913656234741211, -2.46669864654541, -1.0197410583496094, 0.42721664905548096, 1.8741743564605713, 3.321132183074951, 4.768089771270752, 6.215047359466553, 7.662005424499512, 9.108963012695312, 10.555920600891113, 12.002878189086914, 13.449835777282715, 14.896793365478516, 16.343751907348633, 17.790708541870117, 19.237667083740234, 20.68462371826172, 22.131582260131836, 23.578540802001953, 25.025497436523438, 26.472455978393555, 27.91941261291504, 29.366371154785156, 30.81332778930664, 32.260284423828125, 33.707244873046875, 35.15420150756836, 36.60116195678711, 38.048118591308594, 39.49507522583008, 40.94203186035156, 42.38899230957031, 43.8359489440918, 45.28290557861328]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 27.0, 29.0, 69.0, 67.0, 129.0, 251.0, 408.0, 827.0, 1587.0, 3437.0, 8132.0, 20684.0, 60677.0, 212830.0, 473546.0, 180741.0, 53259.0, 18302.0, 7268.0, 3150.0, 1399.0, 700.0, 387.0, 246.0, 142.0, 99.0, 41.0, 38.0, 14.0, 17.0, 12.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.68658447265625, -6.4669189453125, -6.24725341796875, -6.027587890625, -5.80792236328125, -5.5882568359375, -5.36859130859375, -5.14892578125, -4.92926025390625, -4.7095947265625, -4.48992919921875, -4.270263671875, -4.05059814453125, -3.8309326171875, -3.61126708984375, -3.3916015625, -3.17193603515625, -2.9522705078125, -2.73260498046875, -2.512939453125, -2.29327392578125, -2.0736083984375, -1.85394287109375, -1.63427734375, -1.41461181640625, -1.1949462890625, -0.97528076171875, -0.755615234375, -0.53594970703125, -0.3162841796875, -0.09661865234375, 0.123046875, 0.34271240234375, 0.5623779296875, 0.78204345703125, 1.001708984375, 1.22137451171875, 1.4410400390625, 1.66070556640625, 1.88037109375, 2.10003662109375, 2.3197021484375, 2.53936767578125, 2.759033203125, 2.97869873046875, 3.1983642578125, 3.41802978515625, 3.6376953125, 3.85736083984375, 4.0770263671875, 4.29669189453125, 4.516357421875, 4.73602294921875, 4.9556884765625, 5.17535400390625, 5.39501953125, 5.61468505859375, 5.8343505859375, 6.05401611328125, 6.273681640625, 6.49334716796875, 6.7130126953125, 6.93267822265625, 7.15234375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 10.0, 12.0, 10.0, 19.0, 21.0, 25.0, 34.0, 30.0, 41.0, 46.0, 45.0, 51.0, 63.0, 63.0, 48.0, 67.0, 46.0, 50.0, 44.0, 42.0, 48.0, 36.0, 29.0, 34.0, 21.0, 14.0, 8.0, 15.0, 4.0, 7.0, 3.0, 4.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -4.9976806640625, -4.815673828125, -4.6336669921875, -4.45166015625, -4.2696533203125, -4.087646484375, -3.9056396484375, -3.7236328125, -3.5416259765625, -3.359619140625, -3.1776123046875, -2.99560546875, -2.8135986328125, -2.631591796875, -2.4495849609375, -2.267578125, -2.0855712890625, -1.903564453125, -1.7215576171875, -1.53955078125, -1.3575439453125, -1.175537109375, -0.9935302734375, -0.8115234375, -0.6295166015625, -0.447509765625, -0.2655029296875, -0.08349609375, 0.0985107421875, 0.280517578125, 0.4625244140625, 0.64453125, 0.8265380859375, 1.008544921875, 1.1905517578125, 1.37255859375, 1.5545654296875, 1.736572265625, 1.9185791015625, 2.1005859375, 2.2825927734375, 2.464599609375, 2.6466064453125, 2.82861328125, 3.0106201171875, 3.192626953125, 3.3746337890625, 3.556640625, 3.7386474609375, 3.920654296875, 4.1026611328125, 4.28466796875, 4.4666748046875, 4.648681640625, 4.8306884765625, 5.0126953125, 5.1947021484375, 5.376708984375, 5.5587158203125, 5.74072265625, 5.9227294921875, 6.104736328125, 6.2867431640625, 6.46875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 10.0, 10.0, 14.0, 27.0, 49.0, 60.0, 116.0, 183.0, 386.0, 766.0, 2052.0, 13295.0, 854102.0, 168471.0, 6184.0, 1527.0, 595.0, 298.0, 137.0, 112.0, 51.0, 33.0, 21.0, 20.0, 12.0, 7.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.171875, -27.36328125, -26.5546875, -25.74609375, -24.9375, -24.12890625, -23.3203125, -22.51171875, -21.703125, -20.89453125, -20.0859375, -19.27734375, -18.46875, -17.66015625, -16.8515625, -16.04296875, -15.234375, -14.42578125, -13.6171875, -12.80859375, -12.0, -11.19140625, -10.3828125, -9.57421875, -8.765625, -7.95703125, -7.1484375, -6.33984375, -5.53125, -4.72265625, -3.9140625, -3.10546875, -2.296875, -1.48828125, -0.6796875, 0.12890625, 0.9375, 1.74609375, 2.5546875, 3.36328125, 4.171875, 4.98046875, 5.7890625, 6.59765625, 7.40625, 8.21484375, 9.0234375, 9.83203125, 10.640625, 11.44921875, 12.2578125, 13.06640625, 13.875, 14.68359375, 15.4921875, 16.30078125, 17.109375, 17.91796875, 18.7265625, 19.53515625, 20.34375, 21.15234375, 21.9609375, 22.76953125, 23.578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 12.0, 10.0, 18.0, 14.0, 36.0, 39.0, 42.0, 53.0, 77.0, 76.0, 68.0, 89.0, 78.0, 76.0, 63.0, 50.0, 42.0, 41.0, 28.0, 19.0, 17.0, 7.0, 14.0, 4.0, 2.0, 6.0, 1.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.203125, -25.279052734375, -24.35498046875, -23.430908203125, -22.5068359375, -21.582763671875, -20.65869140625, -19.734619140625, -18.810546875, -17.886474609375, -16.96240234375, -16.038330078125, -15.1142578125, -14.190185546875, -13.26611328125, -12.342041015625, -11.41796875, -10.493896484375, -9.56982421875, -8.645751953125, -7.7216796875, -6.797607421875, -5.87353515625, -4.949462890625, -4.025390625, -3.101318359375, -2.17724609375, -1.253173828125, -0.3291015625, 0.594970703125, 1.51904296875, 2.443115234375, 3.3671875, 4.291259765625, 5.21533203125, 6.139404296875, 7.0634765625, 7.987548828125, 8.91162109375, 9.835693359375, 10.759765625, 11.683837890625, 12.60791015625, 13.531982421875, 14.4560546875, 15.380126953125, 16.30419921875, 17.228271484375, 18.15234375, 19.076416015625, 20.00048828125, 20.924560546875, 21.8486328125, 22.772705078125, 23.69677734375, 24.620849609375, 25.544921875, 26.468994140625, 27.39306640625, 28.317138671875, 29.2412109375, 30.165283203125, 31.08935546875, 32.013427734375, 32.9375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 4.0, 8.0, 10.0, 13.0, 17.0, 34.0, 52.0, 69.0, 104.0, 163.0, 312.0, 728.0, 1908.0, 6032.0, 28176.0, 663859.0, 313606.0, 24712.0, 5477.0, 1721.0, 693.0, 315.0, 163.0, 106.0, 68.0, 42.0, 39.0, 23.0, 14.0, 10.0, 7.0, 10.0, 8.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-5.92578125, -5.75628662109375, -5.5867919921875, -5.41729736328125, -5.247802734375, -5.07830810546875, -4.9088134765625, -4.73931884765625, -4.56982421875, -4.40032958984375, -4.2308349609375, -4.06134033203125, -3.891845703125, -3.72235107421875, -3.5528564453125, -3.38336181640625, -3.2138671875, -3.04437255859375, -2.8748779296875, -2.70538330078125, -2.535888671875, -2.36639404296875, -2.1968994140625, -2.02740478515625, -1.85791015625, -1.68841552734375, -1.5189208984375, -1.34942626953125, -1.179931640625, -1.01043701171875, -0.8409423828125, -0.67144775390625, -0.501953125, -0.33245849609375, -0.1629638671875, 0.00653076171875, 0.176025390625, 0.34552001953125, 0.5150146484375, 0.68450927734375, 0.85400390625, 1.02349853515625, 1.1929931640625, 1.36248779296875, 1.531982421875, 1.70147705078125, 1.8709716796875, 2.04046630859375, 2.2099609375, 2.37945556640625, 2.5489501953125, 2.71844482421875, 2.887939453125, 3.05743408203125, 3.2269287109375, 3.39642333984375, 3.56591796875, 3.73541259765625, 3.9049072265625, 4.07440185546875, 4.243896484375, 4.41339111328125, 4.5828857421875, 4.75238037109375, 4.921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 4.0, 9.0, 19.0, 31.0, 42.0, 52.0, 106.0, 185.0, 200.0, 119.0, 65.0, 38.0, 28.0, 13.0, 9.0, 11.0, 4.0, 5.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013914108276367188, -0.0013463646173477173, -0.0013013184070587158, -0.0012562721967697144, -0.0012112259864807129, -0.0011661797761917114, -0.00112113356590271, -0.0010760873556137085, -0.001031041145324707, -0.0009859949350357056, -0.0009409487247467041, -0.0008959025144577026, -0.0008508563041687012, -0.0008058100938796997, -0.0007607638835906982, -0.0007157176733016968, -0.0006706714630126953, -0.0006256252527236938, -0.0005805790424346924, -0.0005355328321456909, -0.0004904866218566895, -0.000445440411567688, -0.0004003942012786865, -0.00035534799098968506, -0.0003103017807006836, -0.00026525557041168213, -0.00022020936012268066, -0.0001751631498336792, -0.00013011693954467773, -8.507072925567627e-05, -4.0024518966674805e-05, 5.02169132232666e-06, 5.0067901611328125e-05, 9.511411190032959e-05, 0.00014016032218933105, 0.00018520653247833252, 0.00023025274276733398, 0.00027529895305633545, 0.0003203451633453369, 0.0003653913736343384, 0.00041043758392333984, 0.0004554837942123413, 0.0005005300045013428, 0.0005455762147903442, 0.0005906224250793457, 0.0006356686353683472, 0.0006807148456573486, 0.0007257610559463501, 0.0007708072662353516, 0.000815853476524353, 0.0008608996868133545, 0.000905945897102356, 0.0009509921073913574, 0.0009960383176803589, 0.0010410845279693604, 0.0010861307382583618, 0.0011311769485473633, 0.0011762231588363647, 0.0012212693691253662, 0.0012663155794143677, 0.0013113617897033691, 0.0013564079999923706, 0.001401454210281372, 0.0014465004205703735, 0.001491546630859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 13.0, 10.0, 15.0, 14.0, 46.0, 48.0, 80.0, 134.0, 214.0, 436.0, 905.0, 2108.0, 5778.0, 20230.0, 118307.0, 786926.0, 87850.0, 16658.0, 5002.0, 1923.0, 818.0, 429.0, 244.0, 127.0, 76.0, 57.0, 33.0, 18.0, 13.0, 10.0, 7.0, 7.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.974853515625, -3.84423828125, -3.713623046875, -3.5830078125, -3.452392578125, -3.32177734375, -3.191162109375, -3.060546875, -2.929931640625, -2.79931640625, -2.668701171875, -2.5380859375, -2.407470703125, -2.27685546875, -2.146240234375, -2.015625, -1.885009765625, -1.75439453125, -1.623779296875, -1.4931640625, -1.362548828125, -1.23193359375, -1.101318359375, -0.970703125, -0.840087890625, -0.70947265625, -0.578857421875, -0.4482421875, -0.317626953125, -0.18701171875, -0.056396484375, 0.07421875, 0.204833984375, 0.33544921875, 0.466064453125, 0.5966796875, 0.727294921875, 0.85791015625, 0.988525390625, 1.119140625, 1.249755859375, 1.38037109375, 1.510986328125, 1.6416015625, 1.772216796875, 1.90283203125, 2.033447265625, 2.1640625, 2.294677734375, 2.42529296875, 2.555908203125, 2.6865234375, 2.817138671875, 2.94775390625, 3.078369140625, 3.208984375, 3.339599609375, 3.47021484375, 3.600830078125, 3.7314453125, 3.862060546875, 3.99267578125, 4.123291015625, 4.25390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 10.0, 8.0, 19.0, 12.0, 28.0, 40.0, 43.0, 48.0, 73.0, 104.0, 98.0, 104.0, 92.0, 69.0, 56.0, 45.0, 44.0, 18.0, 15.0, 8.0, 11.0, 6.0, 8.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.0234375, -3.91168212890625, -3.7999267578125, -3.68817138671875, -3.576416015625, -3.46466064453125, -3.3529052734375, -3.24114990234375, -3.12939453125, -3.01763916015625, -2.9058837890625, -2.79412841796875, -2.682373046875, -2.57061767578125, -2.4588623046875, -2.34710693359375, -2.2353515625, -2.12359619140625, -2.0118408203125, -1.90008544921875, -1.788330078125, -1.67657470703125, -1.5648193359375, -1.45306396484375, -1.34130859375, -1.22955322265625, -1.1177978515625, -1.00604248046875, -0.894287109375, -0.78253173828125, -0.6707763671875, -0.55902099609375, -0.447265625, -0.33551025390625, -0.2237548828125, -0.11199951171875, -0.000244140625, 0.11151123046875, 0.2232666015625, 0.33502197265625, 0.44677734375, 0.55853271484375, 0.6702880859375, 0.78204345703125, 0.893798828125, 1.00555419921875, 1.1173095703125, 1.22906494140625, 1.3408203125, 1.45257568359375, 1.5643310546875, 1.67608642578125, 1.787841796875, 1.89959716796875, 2.0113525390625, 2.12310791015625, 2.23486328125, 2.34661865234375, 2.4583740234375, 2.57012939453125, 2.681884765625, 2.79364013671875, 2.9053955078125, 3.01715087890625, 3.12890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 11.0, 2.0, 16.0, 106.0, 574.0, 239.0, 44.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-302.7991027832031, -294.3559875488281, -285.9128723144531, -277.4697570800781, -269.0266418457031, -260.5835266113281, -252.1404266357422, -243.6973114013672, -235.2541961669922, -226.8110809326172, -218.3679656982422, -209.9248504638672, -201.48175048828125, -193.03863525390625, -184.59552001953125, -176.15240478515625, -167.70928955078125, -159.26617431640625, -150.82305908203125, -142.37994384765625, -133.93682861328125, -125.49372100830078, -117.05061340332031, -108.60749816894531, -100.16438293457031, -91.72126770019531, -83.27815246582031, -74.83504486083984, -66.39192962646484, -57.948814392089844, -49.50570297241211, -41.062591552734375, -32.61944580078125, -24.176332473754883, -15.733219146728516, -7.290105819702148, 1.1530075073242188, 9.596122741699219, 18.039234161376953, 26.482345581054688, 34.92546081542969, 43.36857604980469, 51.81168746948242, 60.254798889160156, 68.69791412353516, 77.14102935791016, 85.58413696289062, 94.02725219726562, 102.47036743164062, 110.91348266601562, 119.35659790039062, 127.7997055053711, 136.24282836914062, 144.68594360351562, 153.12904357910156, 161.57215881347656, 170.01527404785156, 178.45838928222656, 186.90150451660156, 195.34461975097656, 203.7877197265625, 212.2308349609375, 220.6739501953125, 229.1170654296875, 237.5601806640625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 11.0, 13.0, 11.0, 17.0, 20.0, 27.0, 36.0, 32.0, 33.0, 38.0, 39.0, 66.0, 137.0, 163.0, 52.0, 41.0, 35.0, 44.0, 30.0, 17.0, 27.0, 24.0, 15.0, 13.0, 11.0, 9.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-124.73792266845703, -121.45777130126953, -118.17762756347656, -114.89747619628906, -111.61732482910156, -108.3371810913086, -105.0570297241211, -101.77688598632812, -98.49673461914062, -95.21658325195312, -91.93643951416016, -88.65628814697266, -85.37614440917969, -82.09599304199219, -78.81584167480469, -75.53569030761719, -72.25554656982422, -68.97539520263672, -65.69525146484375, -62.41510009765625, -59.134952545166016, -55.85480499267578, -52.57465362548828, -49.29450607299805, -46.01435852050781, -42.73421096801758, -39.454063415527344, -36.173912048339844, -32.89376449584961, -29.613616943359375, -26.333467483520508, -23.05331802368164, -19.773178100585938, -16.493030548095703, -13.212881088256836, -9.932732582092285, -6.652584075927734, -3.3724365234375, -0.09228706359863281, 3.1878623962402344, 6.468009948730469, 9.74815845489502, 13.02830696105957, 16.308456420898438, 19.588603973388672, 22.868751525878906, 26.148900985717773, 29.42905044555664, 32.709197998046875, 35.98934555053711, 39.269493103027344, 42.549644470214844, 45.82979202270508, 49.10993957519531, 52.39009094238281, 55.67023849487305, 58.95038604736328, 62.230533599853516, 65.51068115234375, 68.79083251953125, 72.07098388671875, 75.35112762451172, 78.63127899169922, 81.91142272949219, 85.19157409667969]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 9.0, 5.0, 10.0, 18.0, 23.0, 38.0, 47.0, 120.0, 163.0, 271.0, 446.0, 747.0, 1442.0, 2485.0, 5001.0, 10932.0, 29954.0, 128923.0, 762794.0, 2142285.0, 893663.0, 156047.0, 35133.0, 12134.0, 5433.0, 2708.0, 1416.0, 820.0, 461.0, 241.0, 160.0, 102.0, 67.0, 62.0, 29.0, 19.0, 20.0, 14.0, 11.0, 2.0, 6.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.9375, -8.671142578125, -8.40478515625, -8.138427734375, -7.8720703125, -7.605712890625, -7.33935546875, -7.072998046875, -6.806640625, -6.540283203125, -6.27392578125, -6.007568359375, -5.7412109375, -5.474853515625, -5.20849609375, -4.942138671875, -4.67578125, -4.409423828125, -4.14306640625, -3.876708984375, -3.6103515625, -3.343994140625, -3.07763671875, -2.811279296875, -2.544921875, -2.278564453125, -2.01220703125, -1.745849609375, -1.4794921875, -1.213134765625, -0.94677734375, -0.680419921875, -0.4140625, -0.147705078125, 0.11865234375, 0.385009765625, 0.6513671875, 0.917724609375, 1.18408203125, 1.450439453125, 1.716796875, 1.983154296875, 2.24951171875, 2.515869140625, 2.7822265625, 3.048583984375, 3.31494140625, 3.581298828125, 3.84765625, 4.114013671875, 4.38037109375, 4.646728515625, 4.9130859375, 5.179443359375, 5.44580078125, 5.712158203125, 5.978515625, 6.244873046875, 6.51123046875, 6.777587890625, 7.0439453125, 7.310302734375, 7.57666015625, 7.843017578125, 8.109375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 6.0, 9.0, 16.0, 22.0, 15.0, 27.0, 49.0, 45.0, 38.0, 48.0, 69.0, 61.0, 59.0, 57.0, 56.0, 48.0, 49.0, 53.0, 42.0, 31.0, 40.0, 25.0, 24.0, 21.0, 19.0, 16.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19140625, -5.01495361328125, -4.8385009765625, -4.66204833984375, -4.485595703125, -4.30914306640625, -4.1326904296875, -3.95623779296875, -3.77978515625, -3.60333251953125, -3.4268798828125, -3.25042724609375, -3.073974609375, -2.89752197265625, -2.7210693359375, -2.54461669921875, -2.3681640625, -2.19171142578125, -2.0152587890625, -1.83880615234375, -1.662353515625, -1.48590087890625, -1.3094482421875, -1.13299560546875, -0.95654296875, -0.78009033203125, -0.6036376953125, -0.42718505859375, -0.250732421875, -0.07427978515625, 0.1021728515625, 0.27862548828125, 0.455078125, 0.63153076171875, 0.8079833984375, 0.98443603515625, 1.160888671875, 1.33734130859375, 1.5137939453125, 1.69024658203125, 1.86669921875, 2.04315185546875, 2.2196044921875, 2.39605712890625, 2.572509765625, 2.74896240234375, 2.9254150390625, 3.10186767578125, 3.2783203125, 3.45477294921875, 3.6312255859375, 3.80767822265625, 3.984130859375, 4.16058349609375, 4.3370361328125, 4.51348876953125, 4.68994140625, 4.86639404296875, 5.0428466796875, 5.21929931640625, 5.395751953125, 5.57220458984375, 5.7486572265625, 5.92510986328125, 6.1015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 6.0, 19.0, 43.0, 52.0, 81.0, 147.0, 341.0, 634.0, 1651.0, 6407.0, 176527.0, 3978184.0, 24948.0, 3191.0, 1038.0, 451.0, 236.0, 125.0, 66.0, 35.0, 29.0, 14.0, 16.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.80078125, -33.5703125, -32.33984375, -31.109375, -29.87890625, -28.6484375, -27.41796875, -26.1875, -24.95703125, -23.7265625, -22.49609375, -21.265625, -20.03515625, -18.8046875, -17.57421875, -16.34375, -15.11328125, -13.8828125, -12.65234375, -11.421875, -10.19140625, -8.9609375, -7.73046875, -6.5, -5.26953125, -4.0390625, -2.80859375, -1.578125, -0.34765625, 0.8828125, 2.11328125, 3.34375, 4.57421875, 5.8046875, 7.03515625, 8.265625, 9.49609375, 10.7265625, 11.95703125, 13.1875, 14.41796875, 15.6484375, 16.87890625, 18.109375, 19.33984375, 20.5703125, 21.80078125, 23.03125, 24.26171875, 25.4921875, 26.72265625, 27.953125, 29.18359375, 30.4140625, 31.64453125, 32.875, 34.10546875, 35.3359375, 36.56640625, 37.796875, 39.02734375, 40.2578125, 41.48828125, 42.71875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 11.0, 27.0, 26.0, 42.0, 77.0, 109.0, 180.0, 283.0, 423.0, 595.0, 667.0, 563.0, 351.0, 256.0, 132.0, 110.0, 72.0, 37.0, 32.0, 20.0, 10.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-24.40625, -23.7877197265625, -23.169189453125, -22.5506591796875, -21.93212890625, -21.3135986328125, -20.695068359375, -20.0765380859375, -19.4580078125, -18.8394775390625, -18.220947265625, -17.6024169921875, -16.98388671875, -16.3653564453125, -15.746826171875, -15.1282958984375, -14.509765625, -13.8912353515625, -13.272705078125, -12.6541748046875, -12.03564453125, -11.4171142578125, -10.798583984375, -10.1800537109375, -9.5615234375, -8.9429931640625, -8.324462890625, -7.7059326171875, -7.08740234375, -6.4688720703125, -5.850341796875, -5.2318115234375, -4.61328125, -3.9947509765625, -3.376220703125, -2.7576904296875, -2.13916015625, -1.5206298828125, -0.902099609375, -0.2835693359375, 0.3349609375, 0.9534912109375, 1.572021484375, 2.1905517578125, 2.80908203125, 3.4276123046875, 4.046142578125, 4.6646728515625, 5.283203125, 5.9017333984375, 6.520263671875, 7.1387939453125, 7.75732421875, 8.3758544921875, 8.994384765625, 9.6129150390625, 10.2314453125, 10.8499755859375, 11.468505859375, 12.0870361328125, 12.70556640625, 13.3240966796875, 13.942626953125, 14.5611572265625, 15.1796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 10.0, 7.0, 14.0, 18.0, 32.0, 68.0, 115.0, 174.0, 205.0, 139.0, 96.0, 49.0, 22.0, 11.0, 7.0, 8.0, 3.0, 1.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-186.98609924316406, -180.78042602539062, -174.5747528076172, -168.36907958984375, -162.16342163085938, -155.95774841308594, -149.7520751953125, -143.54640197753906, -137.34072875976562, -131.1350555419922, -124.92938232421875, -118.72371673583984, -112.5180435180664, -106.31237030029297, -100.10670471191406, -93.90103149414062, -87.69535827636719, -81.48968505859375, -75.28401184082031, -69.0783462524414, -62.87267303466797, -56.66699981689453, -50.46133041381836, -44.25566101074219, -38.04998779296875, -31.844316482543945, -25.63864517211914, -19.432973861694336, -13.227302551269531, -7.021631240844727, -0.8159599304199219, 5.38970947265625, 11.59539794921875, 17.801069259643555, 24.00674057006836, 30.212411880493164, 36.41808319091797, 42.623756408691406, 48.82942581176758, 55.03509521484375, 61.24076843261719, 67.44644165039062, 73.65211486816406, 79.85778045654297, 86.0634536743164, 92.26912689208984, 98.47479248046875, 104.68046569824219, 110.88613891601562, 117.09181213378906, 123.2974853515625, 129.50315856933594, 135.70883178710938, 141.91448974609375, 148.1201629638672, 154.32583618164062, 160.53150939941406, 166.7371826171875, 172.94285583496094, 179.14852905273438, 185.35418701171875, 191.5598602294922, 197.76553344726562, 203.97120666503906, 210.1768798828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 16.0, 21.0, 30.0, 39.0, 50.0, 50.0, 84.0, 80.0, 88.0, 115.0, 84.0, 67.0, 62.0, 64.0, 45.0, 30.0, 15.0, 17.0, 14.0, 6.0, 10.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0], "bins": [-221.938720703125, -216.66555786132812, -211.39239501953125, -206.11923217773438, -200.8460693359375, -195.57290649414062, -190.29974365234375, -185.02659606933594, -179.75343322753906, -174.4802703857422, -169.2071075439453, -163.93394470214844, -158.66078186035156, -153.38763427734375, -148.11447143554688, -142.84130859375, -137.56814575195312, -132.29498291015625, -127.02182006835938, -121.7486572265625, -116.47550201416016, -111.20233917236328, -105.9291763305664, -100.65602111816406, -95.38284301757812, -90.10968017578125, -84.83651733398438, -79.5633544921875, -74.29019927978516, -69.01703643798828, -63.743873596191406, -58.4707145690918, -53.19755554199219, -47.92439270019531, -42.6512336730957, -37.37807083129883, -32.10491180419922, -26.831748962402344, -21.55858612060547, -16.28542709350586, -11.012264251708984, -5.739102840423584, -0.4659414291381836, 4.807220458984375, 10.080381393432617, 15.35354232788086, 20.626705169677734, 25.899864196777344, 31.17302703857422, 36.446189880371094, 41.7193489074707, 46.99251174926758, 52.26567077636719, 57.53883361816406, 62.81199645996094, 68.08515930175781, 73.35832214355469, 78.63148498535156, 83.90464782714844, 89.17781066894531, 94.45096588134766, 99.72412872314453, 104.9972915649414, 110.27044677734375, 115.54360961914062]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 8.0, 21.0, 22.0, 40.0, 69.0, 177.0, 417.0, 950.0, 3220.0, 14263.0, 141692.0, 817576.0, 58386.0, 8299.0, 2081.0, 728.0, 326.0, 144.0, 62.0, 30.0, 17.0, 7.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.9375, -16.4442138671875, -15.950927734375, -15.4576416015625, -14.96435546875, -14.4710693359375, -13.977783203125, -13.4844970703125, -12.9912109375, -12.4979248046875, -12.004638671875, -11.5113525390625, -11.01806640625, -10.5247802734375, -10.031494140625, -9.5382080078125, -9.044921875, -8.5516357421875, -8.058349609375, -7.5650634765625, -7.07177734375, -6.5784912109375, -6.085205078125, -5.5919189453125, -5.0986328125, -4.6053466796875, -4.112060546875, -3.6187744140625, -3.12548828125, -2.6322021484375, -2.138916015625, -1.6456298828125, -1.15234375, -0.6590576171875, -0.165771484375, 0.3275146484375, 0.82080078125, 1.3140869140625, 1.807373046875, 2.3006591796875, 2.7939453125, 3.2872314453125, 3.780517578125, 4.2738037109375, 4.76708984375, 5.2603759765625, 5.753662109375, 6.2469482421875, 6.740234375, 7.2335205078125, 7.726806640625, 8.2200927734375, 8.71337890625, 9.2066650390625, 9.699951171875, 10.1932373046875, 10.6865234375, 11.1798095703125, 11.673095703125, 12.1663818359375, 12.65966796875, 13.1529541015625, 13.646240234375, 14.1395263671875, 14.6328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 13.0, 22.0, 36.0, 26.0, 51.0, 78.0, 74.0, 99.0, 84.0, 92.0, 93.0, 88.0, 76.0, 48.0, 39.0, 25.0, 20.0, 7.0, 12.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.421875, -16.038818359375, -15.65576171875, -15.272705078125, -14.8896484375, -14.506591796875, -14.12353515625, -13.740478515625, -13.357421875, -12.974365234375, -12.59130859375, -12.208251953125, -11.8251953125, -11.442138671875, -11.05908203125, -10.676025390625, -10.29296875, -9.909912109375, -9.52685546875, -9.143798828125, -8.7607421875, -8.377685546875, -7.99462890625, -7.611572265625, -7.228515625, -6.845458984375, -6.46240234375, -6.079345703125, -5.6962890625, -5.313232421875, -4.93017578125, -4.547119140625, -4.1640625, -3.781005859375, -3.39794921875, -3.014892578125, -2.6318359375, -2.248779296875, -1.86572265625, -1.482666015625, -1.099609375, -0.716552734375, -0.33349609375, 0.049560546875, 0.4326171875, 0.815673828125, 1.19873046875, 1.581787109375, 1.96484375, 2.347900390625, 2.73095703125, 3.114013671875, 3.4970703125, 3.880126953125, 4.26318359375, 4.646240234375, 5.029296875, 5.412353515625, 5.79541015625, 6.178466796875, 6.5615234375, 6.944580078125, 7.32763671875, 7.710693359375, 8.09375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 8.0, 11.0, 8.0, 13.0, 18.0, 33.0, 30.0, 45.0, 60.0, 69.0, 79.0, 117.0, 194.0, 331.0, 587.0, 1346.0, 4201.0, 23196.0, 750687.0, 242807.0, 18359.0, 3617.0, 1155.0, 531.0, 339.0, 217.0, 112.0, 93.0, 64.0, 52.0, 39.0, 34.0, 17.0, 11.0, 18.0, 7.0, 8.0, 7.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.5390625, -11.1661376953125, -10.793212890625, -10.4202880859375, -10.04736328125, -9.6744384765625, -9.301513671875, -8.9285888671875, -8.5556640625, -8.1827392578125, -7.809814453125, -7.4368896484375, -7.06396484375, -6.6910400390625, -6.318115234375, -5.9451904296875, -5.572265625, -5.1993408203125, -4.826416015625, -4.4534912109375, -4.08056640625, -3.7076416015625, -3.334716796875, -2.9617919921875, -2.5888671875, -2.2159423828125, -1.843017578125, -1.4700927734375, -1.09716796875, -0.7242431640625, -0.351318359375, 0.0216064453125, 0.39453125, 0.7674560546875, 1.140380859375, 1.5133056640625, 1.88623046875, 2.2591552734375, 2.632080078125, 3.0050048828125, 3.3779296875, 3.7508544921875, 4.123779296875, 4.4967041015625, 4.86962890625, 5.2425537109375, 5.615478515625, 5.9884033203125, 6.361328125, 6.7342529296875, 7.107177734375, 7.4801025390625, 7.85302734375, 8.2259521484375, 8.598876953125, 8.9718017578125, 9.3447265625, 9.7176513671875, 10.090576171875, 10.4635009765625, 10.83642578125, 11.2093505859375, 11.582275390625, 11.9552001953125, 12.328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 3.0, 8.0, 10.0, 15.0, 15.0, 26.0, 35.0, 36.0, 39.0, 41.0, 58.0, 67.0, 96.0, 103.0, 94.0, 65.0, 49.0, 36.0, 40.0, 23.0, 32.0, 21.0, 22.0, 13.0, 9.0, 6.0, 9.0, 7.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.96875, -25.982421875, -24.99609375, -24.009765625, -23.0234375, -22.037109375, -21.05078125, -20.064453125, -19.078125, -18.091796875, -17.10546875, -16.119140625, -15.1328125, -14.146484375, -13.16015625, -12.173828125, -11.1875, -10.201171875, -9.21484375, -8.228515625, -7.2421875, -6.255859375, -5.26953125, -4.283203125, -3.296875, -2.310546875, -1.32421875, -0.337890625, 0.6484375, 1.634765625, 2.62109375, 3.607421875, 4.59375, 5.580078125, 6.56640625, 7.552734375, 8.5390625, 9.525390625, 10.51171875, 11.498046875, 12.484375, 13.470703125, 14.45703125, 15.443359375, 16.4296875, 17.416015625, 18.40234375, 19.388671875, 20.375, 21.361328125, 22.34765625, 23.333984375, 24.3203125, 25.306640625, 26.29296875, 27.279296875, 28.265625, 29.251953125, 30.23828125, 31.224609375, 32.2109375, 33.197265625, 34.18359375, 35.169921875, 36.15625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 11.0, 11.0, 10.0, 16.0, 34.0, 46.0, 62.0, 97.0, 184.0, 352.0, 886.0, 2435.0, 8173.0, 47788.0, 881462.0, 89132.0, 12317.0, 3272.0, 1177.0, 445.0, 257.0, 146.0, 71.0, 47.0, 36.0, 21.0, 23.0, 13.0, 10.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9384765625, -1.8751983642578125, -1.811920166015625, -1.7486419677734375, -1.68536376953125, -1.6220855712890625, -1.558807373046875, -1.4955291748046875, -1.4322509765625, -1.3689727783203125, -1.305694580078125, -1.2424163818359375, -1.17913818359375, -1.1158599853515625, -1.052581787109375, -0.9893035888671875, -0.926025390625, -0.8627471923828125, -0.799468994140625, -0.7361907958984375, -0.67291259765625, -0.6096343994140625, -0.546356201171875, -0.4830780029296875, -0.4197998046875, -0.3565216064453125, -0.293243408203125, -0.2299652099609375, -0.16668701171875, -0.1034088134765625, -0.040130615234375, 0.0231475830078125, 0.08642578125, 0.1497039794921875, 0.212982177734375, 0.2762603759765625, 0.33953857421875, 0.4028167724609375, 0.466094970703125, 0.5293731689453125, 0.5926513671875, 0.6559295654296875, 0.719207763671875, 0.7824859619140625, 0.84576416015625, 0.9090423583984375, 0.972320556640625, 1.0355987548828125, 1.098876953125, 1.1621551513671875, 1.225433349609375, 1.2887115478515625, 1.35198974609375, 1.4152679443359375, 1.478546142578125, 1.5418243408203125, 1.6051025390625, 1.6683807373046875, 1.731658935546875, 1.7949371337890625, 1.85821533203125, 1.9214935302734375, 1.984771728515625, 2.0480499267578125, 2.111328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 3.0, 14.0, 12.0, 21.0, 10.0, 29.0, 43.0, 54.0, 89.0, 114.0, 118.0, 125.0, 123.0, 58.0, 44.0, 39.0, 25.0, 15.0, 12.0, 6.0, 17.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0006594657897949219, -0.0006439685821533203, -0.0006284713745117188, -0.0006129741668701172, -0.0005974769592285156, -0.0005819797515869141, -0.0005664825439453125, -0.0005509853363037109, -0.0005354881286621094, -0.0005199909210205078, -0.0005044937133789062, -0.0004889965057373047, -0.0004734992980957031, -0.00045800209045410156, -0.0004425048828125, -0.00042700767517089844, -0.0004115104675292969, -0.0003960132598876953, -0.00038051605224609375, -0.0003650188446044922, -0.0003495216369628906, -0.00033402442932128906, -0.0003185272216796875, -0.00030303001403808594, -0.0002875328063964844, -0.0002720355987548828, -0.00025653839111328125, -0.0002410411834716797, -0.00022554397583007812, -0.00021004676818847656, -0.000194549560546875, -0.00017905235290527344, -0.00016355514526367188, -0.0001480579376220703, -0.00013256072998046875, -0.00011706352233886719, -0.00010156631469726562, -8.606910705566406e-05, -7.05718994140625e-05, -5.507469177246094e-05, -3.9577484130859375e-05, -2.4080276489257812e-05, -8.58306884765625e-06, 6.9141387939453125e-06, 2.2411346435546875e-05, 3.790855407714844e-05, 5.340576171875e-05, 6.890296936035156e-05, 8.440017700195312e-05, 9.989738464355469e-05, 0.00011539459228515625, 0.0001308917999267578, 0.00014638900756835938, 0.00016188621520996094, 0.0001773834228515625, 0.00019288063049316406, 0.00020837783813476562, 0.0002238750457763672, 0.00023937225341796875, 0.0002548694610595703, 0.0002703666687011719, 0.00028586387634277344, 0.000301361083984375, 0.00031685829162597656, 0.0003323554992675781]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 14.0, 16.0, 31.0, 51.0, 108.0, 230.0, 465.0, 1224.0, 3726.0, 14086.0, 86521.0, 867069.0, 59035.0, 11073.0, 3034.0, 1039.0, 429.0, 175.0, 101.0, 36.0, 28.0, 12.0, 10.0, 6.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.397064208984375, -2.33123779296875, -2.265411376953125, -2.1995849609375, -2.133758544921875, -2.06793212890625, -2.002105712890625, -1.936279296875, -1.870452880859375, -1.80462646484375, -1.738800048828125, -1.6729736328125, -1.607147216796875, -1.54132080078125, -1.475494384765625, -1.40966796875, -1.343841552734375, -1.27801513671875, -1.212188720703125, -1.1463623046875, -1.080535888671875, -1.01470947265625, -0.948883056640625, -0.883056640625, -0.817230224609375, -0.75140380859375, -0.685577392578125, -0.6197509765625, -0.553924560546875, -0.48809814453125, -0.422271728515625, -0.3564453125, -0.290618896484375, -0.22479248046875, -0.158966064453125, -0.0931396484375, -0.027313232421875, 0.03851318359375, 0.104339599609375, 0.170166015625, 0.235992431640625, 0.30181884765625, 0.367645263671875, 0.4334716796875, 0.499298095703125, 0.56512451171875, 0.630950927734375, 0.69677734375, 0.762603759765625, 0.82843017578125, 0.894256591796875, 0.9600830078125, 1.025909423828125, 1.09173583984375, 1.157562255859375, 1.223388671875, 1.289215087890625, 1.35504150390625, 1.420867919921875, 1.4866943359375, 1.552520751953125, 1.61834716796875, 1.684173583984375, 1.75]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 10.0, 5.0, 7.0, 10.0, 8.0, 11.0, 15.0, 18.0, 23.0, 23.0, 39.0, 59.0, 54.0, 61.0, 80.0, 90.0, 66.0, 65.0, 66.0, 59.0, 50.0, 37.0, 19.0, 26.0, 17.0, 12.0, 16.0, 9.0, 11.0, 6.0, 3.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.4163665771484375, -1.368865966796875, -1.3213653564453125, -1.27386474609375, -1.2263641357421875, -1.178863525390625, -1.1313629150390625, -1.0838623046875, -1.0363616943359375, -0.988861083984375, -0.9413604736328125, -0.89385986328125, -0.8463592529296875, -0.798858642578125, -0.7513580322265625, -0.703857421875, -0.6563568115234375, -0.608856201171875, -0.5613555908203125, -0.51385498046875, -0.4663543701171875, -0.418853759765625, -0.3713531494140625, -0.3238525390625, -0.2763519287109375, -0.228851318359375, -0.1813507080078125, -0.13385009765625, -0.0863494873046875, -0.038848876953125, 0.0086517333984375, 0.05615234375, 0.1036529541015625, 0.151153564453125, 0.1986541748046875, 0.24615478515625, 0.2936553955078125, 0.341156005859375, 0.3886566162109375, 0.4361572265625, 0.4836578369140625, 0.531158447265625, 0.5786590576171875, 0.62615966796875, 0.6736602783203125, 0.721160888671875, 0.7686614990234375, 0.816162109375, 0.8636627197265625, 0.911163330078125, 0.9586639404296875, 1.00616455078125, 1.0536651611328125, 1.101165771484375, 1.1486663818359375, 1.1961669921875, 1.2436676025390625, 1.291168212890625, 1.3386688232421875, 1.38616943359375, 1.4336700439453125, 1.481170654296875, 1.5286712646484375, 1.576171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 12.0, 19.0, 13.0, 42.0, 105.0, 516.0, 162.0, 65.0, 29.0, 22.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.85951232910156, -161.33152770996094, -157.8035430908203, -154.2755584716797, -150.74758911132812, -147.2196044921875, -143.69161987304688, -140.16363525390625, -136.63565063476562, -133.107666015625, -129.57968139648438, -126.05170440673828, -122.52371978759766, -118.99573516845703, -115.46775817871094, -111.93977355957031, -108.41178894042969, -104.88380432128906, -101.35581970214844, -97.82784271240234, -94.29985809326172, -90.7718734741211, -87.243896484375, -83.71591186523438, -80.18792724609375, -76.65994262695312, -73.1319580078125, -69.6039810180664, -66.07599639892578, -62.548011779785156, -59.0200309753418, -55.49205017089844, -51.964073181152344, -48.43608856201172, -44.90810775756836, -41.380126953125, -37.852142333984375, -34.32415771484375, -30.79617691040039, -27.2681941986084, -23.740211486816406, -20.212228775024414, -16.684246063232422, -13.15626335144043, -9.628280639648438, -6.100297927856445, -2.572315216064453, 0.9556674957275391, 4.483650207519531, 8.011632919311523, 11.539615631103516, 15.067598342895508, 18.5955810546875, 22.123563766479492, 25.651546478271484, 29.179529190063477, 32.70751190185547, 36.235496520996094, 39.76347732543945, 43.29145812988281, 46.81944274902344, 50.34742736816406, 53.87540817260742, 57.40338897705078, 60.931373596191406]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 7.0, 7.0, 7.0, 10.0, 13.0, 15.0, 15.0, 18.0, 15.0, 21.0, 17.0, 24.0, 28.0, 46.0, 157.0, 299.0, 68.0, 34.0, 21.0, 18.0, 20.0, 20.0, 25.0, 10.0, 12.0, 13.0, 7.0, 5.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.678955078125, -66.32838439941406, -63.977813720703125, -61.62724304199219, -59.27667236328125, -56.92610168457031, -54.57553482055664, -52.2249641418457, -49.874393463134766, -47.52382278442383, -45.17325210571289, -42.82268142700195, -40.47211456298828, -38.121543884277344, -35.770973205566406, -33.42040252685547, -31.06983184814453, -28.719261169433594, -26.368690490722656, -24.01812171936035, -21.667551040649414, -19.316980361938477, -16.966411590576172, -14.615840911865234, -12.265270233154297, -9.91469955444336, -7.564129829406738, -5.213559627532959, -2.8629894256591797, -0.5124187469482422, 1.838150978088379, 4.188720703125, 6.5392913818359375, 8.889862060546875, 11.240431785583496, 13.591001510620117, 15.941572189331055, 18.292142868041992, 20.642711639404297, 22.993282318115234, 25.343852996826172, 27.69442367553711, 30.044994354248047, 32.395565032958984, 34.746131896972656, 37.096702575683594, 39.44727325439453, 41.79784393310547, 44.148414611816406, 46.498985290527344, 48.84955596923828, 51.20012664794922, 53.550697326660156, 55.901268005371094, 58.251834869384766, 60.6024055480957, 62.95297622680664, 65.30354309082031, 67.65411376953125, 70.00468444824219, 72.35525512695312, 74.70582580566406, 77.056396484375, 79.40696716308594, 81.75753784179688]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 11.0, 8.0, 9.0, 12.0, 7.0, 9.0, 12.0, 35.0, 23.0, 24.0, 35.0, 40.0, 42.0, 75.0, 230.0, 133.0, 47.0, 43.0, 34.0, 39.0, 25.0, 16.0, 19.0, 16.0, 19.0, 12.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.796875, -8.5697021484375, -8.342529296875, -8.1153564453125, -7.88818359375, -7.6610107421875, -7.433837890625, -7.2066650390625, -6.9794921875, -6.7523193359375, -6.525146484375, -6.2979736328125, -6.07080078125, -5.8436279296875, -5.616455078125, -5.3892822265625, -5.162109375, -4.9349365234375, -4.707763671875, -4.4805908203125, -4.25341796875, -4.0262451171875, -3.799072265625, -3.5718994140625, -3.3447265625, -3.1175537109375, -2.890380859375, -2.6632080078125, -2.43603515625, -2.2088623046875, -1.981689453125, -1.7545166015625, -1.52734375, -1.3001708984375, -1.072998046875, -0.8458251953125, -0.61865234375, -0.3914794921875, -0.164306640625, 0.0628662109375, 0.2900390625, 0.5172119140625, 0.744384765625, 0.9715576171875, 1.19873046875, 1.4259033203125, 1.653076171875, 1.8802490234375, 2.107421875, 2.3345947265625, 2.561767578125, 2.7889404296875, 3.01611328125, 3.2432861328125, 3.470458984375, 3.6976318359375, 3.9248046875, 4.1519775390625, 4.379150390625, 4.6063232421875, 4.83349609375, 5.0606689453125, 5.287841796875, 5.5150146484375, 5.7421875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 9.0, 15.0, 21.0, 4.0, 5.0, 9.0, 22.0, 55.0, 78.0, 163.0, 355.0, 1255.0, 7532.0, 8351625.0, 24079.0, 2344.0, 500.0, 240.0, 106.0, 44.0, 46.0, 21.0, 12.0, 10.0, 12.0, 3.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.75170135498047, -49.36695098876953, -46.98219680786133, -44.597442626953125, -42.21269226074219, -39.82794189453125, -37.44318771362305, -35.058433532714844, -32.673683166503906, -30.288930892944336, -27.904178619384766, -25.519426345825195, -23.134674072265625, -20.749921798706055, -18.365169525146484, -15.980417251586914, -13.595664978027344, -11.210912704467773, -8.826160430908203, -6.441408157348633, -4.0566558837890625, -1.6719036102294922, 0.7128486633300781, 3.0976009368896484, 5.482353210449219, 7.867105484008789, 10.25185775756836, 12.63661003112793, 15.0213623046875, 17.40611457824707, 19.79086685180664, 22.17561912536621, 24.560379028320312, 26.945131301879883, 29.329883575439453, 31.714635848999023, 34.099388122558594, 36.48413848876953, 38.868892669677734, 41.25364685058594, 43.638397216796875, 46.02314758300781, 48.407901763916016, 50.79265594482422, 53.177406311035156, 55.562156677246094, 57.9469108581543, 60.3316650390625, 62.71641540527344, 65.10116577148438, 67.48591613769531, 69.87067413330078, 72.25542449951172, 74.64017486572266, 77.02493286132812, 79.40968322753906, 81.79443359375, 84.17918395996094, 86.56393432617188, 88.94869232177734, 91.33344268798828, 93.71819305419922, 96.10295104980469, 98.48770141601562, 100.87245178222656]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 7.0, 7.0, 3.0, 1.0, 2.0, 8.0, 1.0, 8.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-177.3442840576172, -173.36721801757812, -169.39015197753906, -165.4130859375, -161.43603515625, -157.45896911621094, -153.48190307617188, -149.5048370361328, -145.52777099609375, -141.5507049560547, -137.57363891601562, -133.59658813476562, -129.61952209472656, -125.6424560546875, -121.66539001464844, -117.68832397460938, -113.71126556396484, -109.73419952392578, -105.75714111328125, -101.78007507324219, -97.80300903320312, -93.82594299316406, -89.84888458251953, -85.87181854248047, -81.89476013183594, -77.91769409179688, -73.94063568115234, -69.96356964111328, -65.98650360107422, -62.00944137573242, -58.032379150390625, -54.05531311035156, -50.0782470703125, -46.1011848449707, -42.12411880493164, -38.147056579589844, -34.16999053955078, -30.192928314208984, -26.215866088867188, -22.238801956176758, -18.261737823486328, -14.284673690795898, -10.307610511779785, -6.330547332763672, -2.353483200073242, 1.6235809326171875, 5.600643157958984, 9.577707290649414, 13.554771423339844, 17.531835556030273, 21.508899688720703, 25.4859619140625, 29.46302604675293, 33.44009017944336, 37.417152404785156, 41.39421844482422, 45.371280670166016, 49.34834289550781, 53.325408935546875, 57.30247116088867, 61.27953338623047, 65.25659942626953, 69.23365783691406, 73.21072387695312, 77.18778991699219]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 11.0, 24.0, 31.0, 37.0, 55.0, 73.0, 84.0, 86.0, 109.0, 88.0, 85.0, 74.0, 61.0, 47.0, 32.0, 37.0, 21.0, 13.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.685302734375, -4.54638671875, -4.407470703125, -4.2685546875, -4.129638671875, -3.99072265625, -3.851806640625, -3.712890625, -3.573974609375, -3.43505859375, -3.296142578125, -3.1572265625, -3.018310546875, -2.87939453125, -2.740478515625, -2.6015625, -2.462646484375, -2.32373046875, -2.184814453125, -2.0458984375, -1.906982421875, -1.76806640625, -1.629150390625, -1.490234375, -1.351318359375, -1.21240234375, -1.073486328125, -0.9345703125, -0.795654296875, -0.65673828125, -0.517822265625, -0.37890625, -0.239990234375, -0.10107421875, 0.037841796875, 0.1767578125, 0.315673828125, 0.45458984375, 0.593505859375, 0.732421875, 0.871337890625, 1.01025390625, 1.149169921875, 1.2880859375, 1.427001953125, 1.56591796875, 1.704833984375, 1.84375, 1.982666015625, 2.12158203125, 2.260498046875, 2.3994140625, 2.538330078125, 2.67724609375, 2.816162109375, 2.955078125, 3.093994140625, 3.23291015625, 3.371826171875, 3.5107421875, 3.649658203125, 3.78857421875, 3.927490234375, 4.06640625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 8.0, 6.0, 5.0, 17.0, 43.0, 64.0, 128.0, 318.0, 966.0, 5545.0, 70864.0, 386950.0, 53533.0, 4321.0, 907.0, 313.0, 126.0, 61.0, 37.0, 24.0, 13.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.1875, -110.873046875, -107.55859375, -104.244140625, -100.9296875, -97.615234375, -94.30078125, -90.986328125, -87.671875, -84.357421875, -81.04296875, -77.728515625, -74.4140625, -71.099609375, -67.78515625, -64.470703125, -61.15625, -57.841796875, -54.52734375, -51.212890625, -47.8984375, -44.583984375, -41.26953125, -37.955078125, -34.640625, -31.326171875, -28.01171875, -24.697265625, -21.3828125, -18.068359375, -14.75390625, -11.439453125, -8.125, -4.810546875, -1.49609375, 1.818359375, 5.1328125, 8.447265625, 11.76171875, 15.076171875, 18.390625, 21.705078125, 25.01953125, 28.333984375, 31.6484375, 34.962890625, 38.27734375, 41.591796875, 44.90625, 48.220703125, 51.53515625, 54.849609375, 58.1640625, 61.478515625, 64.79296875, 68.107421875, 71.421875, 74.736328125, 78.05078125, 81.365234375, 84.6796875, 87.994140625, 91.30859375, 94.623046875, 97.9375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 14.0, 13.0, 21.0, 33.0, 47.0, 91.0, 118.0, 136.0, 135.0, 139.0, 88.0, 63.0, 48.0, 22.0, 11.0, 11.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09375, -18.618408203125, -18.14306640625, -17.667724609375, -17.1923828125, -16.717041015625, -16.24169921875, -15.766357421875, -15.291015625, -14.815673828125, -14.34033203125, -13.864990234375, -13.3896484375, -12.914306640625, -12.43896484375, -11.963623046875, -11.48828125, -11.012939453125, -10.53759765625, -10.062255859375, -9.5869140625, -9.111572265625, -8.63623046875, -8.160888671875, -7.685546875, -7.210205078125, -6.73486328125, -6.259521484375, -5.7841796875, -5.308837890625, -4.83349609375, -4.358154296875, -3.8828125, -3.407470703125, -2.93212890625, -2.456787109375, -1.9814453125, -1.506103515625, -1.03076171875, -0.555419921875, -0.080078125, 0.395263671875, 0.87060546875, 1.345947265625, 1.8212890625, 2.296630859375, 2.77197265625, 3.247314453125, 3.72265625, 4.197998046875, 4.67333984375, 5.148681640625, 5.6240234375, 6.099365234375, 6.57470703125, 7.050048828125, 7.525390625, 8.000732421875, 8.47607421875, 8.951416015625, 9.4267578125, 9.902099609375, 10.37744140625, 10.852783203125, 11.328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 2.0, 3.0, 4.0, 10.0, 14.0, 36.0, 74.0, 172.0, 91.0, 39.0, 16.0, 6.0, 6.0, 4.0, 7.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-106.58972930908203, -104.20504760742188, -101.82035827636719, -99.4356689453125, -97.05098724365234, -94.66630554199219, -92.2816162109375, -89.89692687988281, -87.51224517822266, -85.1275634765625, -82.74287414550781, -80.35818481445312, -77.97350311279297, -75.58882141113281, -73.20413208007812, -70.81944274902344, -68.43476104736328, -66.05007934570312, -63.66539001464844, -61.280704498291016, -58.896018981933594, -56.51133346557617, -54.12664794921875, -51.74196243286133, -49.357276916503906, -46.972591400146484, -44.58790588378906, -42.20322036743164, -39.81853485107422, -37.4338493347168, -35.049163818359375, -32.66447830200195, -30.27979278564453, -27.89510726928711, -25.510421752929688, -23.125736236572266, -20.741050720214844, -18.356365203857422, -15.9716796875, -13.586994171142578, -11.202308654785156, -8.817623138427734, -6.4329376220703125, -4.048252105712891, -1.6635665893554688, 0.7211189270019531, 3.105804443359375, 5.490489959716797, 7.875175476074219, 10.25986099243164, 12.644546508789062, 15.029232025146484, 17.413917541503906, 19.798603057861328, 22.18328857421875, 24.567974090576172, 26.952659606933594, 29.337345123291016, 31.722030639648438, 34.10671615600586, 36.49140167236328, 38.8760871887207, 41.260772705078125, 43.64545822143555, 46.03014373779297]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 3.0, 3.0, 4.0, 6.0, 15.0, 24.0, 36.0, 54.0, 85.0, 63.0, 58.0, 22.0, 26.0, 13.0, 10.0, 15.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.44866943359375, -30.308494567871094, -29.16832160949707, -28.028146743774414, -26.88797378540039, -25.747798919677734, -24.607624053955078, -23.467449188232422, -22.3272762298584, -21.187101364135742, -20.04692840576172, -18.906753540039062, -17.766578674316406, -16.626405715942383, -15.486230850219727, -14.346056938171387, -13.205883026123047, -12.065709114074707, -10.925535202026367, -9.785360336303711, -8.645186424255371, -7.505012512207031, -6.364838123321533, -5.224663734436035, -4.084489822387695, -2.9443156719207764, -1.8041415214538574, -0.6639673709869385, 0.47620677947998047, 1.6163806915283203, 2.7565550804138184, 3.8967294692993164, 5.036903381347656, 6.177077293395996, 7.317251682281494, 8.457426071166992, 9.597599983215332, 10.737773895263672, 11.877948760986328, 13.018122673034668, 14.158296585083008, 15.298470497131348, 16.438644409179688, 17.578819274902344, 18.718994140625, 19.859167098999023, 20.99934196472168, 22.139514923095703, 23.27968978881836, 24.419864654541016, 25.56003761291504, 26.700212478637695, 27.84038543701172, 28.980560302734375, 30.12073516845703, 31.260910034179688, 32.401084899902344, 33.541259765625, 34.681434631347656, 35.82160568237305, 36.9617805480957, 38.10195541381836, 39.242130279541016, 40.38230514526367, 41.52247619628906]}, "eval/loss": 6.05579948425293, "eval/wer": 1.3242760809202698, "eval/runtime": 647.7056, "eval/samples_per_second": 4.079, "eval/steps_per_second": 0.511} \ No newline at end of file +{"train/loss": 5.4388, "train/learning_rate": 2.718450704225352e-05, "train/epoch": 3.36, "train/global_step": 3000, "_runtime": 17848, "_timestamp": 1648159192, "_step": 3001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 11.0, 7.0, 12.0, 13.0, 21.0, 23.0, 25.0, 23.0, 31.0, 46.0, 47.0, 38.0, 49.0, 54.0, 50.0, 66.0, 47.0, 52.0, 45.0, 64.0, 48.0, 46.0, 37.0, 23.0, 29.0, 17.0, 11.0, 14.0, 4.0, 10.0, 8.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.06173706054688, -75.80459594726562, -73.54745483398438, -71.29032135009766, -69.0331802368164, -66.77603912353516, -64.51890563964844, -62.26176452636719, -60.00462341308594, -57.74748229980469, -55.4903450012207, -53.23320770263672, -50.97606658935547, -48.71892547607422, -46.461788177490234, -44.20465087890625, -41.947509765625, -39.69036865234375, -37.433231353759766, -35.17609405517578, -32.91895294189453, -30.661813735961914, -28.404674530029297, -26.14753532409668, -23.890396118164062, -21.633256912231445, -19.376117706298828, -17.11897850036621, -14.861839294433594, -12.604700088500977, -10.34756088256836, -8.090421676635742, -5.833290100097656, -3.576150894165039, -1.3190116882324219, 0.9381275177001953, 3.1952667236328125, 5.45240592956543, 7.709545135498047, 9.966684341430664, 12.223823547363281, 14.480962753295898, 16.738101959228516, 18.995241165161133, 21.25238037109375, 23.509519577026367, 25.766658782958984, 28.0237979888916, 30.28093719482422, 32.53807830810547, 34.79521560668945, 37.05235290527344, 39.30949401855469, 41.56663513183594, 43.82377243041992, 46.080909729003906, 48.338050842285156, 50.595191955566406, 52.85232925415039, 55.109466552734375, 57.366607666015625, 59.623748779296875, 61.88088607788086, 64.13802337646484, 66.3951644897461]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 13.0, 13.0, 10.0, 14.0, 18.0, 18.0, 18.0, 18.0, 23.0, 30.0, 35.0, 28.0, 38.0, 35.0, 33.0, 47.0, 52.0, 48.0, 36.0, 40.0, 40.0, 30.0, 41.0, 38.0, 42.0, 26.0, 27.0, 31.0, 23.0, 20.0, 16.0, 17.0, 18.0, 12.0, 6.0, 11.0, 6.0, 7.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.63709259033203, -58.81853485107422, -56.999977111816406, -55.18142318725586, -53.36286544799805, -51.544307708740234, -49.72575378417969, -47.907196044921875, -46.08863830566406, -44.27008056640625, -42.45152282714844, -40.63296890258789, -38.81441116333008, -36.995853424072266, -35.17729949951172, -33.358741760253906, -31.540184020996094, -29.72162628173828, -27.9030704498291, -26.084514617919922, -24.26595687866211, -22.447399139404297, -20.628843307495117, -18.810287475585938, -16.991729736328125, -15.173172950744629, -13.354616165161133, -11.536059379577637, -9.71750259399414, -7.8989458084106445, -6.080389022827148, -4.261832237243652, -2.4432754516601562, -0.6247186660766602, 1.193838119506836, 3.012394905090332, 4.830951690673828, 6.649508476257324, 8.46806526184082, 10.286622047424316, 12.105178833007812, 13.923735618591309, 15.742292404174805, 17.560848236083984, 19.379405975341797, 21.19796371459961, 23.01651954650879, 24.83507537841797, 26.65363311767578, 28.472190856933594, 30.290746688842773, 32.10930252075195, 33.927860260009766, 35.74641799926758, 37.564971923828125, 39.38352966308594, 41.20208740234375, 43.02064514160156, 44.839202880859375, 46.65775680541992, 48.476314544677734, 50.29487228393555, 52.113426208496094, 53.931983947753906, 55.75054168701172]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 14.0, 22.0, 46.0, 71.0, 123.0, 214.0, 366.0, 592.0, 1049.0, 1829.0, 2957.0, 5431.0, 9784.0, 17781.0, 31737.0, 59061.0, 108717.0, 194431.0, 329891.0, 504693.0, 657690.0, 697545.0, 589223.0, 411198.0, 252856.0, 142775.0, 78256.0, 42971.0, 23178.0, 12903.0, 7223.0, 4075.0, 2355.0, 1346.0, 754.0, 450.0, 276.0, 144.0, 86.0, 72.0, 31.0, 22.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-43.25, -41.98681640625, -40.7236328125, -39.46044921875, -38.197265625, -36.93408203125, -35.6708984375, -34.40771484375, -33.14453125, -31.88134765625, -30.6181640625, -29.35498046875, -28.091796875, -26.82861328125, -25.5654296875, -24.30224609375, -23.0390625, -21.77587890625, -20.5126953125, -19.24951171875, -17.986328125, -16.72314453125, -15.4599609375, -14.19677734375, -12.93359375, -11.67041015625, -10.4072265625, -9.14404296875, -7.880859375, -6.61767578125, -5.3544921875, -4.09130859375, -2.828125, -1.56494140625, -0.3017578125, 0.96142578125, 2.224609375, 3.48779296875, 4.7509765625, 6.01416015625, 7.27734375, 8.54052734375, 9.8037109375, 11.06689453125, 12.330078125, 13.59326171875, 14.8564453125, 16.11962890625, 17.3828125, 18.64599609375, 19.9091796875, 21.17236328125, 22.435546875, 23.69873046875, 24.9619140625, 26.22509765625, 27.48828125, 28.75146484375, 30.0146484375, 31.27783203125, 32.541015625, 33.80419921875, 35.0673828125, 36.33056640625, 37.59375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 13.0, 12.0, 12.0, 15.0, 17.0, 9.0, 23.0, 18.0, 38.0, 43.0, 24.0, 40.0, 38.0, 48.0, 39.0, 36.0, 40.0, 47.0, 42.0, 40.0, 40.0, 34.0, 41.0, 37.0, 29.0, 19.0, 26.0, 32.0, 21.0, 22.0, 15.0, 17.0, 16.0, 9.0, 11.0, 8.0, 4.0, 8.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.59375, -48.0654296875, -46.537109375, -45.0087890625, -43.48046875, -41.9521484375, -40.423828125, -38.8955078125, -37.3671875, -35.8388671875, -34.310546875, -32.7822265625, -31.25390625, -29.7255859375, -28.197265625, -26.6689453125, -25.140625, -23.6123046875, -22.083984375, -20.5556640625, -19.02734375, -17.4990234375, -15.970703125, -14.4423828125, -12.9140625, -11.3857421875, -9.857421875, -8.3291015625, -6.80078125, -5.2724609375, -3.744140625, -2.2158203125, -0.6875, 0.8408203125, 2.369140625, 3.8974609375, 5.42578125, 6.9541015625, 8.482421875, 10.0107421875, 11.5390625, 13.0673828125, 14.595703125, 16.1240234375, 17.65234375, 19.1806640625, 20.708984375, 22.2373046875, 23.765625, 25.2939453125, 26.822265625, 28.3505859375, 29.87890625, 31.4072265625, 32.935546875, 34.4638671875, 35.9921875, 37.5205078125, 39.048828125, 40.5771484375, 42.10546875, 43.6337890625, 45.162109375, 46.6904296875, 48.21875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 8.0, 10.0, 22.0, 29.0, 56.0, 83.0, 101.0, 194.0, 297.0, 466.0, 683.0, 1026.0, 1571.0, 2516.0, 3766.0, 5693.0, 8547.0, 13014.0, 19812.0, 30244.0, 45341.0, 67588.0, 98853.0, 143344.0, 204170.0, 281418.0, 374439.0, 471201.0, 526729.0, 487888.0, 398331.0, 301924.0, 219679.0, 156694.0, 108257.0, 73661.0, 49482.0, 33402.0, 21755.0, 14565.0, 9392.0, 6206.0, 4082.0, 2697.0, 1708.0, 1181.0, 746.0, 500.0, 339.0, 216.0, 119.0, 95.0, 65.0, 35.0, 21.0, 12.0, 8.0, 6.0, 4.0, 3.0, 3.0], "bins": [-33.375, -32.3193359375, -31.263671875, -30.2080078125, -29.15234375, -28.0966796875, -27.041015625, -25.9853515625, -24.9296875, -23.8740234375, -22.818359375, -21.7626953125, -20.70703125, -19.6513671875, -18.595703125, -17.5400390625, -16.484375, -15.4287109375, -14.373046875, -13.3173828125, -12.26171875, -11.2060546875, -10.150390625, -9.0947265625, -8.0390625, -6.9833984375, -5.927734375, -4.8720703125, -3.81640625, -2.7607421875, -1.705078125, -0.6494140625, 0.40625, 1.4619140625, 2.517578125, 3.5732421875, 4.62890625, 5.6845703125, 6.740234375, 7.7958984375, 8.8515625, 9.9072265625, 10.962890625, 12.0185546875, 13.07421875, 14.1298828125, 15.185546875, 16.2412109375, 17.296875, 18.3525390625, 19.408203125, 20.4638671875, 21.51953125, 22.5751953125, 23.630859375, 24.6865234375, 25.7421875, 26.7978515625, 27.853515625, 28.9091796875, 29.96484375, 31.0205078125, 32.076171875, 33.1318359375, 34.1875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 12.0, 9.0, 12.0, 14.0, 39.0, 34.0, 42.0, 51.0, 55.0, 102.0, 109.0, 113.0, 116.0, 171.0, 208.0, 202.0, 229.0, 256.0, 261.0, 250.0, 251.0, 250.0, 198.0, 173.0, 137.0, 143.0, 110.0, 90.0, 77.0, 64.0, 52.0, 37.0, 35.0, 33.0, 22.0, 27.0, 14.0, 12.0, 8.0, 8.0, 8.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-17.859375, -17.2802734375, -16.701171875, -16.1220703125, -15.54296875, -14.9638671875, -14.384765625, -13.8056640625, -13.2265625, -12.6474609375, -12.068359375, -11.4892578125, -10.91015625, -10.3310546875, -9.751953125, -9.1728515625, -8.59375, -8.0146484375, -7.435546875, -6.8564453125, -6.27734375, -5.6982421875, -5.119140625, -4.5400390625, -3.9609375, -3.3818359375, -2.802734375, -2.2236328125, -1.64453125, -1.0654296875, -0.486328125, 0.0927734375, 0.671875, 1.2509765625, 1.830078125, 2.4091796875, 2.98828125, 3.5673828125, 4.146484375, 4.7255859375, 5.3046875, 5.8837890625, 6.462890625, 7.0419921875, 7.62109375, 8.2001953125, 8.779296875, 9.3583984375, 9.9375, 10.5166015625, 11.095703125, 11.6748046875, 12.25390625, 12.8330078125, 13.412109375, 13.9912109375, 14.5703125, 15.1494140625, 15.728515625, 16.3076171875, 16.88671875, 17.4658203125, 18.044921875, 18.6240234375, 19.203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 3.0, 5.0, 7.0, 11.0, 9.0, 15.0, 24.0, 22.0, 16.0, 25.0, 32.0, 30.0, 31.0, 39.0, 50.0, 60.0, 46.0, 46.0, 35.0, 51.0, 51.0, 36.0, 52.0, 42.0, 37.0, 38.0, 37.0, 19.0, 24.0, 15.0, 18.0, 11.0, 11.0, 11.0, 12.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.551883697509766, -41.90956497192383, -40.267250061035156, -38.62493133544922, -36.98261642456055, -35.34029769897461, -33.69798278808594, -32.0556640625, -30.413349151611328, -28.771032333374023, -27.12871551513672, -25.486398696899414, -23.84408187866211, -22.201763153076172, -20.5594482421875, -18.917129516601562, -17.274812698364258, -15.632495880126953, -13.990179061889648, -12.347862243652344, -10.705545425415039, -9.063227653503418, -7.420910835266113, -5.778594017028809, -4.136277198791504, -2.493960380554199, -0.8516433238983154, 0.7906737327575684, 2.432990550994873, 4.075307846069336, 5.717624664306641, 7.359941482543945, 9.00225830078125, 10.644575119018555, 12.28689193725586, 13.929208755493164, 15.571525573730469, 17.213844299316406, 18.856159210205078, 20.498477935791016, 22.140792846679688, 23.783109664916992, 25.425426483154297, 27.0677433013916, 28.710060119628906, 30.352378845214844, 31.994693756103516, 33.63701248168945, 35.279327392578125, 36.92164611816406, 38.563961029052734, 40.20627975463867, 41.848594665527344, 43.49091339111328, 45.13322830200195, 46.77554702758789, 48.41786575317383, 50.060184478759766, 51.70249938964844, 53.344818115234375, 54.98713302612305, 56.629451751708984, 58.271766662597656, 59.914085388183594, 61.556400299072266]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 12.0, 9.0, 15.0, 11.0, 17.0, 15.0, 28.0, 17.0, 25.0, 33.0, 39.0, 37.0, 43.0, 44.0, 43.0, 35.0, 46.0, 52.0, 45.0, 40.0, 42.0, 37.0, 35.0, 39.0, 28.0, 27.0, 28.0, 18.0, 13.0, 21.0, 19.0, 17.0, 20.0, 11.0, 9.0, 2.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-60.92025375366211, -59.243980407714844, -57.567710876464844, -55.89143753051758, -54.21516799926758, -52.53889465332031, -50.86262512207031, -49.18635177612305, -47.51007843017578, -45.833805084228516, -44.157535552978516, -42.48126220703125, -40.80499267578125, -39.128719329833984, -37.45244598388672, -35.77617645263672, -34.09990692138672, -32.42363357543945, -30.747364044189453, -29.071090698242188, -27.394821166992188, -25.718547821044922, -24.04227638244629, -22.366004943847656, -20.689733505249023, -19.01346206665039, -17.337190628051758, -15.660918235778809, -13.984646797180176, -12.308375358581543, -10.632102966308594, -8.955831527709961, -7.2795562744140625, -5.60328483581543, -3.9270129203796387, -2.2507410049438477, -0.5744695663452148, 1.101801872253418, 2.778074264526367, 4.454345703125, 6.130617141723633, 7.806888580322266, 9.483160018920898, 11.159432411193848, 12.83570384979248, 14.511975288391113, 16.188247680664062, 17.864519119262695, 19.540790557861328, 21.21706199645996, 22.893333435058594, 24.56960678100586, 26.24587631225586, 27.922149658203125, 29.598421096801758, 31.27469253540039, 32.950965881347656, 34.62723922729492, 36.30350875854492, 37.97978210449219, 39.65605163574219, 41.33232498168945, 43.00859832763672, 44.68486785888672, 46.36113739013672]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 12.0, 16.0, 20.0, 45.0, 47.0, 88.0, 130.0, 196.0, 258.0, 407.0, 589.0, 879.0, 1317.0, 2077.0, 3182.0, 5109.0, 8155.0, 13420.0, 22239.0, 37998.0, 65861.0, 115379.0, 184381.0, 214125.0, 153324.0, 90489.0, 51861.0, 29810.0, 17825.0, 10779.0, 6600.0, 4217.0, 2682.0, 1741.0, 1081.0, 757.0, 490.0, 323.0, 227.0, 141.0, 103.0, 60.0, 31.0, 15.0, 26.0, 14.0, 7.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-28.1875, -27.256591796875, -26.32568359375, -25.394775390625, -24.4638671875, -23.532958984375, -22.60205078125, -21.671142578125, -20.740234375, -19.809326171875, -18.87841796875, -17.947509765625, -17.0166015625, -16.085693359375, -15.15478515625, -14.223876953125, -13.29296875, -12.362060546875, -11.43115234375, -10.500244140625, -9.5693359375, -8.638427734375, -7.70751953125, -6.776611328125, -5.845703125, -4.914794921875, -3.98388671875, -3.052978515625, -2.1220703125, -1.191162109375, -0.26025390625, 0.670654296875, 1.6015625, 2.532470703125, 3.46337890625, 4.394287109375, 5.3251953125, 6.256103515625, 7.18701171875, 8.117919921875, 9.048828125, 9.979736328125, 10.91064453125, 11.841552734375, 12.7724609375, 13.703369140625, 14.63427734375, 15.565185546875, 16.49609375, 17.427001953125, 18.35791015625, 19.288818359375, 20.2197265625, 21.150634765625, 22.08154296875, 23.012451171875, 23.943359375, 24.874267578125, 25.80517578125, 26.736083984375, 27.6669921875, 28.597900390625, 29.52880859375, 30.459716796875, 31.390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 4.0, 5.0, 5.0, 11.0, 12.0, 10.0, 13.0, 15.0, 25.0, 12.0, 24.0, 23.0, 29.0, 42.0, 24.0, 42.0, 43.0, 43.0, 35.0, 41.0, 40.0, 41.0, 45.0, 41.0, 36.0, 27.0, 44.0, 26.0, 28.0, 26.0, 24.0, 26.0, 26.0, 14.0, 20.0, 13.0, 8.0, 16.0, 8.0, 11.0, 8.0, 6.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.09375, -48.5712890625, -47.048828125, -45.5263671875, -44.00390625, -42.4814453125, -40.958984375, -39.4365234375, -37.9140625, -36.3916015625, -34.869140625, -33.3466796875, -31.82421875, -30.3017578125, -28.779296875, -27.2568359375, -25.734375, -24.2119140625, -22.689453125, -21.1669921875, -19.64453125, -18.1220703125, -16.599609375, -15.0771484375, -13.5546875, -12.0322265625, -10.509765625, -8.9873046875, -7.46484375, -5.9423828125, -4.419921875, -2.8974609375, -1.375, 0.1474609375, 1.669921875, 3.1923828125, 4.71484375, 6.2373046875, 7.759765625, 9.2822265625, 10.8046875, 12.3271484375, 13.849609375, 15.3720703125, 16.89453125, 18.4169921875, 19.939453125, 21.4619140625, 22.984375, 24.5068359375, 26.029296875, 27.5517578125, 29.07421875, 30.5966796875, 32.119140625, 33.6416015625, 35.1640625, 36.6865234375, 38.208984375, 39.7314453125, 41.25390625, 42.7763671875, 44.298828125, 45.8212890625, 47.34375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 5.0, 9.0, 9.0, 9.0, 12.0, 16.0, 25.0, 33.0, 33.0, 56.0, 63.0, 87.0, 133.0, 192.0, 288.0, 411.0, 629.0, 954.0, 1609.0, 2687.0, 4600.0, 8076.0, 14688.0, 29051.0, 59421.0, 124690.0, 231141.0, 257896.0, 157322.0, 75845.0, 36315.0, 18455.0, 9737.0, 5519.0, 3129.0, 1906.0, 1211.0, 742.0, 497.0, 315.0, 214.0, 159.0, 111.0, 64.0, 52.0, 44.0, 35.0, 17.0, 17.0, 9.0, 9.0, 4.0, 7.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.21875, -20.537841796875, -19.85693359375, -19.176025390625, -18.4951171875, -17.814208984375, -17.13330078125, -16.452392578125, -15.771484375, -15.090576171875, -14.40966796875, -13.728759765625, -13.0478515625, -12.366943359375, -11.68603515625, -11.005126953125, -10.32421875, -9.643310546875, -8.96240234375, -8.281494140625, -7.6005859375, -6.919677734375, -6.23876953125, -5.557861328125, -4.876953125, -4.196044921875, -3.51513671875, -2.834228515625, -2.1533203125, -1.472412109375, -0.79150390625, -0.110595703125, 0.5703125, 1.251220703125, 1.93212890625, 2.613037109375, 3.2939453125, 3.974853515625, 4.65576171875, 5.336669921875, 6.017578125, 6.698486328125, 7.37939453125, 8.060302734375, 8.7412109375, 9.422119140625, 10.10302734375, 10.783935546875, 11.46484375, 12.145751953125, 12.82666015625, 13.507568359375, 14.1884765625, 14.869384765625, 15.55029296875, 16.231201171875, 16.912109375, 17.593017578125, 18.27392578125, 18.954833984375, 19.6357421875, 20.316650390625, 20.99755859375, 21.678466796875, 22.359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 2.0, 4.0, 8.0, 13.0, 15.0, 9.0, 14.0, 18.0, 35.0, 23.0, 25.0, 23.0, 24.0, 27.0, 28.0, 38.0, 36.0, 50.0, 37.0, 41.0, 53.0, 37.0, 37.0, 42.0, 33.0, 32.0, 40.0, 38.0, 36.0, 19.0, 19.0, 26.0, 16.0, 18.0, 9.0, 12.0, 11.0, 12.0, 12.0, 7.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.859375, -30.811767578125, -29.76416015625, -28.716552734375, -27.6689453125, -26.621337890625, -25.57373046875, -24.526123046875, -23.478515625, -22.430908203125, -21.38330078125, -20.335693359375, -19.2880859375, -18.240478515625, -17.19287109375, -16.145263671875, -15.09765625, -14.050048828125, -13.00244140625, -11.954833984375, -10.9072265625, -9.859619140625, -8.81201171875, -7.764404296875, -6.716796875, -5.669189453125, -4.62158203125, -3.573974609375, -2.5263671875, -1.478759765625, -0.43115234375, 0.616455078125, 1.6640625, 2.711669921875, 3.75927734375, 4.806884765625, 5.8544921875, 6.902099609375, 7.94970703125, 8.997314453125, 10.044921875, 11.092529296875, 12.14013671875, 13.187744140625, 14.2353515625, 15.282958984375, 16.33056640625, 17.378173828125, 18.42578125, 19.473388671875, 20.52099609375, 21.568603515625, 22.6162109375, 23.663818359375, 24.71142578125, 25.759033203125, 26.806640625, 27.854248046875, 28.90185546875, 29.949462890625, 30.9970703125, 32.044677734375, 33.09228515625, 34.139892578125, 35.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 10.0, 6.0, 5.0, 10.0, 8.0, 15.0, 26.0, 39.0, 39.0, 64.0, 89.0, 115.0, 184.0, 231.0, 339.0, 459.0, 654.0, 955.0, 1319.0, 2036.0, 3166.0, 5110.0, 8550.0, 15198.0, 30030.0, 72718.0, 279225.0, 433477.0, 108777.0, 39282.0, 18874.0, 10018.0, 6089.0, 3782.0, 2339.0, 1558.0, 1146.0, 775.0, 543.0, 382.0, 256.0, 180.0, 135.0, 93.0, 69.0, 65.0, 27.0, 21.0, 21.0, 13.0, 13.0, 12.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.640625, -15.138916015625, -14.63720703125, -14.135498046875, -13.6337890625, -13.132080078125, -12.63037109375, -12.128662109375, -11.626953125, -11.125244140625, -10.62353515625, -10.121826171875, -9.6201171875, -9.118408203125, -8.61669921875, -8.114990234375, -7.61328125, -7.111572265625, -6.60986328125, -6.108154296875, -5.6064453125, -5.104736328125, -4.60302734375, -4.101318359375, -3.599609375, -3.097900390625, -2.59619140625, -2.094482421875, -1.5927734375, -1.091064453125, -0.58935546875, -0.087646484375, 0.4140625, 0.915771484375, 1.41748046875, 1.919189453125, 2.4208984375, 2.922607421875, 3.42431640625, 3.926025390625, 4.427734375, 4.929443359375, 5.43115234375, 5.932861328125, 6.4345703125, 6.936279296875, 7.43798828125, 7.939697265625, 8.44140625, 8.943115234375, 9.44482421875, 9.946533203125, 10.4482421875, 10.949951171875, 11.45166015625, 11.953369140625, 12.455078125, 12.956787109375, 13.45849609375, 13.960205078125, 14.4619140625, 14.963623046875, 15.46533203125, 15.967041015625, 16.46875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 4.0, 3.0, 12.0, 16.0, 15.0, 9.0, 26.0, 25.0, 51.0, 104.0, 180.0, 201.0, 113.0, 57.0, 45.0, 33.0, 27.0, 17.0, 14.0, 9.0, 6.0, 9.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042877197265625, -0.004154324531555176, -0.0040209293365478516, -0.0038875341415405273, -0.003754138946533203, -0.003620743751525879, -0.0034873485565185547, -0.0033539533615112305, -0.0032205581665039062, -0.003087162971496582, -0.002953767776489258, -0.0028203725814819336, -0.0026869773864746094, -0.002553582191467285, -0.002420186996459961, -0.0022867918014526367, -0.0021533966064453125, -0.0020200014114379883, -0.001886606216430664, -0.0017532110214233398, -0.0016198158264160156, -0.0014864206314086914, -0.0013530254364013672, -0.001219630241394043, -0.0010862350463867188, -0.0009528398513793945, -0.0008194446563720703, -0.0006860494613647461, -0.0005526542663574219, -0.00041925907135009766, -0.00028586387634277344, -0.00015246868133544922, -1.9073486328125e-05, 0.00011432170867919922, 0.00024771690368652344, 0.00038111209869384766, 0.0005145072937011719, 0.0006479024887084961, 0.0007812976837158203, 0.0009146928787231445, 0.0010480880737304688, 0.001181483268737793, 0.0013148784637451172, 0.0014482736587524414, 0.0015816688537597656, 0.0017150640487670898, 0.001848459243774414, 0.0019818544387817383, 0.0021152496337890625, 0.0022486448287963867, 0.002382040023803711, 0.002515435218811035, 0.0026488304138183594, 0.0027822256088256836, 0.002915620803833008, 0.003049015998840332, 0.0031824111938476562, 0.0033158063888549805, 0.0034492015838623047, 0.003582596778869629, 0.003715991973876953, 0.0038493871688842773, 0.0039827823638916016, 0.004116177558898926, 0.00424957275390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 14.0, 18.0, 30.0, 37.0, 52.0, 75.0, 105.0, 169.0, 243.0, 353.0, 479.0, 707.0, 1053.0, 1531.0, 2225.0, 3399.0, 5310.0, 8285.0, 13562.0, 22394.0, 40037.0, 74961.0, 151805.0, 296265.0, 204997.0, 97008.0, 50373.0, 28144.0, 16286.0, 10054.0, 6278.0, 4103.0, 2634.0, 1741.0, 1198.0, 826.0, 558.0, 376.0, 258.0, 208.0, 135.0, 77.0, 66.0, 49.0, 27.0, 16.0, 14.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6484375, -13.2177734375, -12.787109375, -12.3564453125, -11.92578125, -11.4951171875, -11.064453125, -10.6337890625, -10.203125, -9.7724609375, -9.341796875, -8.9111328125, -8.48046875, -8.0498046875, -7.619140625, -7.1884765625, -6.7578125, -6.3271484375, -5.896484375, -5.4658203125, -5.03515625, -4.6044921875, -4.173828125, -3.7431640625, -3.3125, -2.8818359375, -2.451171875, -2.0205078125, -1.58984375, -1.1591796875, -0.728515625, -0.2978515625, 0.1328125, 0.5634765625, 0.994140625, 1.4248046875, 1.85546875, 2.2861328125, 2.716796875, 3.1474609375, 3.578125, 4.0087890625, 4.439453125, 4.8701171875, 5.30078125, 5.7314453125, 6.162109375, 6.5927734375, 7.0234375, 7.4541015625, 7.884765625, 8.3154296875, 8.74609375, 9.1767578125, 9.607421875, 10.0380859375, 10.46875, 10.8994140625, 11.330078125, 11.7607421875, 12.19140625, 12.6220703125, 13.052734375, 13.4833984375, 13.9140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 6.0, 10.0, 4.0, 14.0, 13.0, 19.0, 15.0, 16.0, 38.0, 38.0, 49.0, 63.0, 66.0, 67.0, 101.0, 92.0, 65.0, 61.0, 60.0, 45.0, 25.0, 19.0, 17.0, 12.0, 19.0, 8.0, 6.0, 3.0, 5.0, 6.0, 4.0, 2.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.9375, -4.79742431640625, -4.6573486328125, -4.51727294921875, -4.377197265625, -4.23712158203125, -4.0970458984375, -3.95697021484375, -3.81689453125, -3.67681884765625, -3.5367431640625, -3.39666748046875, -3.256591796875, -3.11651611328125, -2.9764404296875, -2.83636474609375, -2.6962890625, -2.55621337890625, -2.4161376953125, -2.27606201171875, -2.135986328125, -1.99591064453125, -1.8558349609375, -1.71575927734375, -1.57568359375, -1.43560791015625, -1.2955322265625, -1.15545654296875, -1.015380859375, -0.87530517578125, -0.7352294921875, -0.59515380859375, -0.455078125, -0.31500244140625, -0.1749267578125, -0.03485107421875, 0.105224609375, 0.24530029296875, 0.3853759765625, 0.52545166015625, 0.66552734375, 0.80560302734375, 0.9456787109375, 1.08575439453125, 1.225830078125, 1.36590576171875, 1.5059814453125, 1.64605712890625, 1.7861328125, 1.92620849609375, 2.0662841796875, 2.20635986328125, 2.346435546875, 2.48651123046875, 2.6265869140625, 2.76666259765625, 2.90673828125, 3.04681396484375, 3.1868896484375, 3.32696533203125, 3.467041015625, 3.60711669921875, 3.7471923828125, 3.88726806640625, 4.02734375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 8.0, 10.0, 7.0, 18.0, 18.0, 27.0, 19.0, 22.0, 42.0, 42.0, 43.0, 47.0, 34.0, 50.0, 44.0, 52.0, 46.0, 51.0, 46.0, 44.0, 35.0, 51.0, 38.0, 31.0, 32.0, 29.0, 14.0, 12.0, 12.0, 12.0, 6.0, 11.0, 10.0, 9.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.960784912109375, -45.37490463256836, -43.789024353027344, -42.20314025878906, -40.61725997924805, -39.03137969970703, -37.44549560546875, -35.859615325927734, -34.27373504638672, -32.6878547668457, -31.101972579956055, -29.516090393066406, -27.93021011352539, -26.344329833984375, -24.758447647094727, -23.172565460205078, -21.586685180664062, -20.000804901123047, -18.4149227142334, -16.82904052734375, -15.243160247802734, -13.657279014587402, -12.07139778137207, -10.485516548156738, -8.899635314941406, -7.313754081726074, -5.727872848510742, -4.14199161529541, -2.556110382080078, -0.9702291488647461, 0.6156520843505859, 2.201533317565918, 3.7874183654785156, 5.373299598693848, 6.95918083190918, 8.545062065124512, 10.130943298339844, 11.716824531555176, 13.302705764770508, 14.88858699798584, 16.474468231201172, 18.060348510742188, 19.646230697631836, 21.232112884521484, 22.8179931640625, 24.403873443603516, 25.989755630493164, 27.575637817382812, 29.161518096923828, 30.747398376464844, 32.333282470703125, 33.91916275024414, 35.505043029785156, 37.09092330932617, 38.67680358886719, 40.26268768310547, 41.848567962646484, 43.4344482421875, 45.02033233642578, 46.6062126159668, 48.19209289550781, 49.77797317504883, 51.363853454589844, 52.949737548828125, 54.53561782836914]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 10.0, 13.0, 13.0, 14.0, 16.0, 14.0, 17.0, 25.0, 29.0, 32.0, 35.0, 28.0, 44.0, 44.0, 44.0, 51.0, 45.0, 41.0, 42.0, 45.0, 42.0, 37.0, 40.0, 34.0, 25.0, 30.0, 31.0, 17.0, 21.0, 21.0, 17.0, 16.0, 25.0, 10.0, 6.0, 5.0, 3.0, 5.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-56.730491638183594, -55.174625396728516, -53.6187629699707, -52.062896728515625, -50.50703430175781, -48.951168060302734, -47.395301818847656, -45.839439392089844, -44.28357696533203, -42.72771072387695, -41.17184829711914, -39.61598205566406, -38.06011962890625, -36.50425338745117, -34.948387145996094, -33.39252471923828, -31.836658477783203, -30.280794143676758, -28.724929809570312, -27.169063568115234, -25.613201141357422, -24.057334899902344, -22.5014705657959, -20.945606231689453, -19.389741897583008, -17.833877563476562, -16.278013229370117, -14.722147941589355, -13.16628360748291, -11.610419273376465, -10.054553985595703, -8.498689651489258, -6.942829132080078, -5.386964797973633, -3.8310999870300293, -2.275235176086426, -0.7193708419799805, 0.8364934921264648, 2.3923587799072266, 3.948223114013672, 5.504087448120117, 7.0599517822265625, 8.615816116333008, 10.17168140411377, 11.727545738220215, 13.28341007232666, 14.839275360107422, 16.395139694213867, 17.951004028320312, 19.506868362426758, 21.062732696533203, 22.61859893798828, 24.174461364746094, 25.730327606201172, 27.286191940307617, 28.842056274414062, 30.397920608520508, 31.953784942626953, 33.50965118408203, 35.065513610839844, 36.62137985229492, 38.177242279052734, 39.73310852050781, 41.288970947265625, 42.8448371887207]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 11.0, 11.0, 23.0, 40.0, 51.0, 93.0, 128.0, 210.0, 354.0, 563.0, 859.0, 1282.0, 2009.0, 3122.0, 4727.0, 7262.0, 11127.0, 16647.0, 24240.0, 34748.0, 48068.0, 63970.0, 80513.0, 94429.0, 104199.0, 105437.0, 100115.0, 87733.0, 71920.0, 55916.0, 40866.0, 28949.0, 20057.0, 13515.0, 8838.0, 5765.0, 3785.0, 2503.0, 1618.0, 1007.0, 669.0, 449.0, 266.0, 187.0, 91.0, 72.0, 48.0, 23.0, 19.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0], "bins": [-32.65625, -31.702392578125, -30.74853515625, -29.794677734375, -28.8408203125, -27.886962890625, -26.93310546875, -25.979248046875, -25.025390625, -24.071533203125, -23.11767578125, -22.163818359375, -21.2099609375, -20.256103515625, -19.30224609375, -18.348388671875, -17.39453125, -16.440673828125, -15.48681640625, -14.532958984375, -13.5791015625, -12.625244140625, -11.67138671875, -10.717529296875, -9.763671875, -8.809814453125, -7.85595703125, -6.902099609375, -5.9482421875, -4.994384765625, -4.04052734375, -3.086669921875, -2.1328125, -1.178955078125, -0.22509765625, 0.728759765625, 1.6826171875, 2.636474609375, 3.59033203125, 4.544189453125, 5.498046875, 6.451904296875, 7.40576171875, 8.359619140625, 9.3134765625, 10.267333984375, 11.22119140625, 12.175048828125, 13.12890625, 14.082763671875, 15.03662109375, 15.990478515625, 16.9443359375, 17.898193359375, 18.85205078125, 19.805908203125, 20.759765625, 21.713623046875, 22.66748046875, 23.621337890625, 24.5751953125, 25.529052734375, 26.48291015625, 27.436767578125, 28.390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 6.0, 4.0, 2.0, 9.0, 6.0, 10.0, 15.0, 12.0, 21.0, 11.0, 27.0, 31.0, 23.0, 40.0, 35.0, 29.0, 36.0, 35.0, 45.0, 39.0, 36.0, 43.0, 41.0, 35.0, 51.0, 32.0, 32.0, 38.0, 34.0, 31.0, 19.0, 28.0, 24.0, 21.0, 20.0, 13.0, 8.0, 18.0, 13.0, 8.0, 10.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-50.8125, -49.4169921875, -48.021484375, -46.6259765625, -45.23046875, -43.8349609375, -42.439453125, -41.0439453125, -39.6484375, -38.2529296875, -36.857421875, -35.4619140625, -34.06640625, -32.6708984375, -31.275390625, -29.8798828125, -28.484375, -27.0888671875, -25.693359375, -24.2978515625, -22.90234375, -21.5068359375, -20.111328125, -18.7158203125, -17.3203125, -15.9248046875, -14.529296875, -13.1337890625, -11.73828125, -10.3427734375, -8.947265625, -7.5517578125, -6.15625, -4.7607421875, -3.365234375, -1.9697265625, -0.57421875, 0.8212890625, 2.216796875, 3.6123046875, 5.0078125, 6.4033203125, 7.798828125, 9.1943359375, 10.58984375, 11.9853515625, 13.380859375, 14.7763671875, 16.171875, 17.5673828125, 18.962890625, 20.3583984375, 21.75390625, 23.1494140625, 24.544921875, 25.9404296875, 27.3359375, 28.7314453125, 30.126953125, 31.5224609375, 32.91796875, 34.3134765625, 35.708984375, 37.1044921875, 38.5]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 6.0, 7.0, 8.0, 33.0, 55.0, 77.0, 115.0, 226.0, 358.0, 509.0, 844.0, 1332.0, 2060.0, 3229.0, 5107.0, 7945.0, 12442.0, 18378.0, 26769.0, 39058.0, 54026.0, 71789.0, 88862.0, 104032.0, 110916.0, 108697.0, 98298.0, 81919.0, 63473.0, 47355.0, 33657.0, 23046.0, 15568.0, 10185.0, 6558.0, 4283.0, 2646.0, 1752.0, 1113.0, 702.0, 417.0, 277.0, 184.0, 108.0, 57.0, 36.0, 17.0, 12.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0], "bins": [-42.3125, -41.09619140625, -39.8798828125, -38.66357421875, -37.447265625, -36.23095703125, -35.0146484375, -33.79833984375, -32.58203125, -31.36572265625, -30.1494140625, -28.93310546875, -27.716796875, -26.50048828125, -25.2841796875, -24.06787109375, -22.8515625, -21.63525390625, -20.4189453125, -19.20263671875, -17.986328125, -16.77001953125, -15.5537109375, -14.33740234375, -13.12109375, -11.90478515625, -10.6884765625, -9.47216796875, -8.255859375, -7.03955078125, -5.8232421875, -4.60693359375, -3.390625, -2.17431640625, -0.9580078125, 0.25830078125, 1.474609375, 2.69091796875, 3.9072265625, 5.12353515625, 6.33984375, 7.55615234375, 8.7724609375, 9.98876953125, 11.205078125, 12.42138671875, 13.6376953125, 14.85400390625, 16.0703125, 17.28662109375, 18.5029296875, 19.71923828125, 20.935546875, 22.15185546875, 23.3681640625, 24.58447265625, 25.80078125, 27.01708984375, 28.2333984375, 29.44970703125, 30.666015625, 31.88232421875, 33.0986328125, 34.31494140625, 35.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 5.0, 12.0, 14.0, 21.0, 11.0, 23.0, 26.0, 25.0, 27.0, 32.0, 27.0, 37.0, 34.0, 44.0, 37.0, 47.0, 26.0, 46.0, 43.0, 36.0, 53.0, 28.0, 37.0, 30.0, 37.0, 34.0, 28.0, 37.0, 20.0, 17.0, 15.0, 15.0, 11.0, 7.0, 15.0, 9.0, 4.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.9375, -31.984375, -31.03125, -30.078125, -29.125, -28.171875, -27.21875, -26.265625, -25.3125, -24.359375, -23.40625, -22.453125, -21.5, -20.546875, -19.59375, -18.640625, -17.6875, -16.734375, -15.78125, -14.828125, -13.875, -12.921875, -11.96875, -11.015625, -10.0625, -9.109375, -8.15625, -7.203125, -6.25, -5.296875, -4.34375, -3.390625, -2.4375, -1.484375, -0.53125, 0.421875, 1.375, 2.328125, 3.28125, 4.234375, 5.1875, 6.140625, 7.09375, 8.046875, 9.0, 9.953125, 10.90625, 11.859375, 12.8125, 13.765625, 14.71875, 15.671875, 16.625, 17.578125, 18.53125, 19.484375, 20.4375, 21.390625, 22.34375, 23.296875, 24.25, 25.203125, 26.15625, 27.109375, 28.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 11.0, 11.0, 20.0, 29.0, 45.0, 64.0, 95.0, 134.0, 201.0, 316.0, 439.0, 730.0, 1188.0, 1932.0, 3170.0, 5159.0, 8377.0, 13529.0, 21633.0, 34756.0, 52675.0, 75986.0, 103619.0, 127321.0, 137029.0, 127711.0, 105843.0, 78568.0, 53851.0, 35391.0, 22439.0, 13764.0, 8598.0, 5242.0, 3242.0, 1937.0, 1238.0, 755.0, 534.0, 342.0, 196.0, 146.0, 100.0, 72.0, 37.0, 29.0, 18.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9652099609375, -9.649169921875, -9.3331298828125, -9.01708984375, -8.7010498046875, -8.385009765625, -8.0689697265625, -7.7529296875, -7.4368896484375, -7.120849609375, -6.8048095703125, -6.48876953125, -6.1727294921875, -5.856689453125, -5.5406494140625, -5.224609375, -4.9085693359375, -4.592529296875, -4.2764892578125, -3.96044921875, -3.6444091796875, -3.328369140625, -3.0123291015625, -2.6962890625, -2.3802490234375, -2.064208984375, -1.7481689453125, -1.43212890625, -1.1160888671875, -0.800048828125, -0.4840087890625, -0.16796875, 0.1480712890625, 0.464111328125, 0.7801513671875, 1.09619140625, 1.4122314453125, 1.728271484375, 2.0443115234375, 2.3603515625, 2.6763916015625, 2.992431640625, 3.3084716796875, 3.62451171875, 3.9405517578125, 4.256591796875, 4.5726318359375, 4.888671875, 5.2047119140625, 5.520751953125, 5.8367919921875, 6.15283203125, 6.4688720703125, 6.784912109375, 7.1009521484375, 7.4169921875, 7.7330322265625, 8.049072265625, 8.3651123046875, 8.68115234375, 8.9971923828125, 9.313232421875, 9.6292724609375, 9.9453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 3.0, 3.0, 7.0, 7.0, 7.0, 4.0, 5.0, 13.0, 16.0, 17.0, 17.0, 28.0, 19.0, 26.0, 33.0, 28.0, 41.0, 30.0, 49.0, 45.0, 42.0, 47.0, 36.0, 46.0, 50.0, 43.0, 37.0, 41.0, 37.0, 25.0, 18.0, 27.0, 29.0, 21.0, 20.0, 17.0, 10.0, 10.0, 10.0, 9.0, 0.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010251998901367188, -0.0009941458702087402, -0.0009630918502807617, -0.0009320378303527832, -0.0009009838104248047, -0.0008699297904968262, -0.0008388757705688477, -0.0008078217506408691, -0.0007767677307128906, -0.0007457137107849121, -0.0007146596908569336, -0.0006836056709289551, -0.0006525516510009766, -0.000621497631072998, -0.0005904436111450195, -0.000559389591217041, -0.0005283355712890625, -0.000497281551361084, -0.00046622753143310547, -0.00043517351150512695, -0.00040411949157714844, -0.0003730654716491699, -0.0003420114517211914, -0.0003109574317932129, -0.0002799034118652344, -0.00024884939193725586, -0.00021779537200927734, -0.00018674135208129883, -0.0001556873321533203, -0.0001246333122253418, -9.357929229736328e-05, -6.252527236938477e-05, -3.147125244140625e-05, -4.172325134277344e-07, 3.063678741455078e-05, 6.16908073425293e-05, 9.274482727050781e-05, 0.00012379884719848633, 0.00015485286712646484, 0.00018590688705444336, 0.00021696090698242188, 0.0002480149269104004, 0.0002790689468383789, 0.0003101229667663574, 0.00034117698669433594, 0.00037223100662231445, 0.00040328502655029297, 0.0004343390464782715, 0.00046539306640625, 0.0004964470863342285, 0.000527501106262207, 0.0005585551261901855, 0.0005896091461181641, 0.0006206631660461426, 0.0006517171859741211, 0.0006827712059020996, 0.0007138252258300781, 0.0007448792457580566, 0.0007759332656860352, 0.0008069872856140137, 0.0008380413055419922, 0.0008690953254699707, 0.0009001493453979492, 0.0009312033653259277, 0.0009622573852539062]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 11.0, 20.0, 33.0, 42.0, 41.0, 80.0, 133.0, 191.0, 325.0, 557.0, 861.0, 1410.0, 2214.0, 3621.0, 5442.0, 8759.0, 13867.0, 21410.0, 32883.0, 48388.0, 68165.0, 89608.0, 108746.0, 120212.0, 119691.0, 107951.0, 88696.0, 66784.0, 47606.0, 32467.0, 21296.0, 13675.0, 8743.0, 5424.0, 3461.0, 2097.0, 1321.0, 845.0, 532.0, 332.0, 234.0, 118.0, 90.0, 55.0, 43.0, 27.0, 23.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.931640625, -8.65234375, -8.373046875, -8.09375, -7.814453125, -7.53515625, -7.255859375, -6.9765625, -6.697265625, -6.41796875, -6.138671875, -5.859375, -5.580078125, -5.30078125, -5.021484375, -4.7421875, -4.462890625, -4.18359375, -3.904296875, -3.625, -3.345703125, -3.06640625, -2.787109375, -2.5078125, -2.228515625, -1.94921875, -1.669921875, -1.390625, -1.111328125, -0.83203125, -0.552734375, -0.2734375, 0.005859375, 0.28515625, 0.564453125, 0.84375, 1.123046875, 1.40234375, 1.681640625, 1.9609375, 2.240234375, 2.51953125, 2.798828125, 3.078125, 3.357421875, 3.63671875, 3.916015625, 4.1953125, 4.474609375, 4.75390625, 5.033203125, 5.3125, 5.591796875, 5.87109375, 6.150390625, 6.4296875, 6.708984375, 6.98828125, 7.267578125, 7.546875, 7.826171875, 8.10546875, 8.384765625, 8.6640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 2.0, 6.0, 17.0, 11.0, 11.0, 17.0, 22.0, 20.0, 20.0, 28.0, 43.0, 44.0, 45.0, 50.0, 46.0, 41.0, 55.0, 50.0, 58.0, 47.0, 47.0, 47.0, 37.0, 43.0, 31.0, 27.0, 17.0, 15.0, 19.0, 12.0, 16.0, 6.0, 12.0, 5.0, 5.0, 3.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.64056396484375, -4.5115966796875, -4.38262939453125, -4.253662109375, -4.12469482421875, -3.9957275390625, -3.86676025390625, -3.73779296875, -3.60882568359375, -3.4798583984375, -3.35089111328125, -3.221923828125, -3.09295654296875, -2.9639892578125, -2.83502197265625, -2.7060546875, -2.57708740234375, -2.4481201171875, -2.31915283203125, -2.190185546875, -2.06121826171875, -1.9322509765625, -1.80328369140625, -1.67431640625, -1.54534912109375, -1.4163818359375, -1.28741455078125, -1.158447265625, -1.02947998046875, -0.9005126953125, -0.77154541015625, -0.642578125, -0.51361083984375, -0.3846435546875, -0.25567626953125, -0.126708984375, 0.00225830078125, 0.1312255859375, 0.26019287109375, 0.38916015625, 0.51812744140625, 0.6470947265625, 0.77606201171875, 0.905029296875, 1.03399658203125, 1.1629638671875, 1.29193115234375, 1.4208984375, 1.54986572265625, 1.6788330078125, 1.80780029296875, 1.936767578125, 2.06573486328125, 2.1947021484375, 2.32366943359375, 2.45263671875, 2.58160400390625, 2.7105712890625, 2.83953857421875, 2.968505859375, 3.09747314453125, 3.2264404296875, 3.35540771484375, 3.484375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 3.0, 10.0, 7.0, 5.0, 10.0, 8.0, 12.0, 15.0, 17.0, 20.0, 28.0, 22.0, 31.0, 37.0, 37.0, 27.0, 40.0, 49.0, 36.0, 38.0, 43.0, 44.0, 35.0, 35.0, 34.0, 35.0, 44.0, 38.0, 32.0, 35.0, 29.0, 27.0, 14.0, 13.0, 11.0, 20.0, 12.0, 11.0, 9.0, 12.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-47.87879943847656, -46.54505157470703, -45.211299896240234, -43.8775520324707, -42.543800354003906, -41.210052490234375, -39.876304626464844, -38.54255294799805, -37.20880126953125, -35.87505340576172, -34.54130172729492, -33.20755386352539, -31.873802185058594, -30.540054321289062, -29.2063045501709, -27.872554779052734, -26.538806915283203, -25.20505714416504, -23.871307373046875, -22.537559509277344, -21.203807830810547, -19.870059967041016, -18.53631019592285, -17.202560424804688, -15.868810653686523, -14.53506088256836, -13.201311111450195, -11.867562294006348, -10.533812522888184, -9.20006275177002, -7.866313934326172, -6.532564163208008, -5.198810577392578, -3.865061044692993, -2.531311511993408, -1.1975622177124023, 0.13618755340576172, 1.4699373245239258, 2.8036861419677734, 4.1374359130859375, 5.471185684204102, 6.804935455322266, 8.13868522644043, 9.472434043884277, 10.806183815002441, 12.139933586120605, 13.473682403564453, 14.807432174682617, 16.14118194580078, 17.474931716918945, 18.80868148803711, 20.14242935180664, 21.476181030273438, 22.80992889404297, 24.143678665161133, 25.477428436279297, 26.81117820739746, 28.144927978515625, 29.47867774963379, 30.812427520751953, 32.146175384521484, 33.47992706298828, 34.81367492675781, 36.147422790527344, 37.48117446899414]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 9.0, 11.0, 16.0, 14.0, 22.0, 33.0, 22.0, 34.0, 39.0, 46.0, 40.0, 30.0, 58.0, 34.0, 47.0, 37.0, 42.0, 45.0, 50.0, 50.0, 25.0, 27.0, 28.0, 41.0, 21.0, 25.0, 26.0, 19.0, 16.0, 16.0, 9.0, 15.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.19195556640625, -52.56753921508789, -50.94312286376953, -49.318702697753906, -47.69428634643555, -46.06986999511719, -44.44545364379883, -42.82103729248047, -41.196617126464844, -39.572200775146484, -37.947784423828125, -36.3233642578125, -34.69894790649414, -33.07453155517578, -31.450115203857422, -29.825698852539062, -28.201282501220703, -26.576866149902344, -24.95244789123535, -23.328031539916992, -21.70361328125, -20.07919692993164, -18.45478057861328, -16.830364227294922, -15.20594596862793, -13.581528663635254, -11.957111358642578, -10.332695007324219, -8.708277702331543, -7.083860397338867, -5.459444046020508, -3.835026741027832, -2.2106056213378906, -0.586188554763794, 1.0382285118103027, 2.6626453399658203, 4.287062644958496, 5.911479949951172, 7.535896301269531, 9.160313606262207, 10.784730911254883, 12.409148216247559, 14.033565521240234, 15.657981872558594, 17.282398223876953, 18.906816482543945, 20.531232833862305, 22.155651092529297, 23.780067443847656, 25.404483795166016, 27.028902053833008, 28.653318405151367, 30.27773666381836, 31.90215301513672, 33.52656936645508, 35.15098571777344, 36.77540588378906, 38.39982223510742, 40.02423858642578, 41.648658752441406, 43.273075103759766, 44.897491455078125, 46.521907806396484, 48.146324157714844, 49.7707405090332]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 7.0, 8.0, 14.0, 17.0, 39.0, 57.0, 101.0, 169.0, 229.0, 402.0, 598.0, 1103.0, 1682.0, 2748.0, 4497.0, 7686.0, 12982.0, 21269.0, 35578.0, 59487.0, 96597.0, 155917.0, 240455.0, 347017.0, 458528.0, 539414.0, 554723.0, 496018.0, 390989.0, 278977.0, 185856.0, 117529.0, 72423.0, 44286.0, 26204.0, 16047.0, 9720.0, 5873.0, 3558.0, 2126.0, 1288.0, 790.0, 478.0, 305.0, 205.0, 109.0, 70.0, 52.0, 28.0, 10.0, 13.0, 7.0, 4.0, 1.0, 1.0], "bins": [-33.75, -32.791015625, -31.83203125, -30.873046875, -29.9140625, -28.955078125, -27.99609375, -27.037109375, -26.078125, -25.119140625, -24.16015625, -23.201171875, -22.2421875, -21.283203125, -20.32421875, -19.365234375, -18.40625, -17.447265625, -16.48828125, -15.529296875, -14.5703125, -13.611328125, -12.65234375, -11.693359375, -10.734375, -9.775390625, -8.81640625, -7.857421875, -6.8984375, -5.939453125, -4.98046875, -4.021484375, -3.0625, -2.103515625, -1.14453125, -0.185546875, 0.7734375, 1.732421875, 2.69140625, 3.650390625, 4.609375, 5.568359375, 6.52734375, 7.486328125, 8.4453125, 9.404296875, 10.36328125, 11.322265625, 12.28125, 13.240234375, 14.19921875, 15.158203125, 16.1171875, 17.076171875, 18.03515625, 18.994140625, 19.953125, 20.912109375, 21.87109375, 22.830078125, 23.7890625, 24.748046875, 25.70703125, 26.666015625, 27.625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 1.0, 4.0, 7.0, 6.0, 6.0, 13.0, 19.0, 9.0, 16.0, 18.0, 23.0, 30.0, 30.0, 39.0, 43.0, 36.0, 40.0, 38.0, 44.0, 48.0, 46.0, 44.0, 44.0, 36.0, 41.0, 38.0, 37.0, 34.0, 23.0, 26.0, 26.0, 23.0, 21.0, 16.0, 17.0, 16.0, 10.0, 7.0, 10.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.0, -42.7587890625, -41.517578125, -40.2763671875, -39.03515625, -37.7939453125, -36.552734375, -35.3115234375, -34.0703125, -32.8291015625, -31.587890625, -30.3466796875, -29.10546875, -27.8642578125, -26.623046875, -25.3818359375, -24.140625, -22.8994140625, -21.658203125, -20.4169921875, -19.17578125, -17.9345703125, -16.693359375, -15.4521484375, -14.2109375, -12.9697265625, -11.728515625, -10.4873046875, -9.24609375, -8.0048828125, -6.763671875, -5.5224609375, -4.28125, -3.0400390625, -1.798828125, -0.5576171875, 0.68359375, 1.9248046875, 3.166015625, 4.4072265625, 5.6484375, 6.8896484375, 8.130859375, 9.3720703125, 10.61328125, 11.8544921875, 13.095703125, 14.3369140625, 15.578125, 16.8193359375, 18.060546875, 19.3017578125, 20.54296875, 21.7841796875, 23.025390625, 24.2666015625, 25.5078125, 26.7490234375, 27.990234375, 29.2314453125, 30.47265625, 31.7138671875, 32.955078125, 34.1962890625, 35.4375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 13.0, 26.0, 52.0, 96.0, 139.0, 235.0, 399.0, 762.0, 1288.0, 2262.0, 3904.0, 6722.0, 11611.0, 19397.0, 32404.0, 53155.0, 85197.0, 131649.0, 195110.0, 275613.0, 367865.0, 448747.0, 496965.0, 494290.0, 438781.0, 353971.0, 262259.0, 184655.0, 123432.0, 79431.0, 49748.0, 30307.0, 18219.0, 10709.0, 6289.0, 3656.0, 2153.0, 1204.0, 670.0, 375.0, 232.0, 129.0, 68.0, 44.0, 27.0, 9.0, 7.0, 6.0, 1.0, 0.0, 1.0, 3.0], "bins": [-33.84375, -32.874755859375, -31.90576171875, -30.936767578125, -29.9677734375, -28.998779296875, -28.02978515625, -27.060791015625, -26.091796875, -25.122802734375, -24.15380859375, -23.184814453125, -22.2158203125, -21.246826171875, -20.27783203125, -19.308837890625, -18.33984375, -17.370849609375, -16.40185546875, -15.432861328125, -14.4638671875, -13.494873046875, -12.52587890625, -11.556884765625, -10.587890625, -9.618896484375, -8.64990234375, -7.680908203125, -6.7119140625, -5.742919921875, -4.77392578125, -3.804931640625, -2.8359375, -1.866943359375, -0.89794921875, 0.071044921875, 1.0400390625, 2.009033203125, 2.97802734375, 3.947021484375, 4.916015625, 5.885009765625, 6.85400390625, 7.822998046875, 8.7919921875, 9.760986328125, 10.72998046875, 11.698974609375, 12.66796875, 13.636962890625, 14.60595703125, 15.574951171875, 16.5439453125, 17.512939453125, 18.48193359375, 19.450927734375, 20.419921875, 21.388916015625, 22.35791015625, 23.326904296875, 24.2958984375, 25.264892578125, 26.23388671875, 27.202880859375, 28.171875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 9.0, 13.0, 28.0, 30.0, 40.0, 35.0, 64.0, 68.0, 97.0, 104.0, 128.0, 161.0, 170.0, 205.0, 208.0, 238.0, 225.0, 219.0, 237.0, 225.0, 223.0, 217.0, 165.0, 156.0, 152.0, 127.0, 96.0, 90.0, 62.0, 61.0, 51.0, 39.0, 25.0, 31.0, 9.0, 13.0, 11.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5234375, -14.9927978515625, -14.462158203125, -13.9315185546875, -13.40087890625, -12.8702392578125, -12.339599609375, -11.8089599609375, -11.2783203125, -10.7476806640625, -10.217041015625, -9.6864013671875, -9.15576171875, -8.6251220703125, -8.094482421875, -7.5638427734375, -7.033203125, -6.5025634765625, -5.971923828125, -5.4412841796875, -4.91064453125, -4.3800048828125, -3.849365234375, -3.3187255859375, -2.7880859375, -2.2574462890625, -1.726806640625, -1.1961669921875, -0.66552734375, -0.1348876953125, 0.395751953125, 0.9263916015625, 1.45703125, 1.9876708984375, 2.518310546875, 3.0489501953125, 3.57958984375, 4.1102294921875, 4.640869140625, 5.1715087890625, 5.7021484375, 6.2327880859375, 6.763427734375, 7.2940673828125, 7.82470703125, 8.3553466796875, 8.885986328125, 9.4166259765625, 9.947265625, 10.4779052734375, 11.008544921875, 11.5391845703125, 12.06982421875, 12.6004638671875, 13.131103515625, 13.6617431640625, 14.1923828125, 14.7230224609375, 15.253662109375, 15.7843017578125, 16.31494140625, 16.8455810546875, 17.376220703125, 17.9068603515625, 18.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 8.0, 14.0, 10.0, 19.0, 13.0, 16.0, 18.0, 19.0, 42.0, 25.0, 33.0, 42.0, 29.0, 43.0, 29.0, 36.0, 47.0, 39.0, 48.0, 43.0, 36.0, 41.0, 35.0, 40.0, 32.0, 32.0, 28.0, 31.0, 32.0, 19.0, 20.0, 13.0, 12.0, 9.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.386783599853516, -36.2636833190918, -35.14058303833008, -34.01748275756836, -32.894386291503906, -31.771284103393555, -30.64818572998047, -29.52508544921875, -28.40198516845703, -27.278884887695312, -26.155784606933594, -25.032686233520508, -23.90958595275879, -22.78648567199707, -21.663387298583984, -20.540287017822266, -19.417186737060547, -18.294086456298828, -17.17098617553711, -16.047887802124023, -14.924787521362305, -13.801687240600586, -12.678587913513184, -11.555488586425781, -10.432388305664062, -9.309288024902344, -8.186188697814941, -7.063088893890381, -5.93998908996582, -4.81688928604126, -3.693789482116699, -2.5706896781921387, -1.4475860595703125, -0.32448625564575195, 0.7986135482788086, 1.9217133522033691, 3.0448131561279297, 4.16791296005249, 5.291012763977051, 6.414112567901611, 7.537212371826172, 8.66031265258789, 9.783411979675293, 10.906511306762695, 12.029611587524414, 13.152711868286133, 14.275811195373535, 15.398910522460938, 16.522010803222656, 17.645111083984375, 18.768211364746094, 19.89130973815918, 21.0144100189209, 22.137510299682617, 23.260608673095703, 24.383708953857422, 25.50680923461914, 26.62990951538086, 27.753009796142578, 28.876108169555664, 29.999208450317383, 31.1223087310791, 32.24540710449219, 33.368507385253906, 34.491607666015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 8.0, 10.0, 7.0, 6.0, 7.0, 16.0, 15.0, 17.0, 16.0, 29.0, 34.0, 37.0, 19.0, 38.0, 37.0, 51.0, 50.0, 47.0, 39.0, 36.0, 38.0, 49.0, 43.0, 32.0, 38.0, 42.0, 31.0, 22.0, 28.0, 23.0, 16.0, 19.0, 18.0, 19.0, 15.0, 8.0, 14.0, 5.0, 5.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.15751647949219, -39.85011672973633, -38.542720794677734, -37.235321044921875, -35.927921295166016, -34.62052536010742, -33.31312561035156, -32.00572967529297, -30.69832992553711, -29.390932083129883, -28.083532333374023, -26.776134490966797, -25.46873664855957, -24.161338806152344, -22.853939056396484, -21.546541213989258, -20.2391414642334, -18.931743621826172, -17.624343872070312, -16.316946029663086, -15.00954818725586, -13.702149391174316, -12.394750595092773, -11.087352752685547, -9.779953956604004, -8.472555160522461, -7.165157318115234, -5.857758522033691, -4.550360202789307, -3.242961883544922, -1.935563087463379, -0.6281652450561523, 0.6792335510253906, 1.986631989479065, 3.2940304279327393, 4.601428985595703, 5.908827304840088, 7.216225624084473, 8.523624420166016, 9.831022262573242, 11.138421058654785, 12.445819854736328, 13.753217697143555, 15.060616493225098, 16.36801528930664, 17.675413131713867, 18.982810974121094, 20.290210723876953, 21.59760856628418, 22.905006408691406, 24.212406158447266, 25.519804000854492, 26.82720184326172, 28.134601593017578, 29.441999435424805, 30.74939727783203, 32.05679702758789, 33.36419677734375, 34.671592712402344, 35.9789924621582, 37.28639221191406, 38.593788146972656, 39.901187896728516, 41.208587646484375, 42.51598358154297]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 3.0, 8.0, 10.0, 9.0, 11.0, 23.0, 29.0, 62.0, 59.0, 87.0, 132.0, 212.0, 305.0, 562.0, 946.0, 1668.0, 2838.0, 5218.0, 9304.0, 17001.0, 31814.0, 56990.0, 96841.0, 153104.0, 197340.0, 179735.0, 124176.0, 75210.0, 42722.0, 23275.0, 12706.0, 7042.0, 3773.0, 2156.0, 1264.0, 712.0, 428.0, 242.0, 176.0, 105.0, 85.0, 45.0, 31.0, 28.0, 17.0, 9.0, 6.0, 4.0, 9.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.015625, -18.416748046875, -17.81787109375, -17.218994140625, -16.6201171875, -16.021240234375, -15.42236328125, -14.823486328125, -14.224609375, -13.625732421875, -13.02685546875, -12.427978515625, -11.8291015625, -11.230224609375, -10.63134765625, -10.032470703125, -9.43359375, -8.834716796875, -8.23583984375, -7.636962890625, -7.0380859375, -6.439208984375, -5.84033203125, -5.241455078125, -4.642578125, -4.043701171875, -3.44482421875, -2.845947265625, -2.2470703125, -1.648193359375, -1.04931640625, -0.450439453125, 0.1484375, 0.747314453125, 1.34619140625, 1.945068359375, 2.5439453125, 3.142822265625, 3.74169921875, 4.340576171875, 4.939453125, 5.538330078125, 6.13720703125, 6.736083984375, 7.3349609375, 7.933837890625, 8.53271484375, 9.131591796875, 9.73046875, 10.329345703125, 10.92822265625, 11.527099609375, 12.1259765625, 12.724853515625, 13.32373046875, 13.922607421875, 14.521484375, 15.120361328125, 15.71923828125, 16.318115234375, 16.9169921875, 17.515869140625, 18.11474609375, 18.713623046875, 19.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 4.0, 6.0, 11.0, 14.0, 13.0, 20.0, 13.0, 16.0, 18.0, 15.0, 33.0, 36.0, 30.0, 38.0, 43.0, 37.0, 40.0, 40.0, 38.0, 41.0, 35.0, 34.0, 43.0, 45.0, 27.0, 35.0, 40.0, 33.0, 37.0, 15.0, 18.0, 16.0, 13.0, 18.0, 9.0, 14.0, 10.0, 6.0, 10.0, 5.0, 3.0, 4.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-39.4375, -38.22412109375, -37.0107421875, -35.79736328125, -34.583984375, -33.37060546875, -32.1572265625, -30.94384765625, -29.73046875, -28.51708984375, -27.3037109375, -26.09033203125, -24.876953125, -23.66357421875, -22.4501953125, -21.23681640625, -20.0234375, -18.81005859375, -17.5966796875, -16.38330078125, -15.169921875, -13.95654296875, -12.7431640625, -11.52978515625, -10.31640625, -9.10302734375, -7.8896484375, -6.67626953125, -5.462890625, -4.24951171875, -3.0361328125, -1.82275390625, -0.609375, 0.60400390625, 1.8173828125, 3.03076171875, 4.244140625, 5.45751953125, 6.6708984375, 7.88427734375, 9.09765625, 10.31103515625, 11.5244140625, 12.73779296875, 13.951171875, 15.16455078125, 16.3779296875, 17.59130859375, 18.8046875, 20.01806640625, 21.2314453125, 22.44482421875, 23.658203125, 24.87158203125, 26.0849609375, 27.29833984375, 28.51171875, 29.72509765625, 30.9384765625, 32.15185546875, 33.365234375, 34.57861328125, 35.7919921875, 37.00537109375, 38.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 13.0, 10.0, 21.0, 33.0, 64.0, 93.0, 166.0, 307.0, 545.0, 1077.0, 2163.0, 4582.0, 9939.0, 23224.0, 57138.0, 137570.0, 264522.0, 278877.0, 155263.0, 65015.0, 26526.0, 11325.0, 5144.0, 2325.0, 1174.0, 657.0, 328.0, 196.0, 93.0, 70.0, 29.0, 23.0, 12.0, 8.0, 7.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4453125, -14.8951416015625, -14.344970703125, -13.7947998046875, -13.24462890625, -12.6944580078125, -12.144287109375, -11.5941162109375, -11.0439453125, -10.4937744140625, -9.943603515625, -9.3934326171875, -8.84326171875, -8.2930908203125, -7.742919921875, -7.1927490234375, -6.642578125, -6.0924072265625, -5.542236328125, -4.9920654296875, -4.44189453125, -3.8917236328125, -3.341552734375, -2.7913818359375, -2.2412109375, -1.6910400390625, -1.140869140625, -0.5906982421875, -0.04052734375, 0.5096435546875, 1.059814453125, 1.6099853515625, 2.16015625, 2.7103271484375, 3.260498046875, 3.8106689453125, 4.36083984375, 4.9110107421875, 5.461181640625, 6.0113525390625, 6.5615234375, 7.1116943359375, 7.661865234375, 8.2120361328125, 8.76220703125, 9.3123779296875, 9.862548828125, 10.4127197265625, 10.962890625, 11.5130615234375, 12.063232421875, 12.6134033203125, 13.16357421875, 13.7137451171875, 14.263916015625, 14.8140869140625, 15.3642578125, 15.9144287109375, 16.464599609375, 17.0147705078125, 17.56494140625, 18.1151123046875, 18.665283203125, 19.2154541015625, 19.765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 10.0, 9.0, 10.0, 9.0, 8.0, 19.0, 18.0, 26.0, 29.0, 31.0, 36.0, 36.0, 41.0, 32.0, 44.0, 37.0, 44.0, 43.0, 38.0, 44.0, 43.0, 42.0, 36.0, 42.0, 35.0, 29.0, 29.0, 21.0, 28.0, 24.0, 26.0, 17.0, 7.0, 11.0, 10.0, 10.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.875, -24.021484375, -23.16796875, -22.314453125, -21.4609375, -20.607421875, -19.75390625, -18.900390625, -18.046875, -17.193359375, -16.33984375, -15.486328125, -14.6328125, -13.779296875, -12.92578125, -12.072265625, -11.21875, -10.365234375, -9.51171875, -8.658203125, -7.8046875, -6.951171875, -6.09765625, -5.244140625, -4.390625, -3.537109375, -2.68359375, -1.830078125, -0.9765625, -0.123046875, 0.73046875, 1.583984375, 2.4375, 3.291015625, 4.14453125, 4.998046875, 5.8515625, 6.705078125, 7.55859375, 8.412109375, 9.265625, 10.119140625, 10.97265625, 11.826171875, 12.6796875, 13.533203125, 14.38671875, 15.240234375, 16.09375, 16.947265625, 17.80078125, 18.654296875, 19.5078125, 20.361328125, 21.21484375, 22.068359375, 22.921875, 23.775390625, 24.62890625, 25.482421875, 26.3359375, 27.189453125, 28.04296875, 28.896484375, 29.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 8.0, 7.0, 14.0, 28.0, 26.0, 28.0, 46.0, 69.0, 94.0, 133.0, 247.0, 361.0, 587.0, 1100.0, 2035.0, 4420.0, 11043.0, 34100.0, 153909.0, 559333.0, 213513.0, 43556.0, 13273.0, 5196.0, 2350.0, 1209.0, 698.0, 397.0, 237.0, 172.0, 94.0, 79.0, 50.0, 40.0, 29.0, 21.0, 10.0, 8.0, 9.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.28125, -9.9658203125, -9.650390625, -9.3349609375, -9.01953125, -8.7041015625, -8.388671875, -8.0732421875, -7.7578125, -7.4423828125, -7.126953125, -6.8115234375, -6.49609375, -6.1806640625, -5.865234375, -5.5498046875, -5.234375, -4.9189453125, -4.603515625, -4.2880859375, -3.97265625, -3.6572265625, -3.341796875, -3.0263671875, -2.7109375, -2.3955078125, -2.080078125, -1.7646484375, -1.44921875, -1.1337890625, -0.818359375, -0.5029296875, -0.1875, 0.1279296875, 0.443359375, 0.7587890625, 1.07421875, 1.3896484375, 1.705078125, 2.0205078125, 2.3359375, 2.6513671875, 2.966796875, 3.2822265625, 3.59765625, 3.9130859375, 4.228515625, 4.5439453125, 4.859375, 5.1748046875, 5.490234375, 5.8056640625, 6.12109375, 6.4365234375, 6.751953125, 7.0673828125, 7.3828125, 7.6982421875, 8.013671875, 8.3291015625, 8.64453125, 8.9599609375, 9.275390625, 9.5908203125, 9.90625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 3.0, 2.0, 8.0, 5.0, 12.0, 8.0, 9.0, 15.0, 18.0, 24.0, 29.0, 52.0, 66.0, 90.0, 114.0, 113.0, 122.0, 76.0, 60.0, 43.0, 29.0, 13.0, 18.0, 21.0, 14.0, 7.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0013628005981445312, -0.0013146549463272095, -0.0012665092945098877, -0.001218363642692566, -0.0011702179908752441, -0.0011220723390579224, -0.0010739266872406006, -0.0010257810354232788, -0.000977635383605957, -0.0009294897317886353, -0.0008813440799713135, -0.0008331984281539917, -0.0007850527763366699, -0.0007369071245193481, -0.0006887614727020264, -0.0006406158208847046, -0.0005924701690673828, -0.000544324517250061, -0.0004961788654327393, -0.0004480332136154175, -0.0003998875617980957, -0.0003517419099807739, -0.00030359625816345215, -0.00025545060634613037, -0.0002073049545288086, -0.00015915930271148682, -0.00011101365089416504, -6.286799907684326e-05, -1.4722347259521484e-05, 3.342330455780029e-05, 8.156895637512207e-05, 0.00012971460819244385, 0.00017786026000976562, 0.0002260059118270874, 0.0002741515636444092, 0.00032229721546173096, 0.00037044286727905273, 0.0004185885190963745, 0.0004667341709136963, 0.0005148798227310181, 0.0005630254745483398, 0.0006111711263656616, 0.0006593167781829834, 0.0007074624300003052, 0.000755608081817627, 0.0008037537336349487, 0.0008518993854522705, 0.0009000450372695923, 0.0009481906890869141, 0.0009963363409042358, 0.0010444819927215576, 0.0010926276445388794, 0.0011407732963562012, 0.001188918948173523, 0.0012370645999908447, 0.0012852102518081665, 0.0013333559036254883, 0.00138150155544281, 0.0014296472072601318, 0.0014777928590774536, 0.0015259385108947754, 0.0015740841627120972, 0.001622229814529419, 0.0016703754663467407, 0.0017185211181640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 8.0, 13.0, 17.0, 19.0, 26.0, 39.0, 70.0, 102.0, 138.0, 188.0, 286.0, 413.0, 634.0, 975.0, 1682.0, 2716.0, 4651.0, 8953.0, 16492.0, 33447.0, 66438.0, 130745.0, 224042.0, 243332.0, 150942.0, 78599.0, 39813.0, 19797.0, 10255.0, 5581.0, 3065.0, 1820.0, 1155.0, 697.0, 459.0, 302.0, 184.0, 133.0, 104.0, 59.0, 46.0, 42.0, 25.0, 19.0, 10.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.234375, -7.97802734375, -7.7216796875, -7.46533203125, -7.208984375, -6.95263671875, -6.6962890625, -6.43994140625, -6.18359375, -5.92724609375, -5.6708984375, -5.41455078125, -5.158203125, -4.90185546875, -4.6455078125, -4.38916015625, -4.1328125, -3.87646484375, -3.6201171875, -3.36376953125, -3.107421875, -2.85107421875, -2.5947265625, -2.33837890625, -2.08203125, -1.82568359375, -1.5693359375, -1.31298828125, -1.056640625, -0.80029296875, -0.5439453125, -0.28759765625, -0.03125, 0.22509765625, 0.4814453125, 0.73779296875, 0.994140625, 1.25048828125, 1.5068359375, 1.76318359375, 2.01953125, 2.27587890625, 2.5322265625, 2.78857421875, 3.044921875, 3.30126953125, 3.5576171875, 3.81396484375, 4.0703125, 4.32666015625, 4.5830078125, 4.83935546875, 5.095703125, 5.35205078125, 5.6083984375, 5.86474609375, 6.12109375, 6.37744140625, 6.6337890625, 6.89013671875, 7.146484375, 7.40283203125, 7.6591796875, 7.91552734375, 8.171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 0.0, 6.0, 10.0, 10.0, 10.0, 17.0, 44.0, 49.0, 86.0, 80.0, 95.0, 89.0, 113.0, 97.0, 75.0, 62.0, 60.0, 33.0, 16.0, 15.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.4375, -4.306884765625, -4.17626953125, -4.045654296875, -3.9150390625, -3.784423828125, -3.65380859375, -3.523193359375, -3.392578125, -3.261962890625, -3.13134765625, -3.000732421875, -2.8701171875, -2.739501953125, -2.60888671875, -2.478271484375, -2.34765625, -2.217041015625, -2.08642578125, -1.955810546875, -1.8251953125, -1.694580078125, -1.56396484375, -1.433349609375, -1.302734375, -1.172119140625, -1.04150390625, -0.910888671875, -0.7802734375, -0.649658203125, -0.51904296875, -0.388427734375, -0.2578125, -0.127197265625, 0.00341796875, 0.134033203125, 0.2646484375, 0.395263671875, 0.52587890625, 0.656494140625, 0.787109375, 0.917724609375, 1.04833984375, 1.178955078125, 1.3095703125, 1.440185546875, 1.57080078125, 1.701416015625, 1.83203125, 1.962646484375, 2.09326171875, 2.223876953125, 2.3544921875, 2.485107421875, 2.61572265625, 2.746337890625, 2.876953125, 3.007568359375, 3.13818359375, 3.268798828125, 3.3994140625, 3.530029296875, 3.66064453125, 3.791259765625, 3.921875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 5.0, 4.0, 14.0, 13.0, 13.0, 20.0, 20.0, 20.0, 23.0, 26.0, 20.0, 39.0, 40.0, 35.0, 29.0, 36.0, 50.0, 40.0, 40.0, 40.0, 50.0, 39.0, 37.0, 47.0, 34.0, 45.0, 26.0, 31.0, 20.0, 27.0, 27.0, 21.0, 17.0, 11.0, 3.0, 8.0, 2.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.30130386352539, -37.19415283203125, -36.087005615234375, -34.979854583740234, -33.872703552246094, -32.76555633544922, -31.658405303955078, -30.551254272460938, -29.44410514831543, -28.336956024169922, -27.22980499267578, -26.122655868530273, -25.015506744384766, -23.908355712890625, -22.801206588745117, -21.69405746459961, -20.58690643310547, -19.47975730895996, -18.37260627746582, -17.265457153320312, -16.158306121826172, -15.051156997680664, -13.944007873535156, -12.836857795715332, -11.729707717895508, -10.622557640075684, -9.51540756225586, -8.408258438110352, -7.301108360290527, -6.193958282470703, -5.086808681488037, -3.979659080505371, -2.8725128173828125, -1.7653629779815674, -0.6582131385803223, 0.44893670082092285, 1.556086540222168, 2.663236618041992, 3.770386219024658, 4.877535820007324, 5.984685897827148, 7.091835975646973, 8.198986053466797, 9.306135177612305, 10.413285255432129, 11.520435333251953, 12.627584457397461, 13.734734535217285, 14.84188461303711, 15.949034690856934, 17.056184768676758, 18.163333892822266, 19.270484924316406, 20.377634048461914, 21.484783172607422, 22.591934204101562, 23.69908332824707, 24.806232452392578, 25.91338348388672, 27.020532608032227, 28.127681732177734, 29.234832763671875, 30.341981887817383, 31.44913101196289, 32.55628204345703]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 11.0, 9.0, 6.0, 8.0, 11.0, 9.0, 20.0, 20.0, 17.0, 35.0, 36.0, 31.0, 27.0, 39.0, 46.0, 43.0, 49.0, 40.0, 40.0, 41.0, 35.0, 56.0, 34.0, 36.0, 39.0, 42.0, 28.0, 24.0, 25.0, 18.0, 17.0, 18.0, 18.0, 10.0, 16.0, 11.0, 9.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.1461181640625, -37.879295349121094, -36.61247253417969, -35.34564971923828, -34.078826904296875, -32.81200408935547, -31.54517936706543, -30.278356552124023, -29.011533737182617, -27.74471092224121, -26.477888107299805, -25.2110652923584, -23.94424057006836, -22.677417755126953, -21.410594940185547, -20.14377212524414, -18.876949310302734, -17.610126495361328, -16.343303680419922, -15.0764799118042, -13.809657096862793, -12.542834281921387, -11.276010513305664, -10.009187698364258, -8.742364883422852, -7.475542068481445, -6.208718776702881, -4.941895484924316, -3.67507266998291, -2.408249855041504, -1.1414265632629395, 0.125396728515625, 1.3922233581542969, 2.6590464115142822, 3.9258694648742676, 5.192692756652832, 6.459515571594238, 7.7263383865356445, 8.993162155151367, 10.259984970092773, 11.52680778503418, 12.793630599975586, 14.060453414916992, 15.327277183532715, 16.594100952148438, 17.860923767089844, 19.12774658203125, 20.394569396972656, 21.661392211914062, 22.92821502685547, 24.195037841796875, 25.46186065673828, 26.728683471679688, 27.995506286621094, 29.262331008911133, 30.52915382385254, 31.795976638793945, 33.062801361083984, 34.32962417602539, 35.5964469909668, 36.8632698059082, 38.13009262084961, 39.396915435791016, 40.66373825073242, 41.93056106567383]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 9.0, 6.0, 13.0, 18.0, 22.0, 47.0, 54.0, 95.0, 144.0, 226.0, 364.0, 579.0, 879.0, 1405.0, 2059.0, 3379.0, 5286.0, 8133.0, 12288.0, 18434.0, 26647.0, 37764.0, 51348.0, 66999.0, 81942.0, 94460.0, 102553.0, 103182.0, 96896.0, 84710.0, 69371.0, 54100.0, 39421.0, 28393.0, 19904.0, 13329.0, 8571.0, 5548.0, 3560.0, 2366.0, 1445.0, 925.0, 627.0, 392.0, 262.0, 147.0, 94.0, 60.0, 41.0, 27.0, 8.0, 9.0, 10.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.71875, -24.891357421875, -24.06396484375, -23.236572265625, -22.4091796875, -21.581787109375, -20.75439453125, -19.927001953125, -19.099609375, -18.272216796875, -17.44482421875, -16.617431640625, -15.7900390625, -14.962646484375, -14.13525390625, -13.307861328125, -12.48046875, -11.653076171875, -10.82568359375, -9.998291015625, -9.1708984375, -8.343505859375, -7.51611328125, -6.688720703125, -5.861328125, -5.033935546875, -4.20654296875, -3.379150390625, -2.5517578125, -1.724365234375, -0.89697265625, -0.069580078125, 0.7578125, 1.585205078125, 2.41259765625, 3.239990234375, 4.0673828125, 4.894775390625, 5.72216796875, 6.549560546875, 7.376953125, 8.204345703125, 9.03173828125, 9.859130859375, 10.6865234375, 11.513916015625, 12.34130859375, 13.168701171875, 13.99609375, 14.823486328125, 15.65087890625, 16.478271484375, 17.3056640625, 18.133056640625, 18.96044921875, 19.787841796875, 20.615234375, 21.442626953125, 22.27001953125, 23.097412109375, 23.9248046875, 24.752197265625, 25.57958984375, 26.406982421875, 27.234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 8.0, 8.0, 8.0, 8.0, 17.0, 20.0, 22.0, 29.0, 28.0, 37.0, 34.0, 31.0, 44.0, 32.0, 47.0, 45.0, 43.0, 46.0, 43.0, 44.0, 40.0, 41.0, 35.0, 36.0, 35.0, 19.0, 27.0, 29.0, 15.0, 18.0, 14.0, 9.0, 15.0, 13.0, 14.0, 7.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-43.8125, -42.57568359375, -41.3388671875, -40.10205078125, -38.865234375, -37.62841796875, -36.3916015625, -35.15478515625, -33.91796875, -32.68115234375, -31.4443359375, -30.20751953125, -28.970703125, -27.73388671875, -26.4970703125, -25.26025390625, -24.0234375, -22.78662109375, -21.5498046875, -20.31298828125, -19.076171875, -17.83935546875, -16.6025390625, -15.36572265625, -14.12890625, -12.89208984375, -11.6552734375, -10.41845703125, -9.181640625, -7.94482421875, -6.7080078125, -5.47119140625, -4.234375, -2.99755859375, -1.7607421875, -0.52392578125, 0.712890625, 1.94970703125, 3.1865234375, 4.42333984375, 5.66015625, 6.89697265625, 8.1337890625, 9.37060546875, 10.607421875, 11.84423828125, 13.0810546875, 14.31787109375, 15.5546875, 16.79150390625, 18.0283203125, 19.26513671875, 20.501953125, 21.73876953125, 22.9755859375, 24.21240234375, 25.44921875, 26.68603515625, 27.9228515625, 29.15966796875, 30.396484375, 31.63330078125, 32.8701171875, 34.10693359375, 35.34375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 10.0, 11.0, 20.0, 43.0, 63.0, 114.0, 155.0, 237.0, 423.0, 618.0, 1004.0, 1545.0, 2493.0, 3523.0, 5378.0, 8032.0, 11724.0, 17222.0, 24157.0, 33071.0, 44742.0, 58048.0, 71131.0, 83445.0, 92778.0, 96393.0, 94841.0, 87866.0, 75858.0, 62235.0, 48423.0, 36772.0, 26661.0, 18985.0, 13436.0, 9042.0, 6269.0, 4186.0, 2704.0, 1747.0, 1203.0, 732.0, 465.0, 256.0, 166.0, 121.0, 90.0, 47.0, 31.0, 16.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.09375, -26.238037109375, -25.38232421875, -24.526611328125, -23.6708984375, -22.815185546875, -21.95947265625, -21.103759765625, -20.248046875, -19.392333984375, -18.53662109375, -17.680908203125, -16.8251953125, -15.969482421875, -15.11376953125, -14.258056640625, -13.40234375, -12.546630859375, -11.69091796875, -10.835205078125, -9.9794921875, -9.123779296875, -8.26806640625, -7.412353515625, -6.556640625, -5.700927734375, -4.84521484375, -3.989501953125, -3.1337890625, -2.278076171875, -1.42236328125, -0.566650390625, 0.2890625, 1.144775390625, 2.00048828125, 2.856201171875, 3.7119140625, 4.567626953125, 5.42333984375, 6.279052734375, 7.134765625, 7.990478515625, 8.84619140625, 9.701904296875, 10.5576171875, 11.413330078125, 12.26904296875, 13.124755859375, 13.98046875, 14.836181640625, 15.69189453125, 16.547607421875, 17.4033203125, 18.259033203125, 19.11474609375, 19.970458984375, 20.826171875, 21.681884765625, 22.53759765625, 23.393310546875, 24.2490234375, 25.104736328125, 25.96044921875, 26.816162109375, 27.671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 1.0, 4.0, 7.0, 8.0, 11.0, 17.0, 13.0, 23.0, 15.0, 23.0, 15.0, 25.0, 19.0, 24.0, 30.0, 29.0, 37.0, 30.0, 44.0, 33.0, 42.0, 37.0, 46.0, 33.0, 40.0, 37.0, 35.0, 30.0, 29.0, 22.0, 34.0, 31.0, 30.0, 25.0, 15.0, 22.0, 12.0, 10.0, 17.0, 6.0, 7.0, 6.0, 9.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.03125, -21.310546875, -20.58984375, -19.869140625, -19.1484375, -18.427734375, -17.70703125, -16.986328125, -16.265625, -15.544921875, -14.82421875, -14.103515625, -13.3828125, -12.662109375, -11.94140625, -11.220703125, -10.5, -9.779296875, -9.05859375, -8.337890625, -7.6171875, -6.896484375, -6.17578125, -5.455078125, -4.734375, -4.013671875, -3.29296875, -2.572265625, -1.8515625, -1.130859375, -0.41015625, 0.310546875, 1.03125, 1.751953125, 2.47265625, 3.193359375, 3.9140625, 4.634765625, 5.35546875, 6.076171875, 6.796875, 7.517578125, 8.23828125, 8.958984375, 9.6796875, 10.400390625, 11.12109375, 11.841796875, 12.5625, 13.283203125, 14.00390625, 14.724609375, 15.4453125, 16.166015625, 16.88671875, 17.607421875, 18.328125, 19.048828125, 19.76953125, 20.490234375, 21.2109375, 21.931640625, 22.65234375, 23.373046875, 24.09375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 9.0, 13.0, 11.0, 22.0, 26.0, 47.0, 45.0, 78.0, 94.0, 133.0, 185.0, 246.0, 370.0, 543.0, 857.0, 1333.0, 2308.0, 4093.0, 7684.0, 14622.0, 28705.0, 55453.0, 99709.0, 155026.0, 193389.0, 182282.0, 132568.0, 78631.0, 42670.0, 21706.0, 11450.0, 5930.0, 3206.0, 1743.0, 1134.0, 658.0, 479.0, 298.0, 222.0, 144.0, 107.0, 87.0, 75.0, 48.0, 35.0, 22.0, 18.0, 11.0, 7.0, 10.0, 4.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-15.671875, -15.178955078125, -14.68603515625, -14.193115234375, -13.7001953125, -13.207275390625, -12.71435546875, -12.221435546875, -11.728515625, -11.235595703125, -10.74267578125, -10.249755859375, -9.7568359375, -9.263916015625, -8.77099609375, -8.278076171875, -7.78515625, -7.292236328125, -6.79931640625, -6.306396484375, -5.8134765625, -5.320556640625, -4.82763671875, -4.334716796875, -3.841796875, -3.348876953125, -2.85595703125, -2.363037109375, -1.8701171875, -1.377197265625, -0.88427734375, -0.391357421875, 0.1015625, 0.594482421875, 1.08740234375, 1.580322265625, 2.0732421875, 2.566162109375, 3.05908203125, 3.552001953125, 4.044921875, 4.537841796875, 5.03076171875, 5.523681640625, 6.0166015625, 6.509521484375, 7.00244140625, 7.495361328125, 7.98828125, 8.481201171875, 8.97412109375, 9.467041015625, 9.9599609375, 10.452880859375, 10.94580078125, 11.438720703125, 11.931640625, 12.424560546875, 12.91748046875, 13.410400390625, 13.9033203125, 14.396240234375, 14.88916015625, 15.382080078125, 15.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 5.0, 6.0, 6.0, 12.0, 7.0, 7.0, 17.0, 28.0, 28.0, 28.0, 43.0, 38.0, 49.0, 65.0, 49.0, 63.0, 62.0, 64.0, 52.0, 59.0, 47.0, 56.0, 46.0, 35.0, 19.0, 26.0, 17.0, 9.0, 11.0, 8.0, 10.0, 6.0, 7.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0014410018920898438, -0.0013992488384246826, -0.0013574957847595215, -0.0013157427310943604, -0.0012739896774291992, -0.001232236623764038, -0.001190483570098877, -0.0011487305164337158, -0.0011069774627685547, -0.0010652244091033936, -0.0010234713554382324, -0.0009817183017730713, -0.0009399652481079102, -0.000898212194442749, -0.0008564591407775879, -0.0008147060871124268, -0.0007729530334472656, -0.0007311999797821045, -0.0006894469261169434, -0.0006476938724517822, -0.0006059408187866211, -0.00056418776512146, -0.0005224347114562988, -0.0004806816577911377, -0.00043892860412597656, -0.00039717555046081543, -0.0003554224967956543, -0.00031366944313049316, -0.00027191638946533203, -0.0002301633358001709, -0.00018841028213500977, -0.00014665722846984863, -0.0001049041748046875, -6.315112113952637e-05, -2.1398067474365234e-05, 2.03549861907959e-05, 6.210803985595703e-05, 0.00010386109352111816, 0.0001456141471862793, 0.00018736720085144043, 0.00022912025451660156, 0.0002708733081817627, 0.00031262636184692383, 0.00035437941551208496, 0.0003961324691772461, 0.0004378855228424072, 0.00047963857650756836, 0.0005213916301727295, 0.0005631446838378906, 0.0006048977375030518, 0.0006466507911682129, 0.000688403844833374, 0.0007301568984985352, 0.0007719099521636963, 0.0008136630058288574, 0.0008554160594940186, 0.0008971691131591797, 0.0009389221668243408, 0.000980675220489502, 0.001022428274154663, 0.0010641813278198242, 0.0011059343814849854, 0.0011476874351501465, 0.0011894404888153076, 0.0012311935424804688]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 10.0, 18.0, 28.0, 39.0, 48.0, 80.0, 136.0, 252.0, 325.0, 661.0, 1016.0, 1845.0, 3198.0, 5665.0, 10208.0, 17458.0, 29899.0, 50524.0, 78807.0, 113129.0, 141379.0, 152656.0, 140353.0, 109577.0, 76051.0, 48012.0, 28772.0, 16379.0, 9439.0, 5245.0, 3073.0, 1651.0, 1046.0, 618.0, 371.0, 214.0, 144.0, 86.0, 57.0, 29.0, 26.0, 14.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1484375, -12.75537109375, -12.3623046875, -11.96923828125, -11.576171875, -11.18310546875, -10.7900390625, -10.39697265625, -10.00390625, -9.61083984375, -9.2177734375, -8.82470703125, -8.431640625, -8.03857421875, -7.6455078125, -7.25244140625, -6.859375, -6.46630859375, -6.0732421875, -5.68017578125, -5.287109375, -4.89404296875, -4.5009765625, -4.10791015625, -3.71484375, -3.32177734375, -2.9287109375, -2.53564453125, -2.142578125, -1.74951171875, -1.3564453125, -0.96337890625, -0.5703125, -0.17724609375, 0.2158203125, 0.60888671875, 1.001953125, 1.39501953125, 1.7880859375, 2.18115234375, 2.57421875, 2.96728515625, 3.3603515625, 3.75341796875, 4.146484375, 4.53955078125, 4.9326171875, 5.32568359375, 5.71875, 6.11181640625, 6.5048828125, 6.89794921875, 7.291015625, 7.68408203125, 8.0771484375, 8.47021484375, 8.86328125, 9.25634765625, 9.6494140625, 10.04248046875, 10.435546875, 10.82861328125, 11.2216796875, 11.61474609375, 12.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 11.0, 6.0, 4.0, 9.0, 16.0, 20.0, 17.0, 23.0, 24.0, 38.0, 45.0, 59.0, 52.0, 56.0, 62.0, 57.0, 77.0, 71.0, 72.0, 43.0, 50.0, 49.0, 25.0, 25.0, 20.0, 15.0, 11.0, 12.0, 5.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.65625, -5.47161865234375, -5.2869873046875, -5.10235595703125, -4.917724609375, -4.73309326171875, -4.5484619140625, -4.36383056640625, -4.17919921875, -3.99456787109375, -3.8099365234375, -3.62530517578125, -3.440673828125, -3.25604248046875, -3.0714111328125, -2.88677978515625, -2.7021484375, -2.51751708984375, -2.3328857421875, -2.14825439453125, -1.963623046875, -1.77899169921875, -1.5943603515625, -1.40972900390625, -1.22509765625, -1.04046630859375, -0.8558349609375, -0.67120361328125, -0.486572265625, -0.30194091796875, -0.1173095703125, 0.06732177734375, 0.251953125, 0.43658447265625, 0.6212158203125, 0.80584716796875, 0.990478515625, 1.17510986328125, 1.3597412109375, 1.54437255859375, 1.72900390625, 1.91363525390625, 2.0982666015625, 2.28289794921875, 2.467529296875, 2.65216064453125, 2.8367919921875, 3.02142333984375, 3.2060546875, 3.39068603515625, 3.5753173828125, 3.75994873046875, 3.944580078125, 4.12921142578125, 4.3138427734375, 4.49847412109375, 4.68310546875, 4.86773681640625, 5.0523681640625, 5.23699951171875, 5.421630859375, 5.60626220703125, 5.7908935546875, 5.97552490234375, 6.16015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 4.0, 1.0, 5.0, 11.0, 10.0, 7.0, 9.0, 7.0, 14.0, 11.0, 20.0, 21.0, 28.0, 23.0, 25.0, 27.0, 26.0, 26.0, 36.0, 32.0, 42.0, 36.0, 36.0, 32.0, 44.0, 38.0, 36.0, 38.0, 42.0, 35.0, 37.0, 25.0, 27.0, 31.0, 27.0, 23.0, 11.0, 23.0, 10.0, 16.0, 12.0, 11.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-32.09178161621094, -31.142948150634766, -30.194114685058594, -29.245281219482422, -28.29644775390625, -27.347614288330078, -26.398780822753906, -25.449947357177734, -24.501113891601562, -23.55228042602539, -22.60344696044922, -21.654613494873047, -20.705780029296875, -19.756946563720703, -18.80811309814453, -17.85927963256836, -16.910446166992188, -15.961612701416016, -15.012779235839844, -14.063945770263672, -13.1151123046875, -12.166278839111328, -11.217445373535156, -10.268611907958984, -9.319778442382812, -8.37094497680664, -7.422111511230469, -6.473278045654297, -5.524444580078125, -4.575611114501953, -3.6267776489257812, -2.6779441833496094, -1.7291126251220703, -0.7802791595458984, 0.16855430603027344, 1.1173877716064453, 2.066221237182617, 3.015054702758789, 3.963888168334961, 4.912721633911133, 5.861555099487305, 6.810388565063477, 7.759222030639648, 8.70805549621582, 9.656888961791992, 10.605722427368164, 11.554555892944336, 12.503389358520508, 13.45222282409668, 14.401056289672852, 15.349889755249023, 16.298723220825195, 17.247556686401367, 18.19639015197754, 19.14522361755371, 20.094057083129883, 21.042890548706055, 21.991724014282227, 22.9405574798584, 23.88939094543457, 24.838224411010742, 25.787057876586914, 26.735891342163086, 27.684724807739258, 28.63355827331543]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 11.0, 4.0, 9.0, 6.0, 12.0, 17.0, 14.0, 12.0, 15.0, 19.0, 27.0, 24.0, 36.0, 38.0, 35.0, 36.0, 45.0, 32.0, 45.0, 48.0, 35.0, 52.0, 45.0, 35.0, 43.0, 38.0, 33.0, 41.0, 34.0, 28.0, 18.0, 22.0, 22.0, 16.0, 14.0, 11.0, 6.0, 8.0, 5.0, 4.0, 5.0, 5.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.34571075439453, -41.03445053100586, -39.72319030761719, -38.41193389892578, -37.10067367553711, -35.78941345214844, -34.478153228759766, -33.166893005371094, -31.855634689331055, -30.544374465942383, -29.233116149902344, -27.921855926513672, -26.610595703125, -25.29933738708496, -23.98807716369629, -22.67681884765625, -21.365558624267578, -20.054298400878906, -18.743040084838867, -17.431779861450195, -16.120521545410156, -14.809261322021484, -13.498001098632812, -12.186741828918457, -10.875482559204102, -9.564223289489746, -8.25296401977539, -6.941703796386719, -5.630444526672363, -4.319185256958008, -3.007925510406494, -1.6966657638549805, -0.3854026794433594, 0.9258568286895752, 2.2371163368225098, 3.5483758449554443, 4.859635353088379, 6.170894622802734, 7.482154369354248, 8.793414115905762, 10.104673385620117, 11.415932655334473, 12.727191925048828, 14.0384521484375, 15.349711418151855, 16.66097068786621, 17.972230911254883, 19.283489227294922, 20.594749450683594, 21.906009674072266, 23.217267990112305, 24.528528213500977, 25.839786529541016, 27.151046752929688, 28.46230697631836, 29.77356719970703, 31.08482551574707, 32.39608383178711, 33.70734405517578, 35.01860427856445, 36.329864501953125, 37.64112091064453, 38.9523811340332, 40.263641357421875, 41.57490158081055]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 13.0, 25.0, 33.0, 47.0, 81.0, 139.0, 265.0, 391.0, 665.0, 1193.0, 2035.0, 3361.0, 5908.0, 10023.0, 16822.0, 28450.0, 46892.0, 76656.0, 121951.0, 188291.0, 274831.0, 373979.0, 466791.0, 521445.0, 518542.0, 453939.0, 357404.0, 258461.0, 175922.0, 112480.0, 70667.0, 42850.0, 26035.0, 15440.0, 9068.0, 5449.0, 3204.0, 1869.0, 1077.0, 654.0, 384.0, 230.0, 116.0, 84.0, 56.0, 25.0, 22.0, 8.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.640625, -25.80615234375, -24.9716796875, -24.13720703125, -23.302734375, -22.46826171875, -21.6337890625, -20.79931640625, -19.96484375, -19.13037109375, -18.2958984375, -17.46142578125, -16.626953125, -15.79248046875, -14.9580078125, -14.12353515625, -13.2890625, -12.45458984375, -11.6201171875, -10.78564453125, -9.951171875, -9.11669921875, -8.2822265625, -7.44775390625, -6.61328125, -5.77880859375, -4.9443359375, -4.10986328125, -3.275390625, -2.44091796875, -1.6064453125, -0.77197265625, 0.0625, 0.89697265625, 1.7314453125, 2.56591796875, 3.400390625, 4.23486328125, 5.0693359375, 5.90380859375, 6.73828125, 7.57275390625, 8.4072265625, 9.24169921875, 10.076171875, 10.91064453125, 11.7451171875, 12.57958984375, 13.4140625, 14.24853515625, 15.0830078125, 15.91748046875, 16.751953125, 17.58642578125, 18.4208984375, 19.25537109375, 20.08984375, 20.92431640625, 21.7587890625, 22.59326171875, 23.427734375, 24.26220703125, 25.0966796875, 25.93115234375, 26.765625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 20.0, 11.0, 15.0, 14.0, 18.0, 18.0, 19.0, 27.0, 33.0, 34.0, 36.0, 32.0, 33.0, 43.0, 48.0, 50.0, 48.0, 43.0, 40.0, 45.0, 44.0, 31.0, 33.0, 36.0, 28.0, 32.0, 37.0, 21.0, 17.0, 15.0, 16.0, 9.0, 10.0, 6.0, 8.0, 2.0, 5.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.96875, -29.96142578125, -28.9541015625, -27.94677734375, -26.939453125, -25.93212890625, -24.9248046875, -23.91748046875, -22.91015625, -21.90283203125, -20.8955078125, -19.88818359375, -18.880859375, -17.87353515625, -16.8662109375, -15.85888671875, -14.8515625, -13.84423828125, -12.8369140625, -11.82958984375, -10.822265625, -9.81494140625, -8.8076171875, -7.80029296875, -6.79296875, -5.78564453125, -4.7783203125, -3.77099609375, -2.763671875, -1.75634765625, -0.7490234375, 0.25830078125, 1.265625, 2.27294921875, 3.2802734375, 4.28759765625, 5.294921875, 6.30224609375, 7.3095703125, 8.31689453125, 9.32421875, 10.33154296875, 11.3388671875, 12.34619140625, 13.353515625, 14.36083984375, 15.3681640625, 16.37548828125, 17.3828125, 18.39013671875, 19.3974609375, 20.40478515625, 21.412109375, 22.41943359375, 23.4267578125, 24.43408203125, 25.44140625, 26.44873046875, 27.4560546875, 28.46337890625, 29.470703125, 30.47802734375, 31.4853515625, 32.49267578125, 33.5]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 19.0, 30.0, 48.0, 85.0, 111.0, 173.0, 296.0, 480.0, 765.0, 1237.0, 2126.0, 3208.0, 5316.0, 8195.0, 12912.0, 20312.0, 31180.0, 46370.0, 67790.0, 99668.0, 137080.0, 186088.0, 241251.0, 298699.0, 350631.0, 387364.0, 400303.0, 386639.0, 350338.0, 297091.0, 240891.0, 184443.0, 137140.0, 97023.0, 67740.0, 46251.0, 30562.0, 19992.0, 12605.0, 8241.0, 5102.0, 3291.0, 1992.0, 1249.0, 744.0, 435.0, 299.0, 166.0, 131.0, 72.0, 41.0, 26.0, 17.0, 10.0, 6.0, 2.0, 3.0, 3.0], "bins": [-22.390625, -21.701416015625, -21.01220703125, -20.322998046875, -19.6337890625, -18.944580078125, -18.25537109375, -17.566162109375, -16.876953125, -16.187744140625, -15.49853515625, -14.809326171875, -14.1201171875, -13.430908203125, -12.74169921875, -12.052490234375, -11.36328125, -10.674072265625, -9.98486328125, -9.295654296875, -8.6064453125, -7.917236328125, -7.22802734375, -6.538818359375, -5.849609375, -5.160400390625, -4.47119140625, -3.781982421875, -3.0927734375, -2.403564453125, -1.71435546875, -1.025146484375, -0.3359375, 0.353271484375, 1.04248046875, 1.731689453125, 2.4208984375, 3.110107421875, 3.79931640625, 4.488525390625, 5.177734375, 5.866943359375, 6.55615234375, 7.245361328125, 7.9345703125, 8.623779296875, 9.31298828125, 10.002197265625, 10.69140625, 11.380615234375, 12.06982421875, 12.759033203125, 13.4482421875, 14.137451171875, 14.82666015625, 15.515869140625, 16.205078125, 16.894287109375, 17.58349609375, 18.272705078125, 18.9619140625, 19.651123046875, 20.34033203125, 21.029541015625, 21.71875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 15.0, 9.0, 19.0, 7.0, 32.0, 26.0, 38.0, 43.0, 61.0, 72.0, 98.0, 119.0, 124.0, 154.0, 217.0, 212.0, 227.0, 229.0, 229.0, 239.0, 251.0, 231.0, 216.0, 221.0, 184.0, 153.0, 119.0, 117.0, 85.0, 73.0, 67.0, 46.0, 45.0, 24.0, 18.0, 17.0, 10.0, 9.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.5892333984375, -12.108154296875, -11.6270751953125, -11.14599609375, -10.6649169921875, -10.183837890625, -9.7027587890625, -9.2216796875, -8.7406005859375, -8.259521484375, -7.7784423828125, -7.29736328125, -6.8162841796875, -6.335205078125, -5.8541259765625, -5.373046875, -4.8919677734375, -4.410888671875, -3.9298095703125, -3.44873046875, -2.9676513671875, -2.486572265625, -2.0054931640625, -1.5244140625, -1.0433349609375, -0.562255859375, -0.0811767578125, 0.39990234375, 0.8809814453125, 1.362060546875, 1.8431396484375, 2.32421875, 2.8052978515625, 3.286376953125, 3.7674560546875, 4.24853515625, 4.7296142578125, 5.210693359375, 5.6917724609375, 6.1728515625, 6.6539306640625, 7.135009765625, 7.6160888671875, 8.09716796875, 8.5782470703125, 9.059326171875, 9.5404052734375, 10.021484375, 10.5025634765625, 10.983642578125, 11.4647216796875, 11.94580078125, 12.4268798828125, 12.907958984375, 13.3890380859375, 13.8701171875, 14.3511962890625, 14.832275390625, 15.3133544921875, 15.79443359375, 16.2755126953125, 16.756591796875, 17.2376708984375, 17.71875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 8.0, 1.0, 4.0, 6.0, 8.0, 5.0, 11.0, 12.0, 17.0, 15.0, 20.0, 26.0, 21.0, 37.0, 32.0, 37.0, 32.0, 54.0, 27.0, 34.0, 44.0, 40.0, 36.0, 37.0, 36.0, 45.0, 29.0, 51.0, 31.0, 36.0, 36.0, 26.0, 22.0, 24.0, 12.0, 12.0, 10.0, 10.0, 8.0, 11.0, 11.0, 5.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-31.60767364501953, -30.733016967773438, -29.858360290527344, -28.98370361328125, -28.109045028686523, -27.23438835144043, -26.359731674194336, -25.485074996948242, -24.610416412353516, -23.735759735107422, -22.861103057861328, -21.986446380615234, -21.111787796020508, -20.237131118774414, -19.36247444152832, -18.487817764282227, -17.613161087036133, -16.73850440979004, -15.863846778869629, -14.989190101623535, -14.114532470703125, -13.239875793457031, -12.365219116210938, -11.490562438964844, -10.615904808044434, -9.74124813079834, -8.86659049987793, -7.991933822631836, -7.117276668548584, -6.242619514465332, -5.367962837219238, -4.493305683135986, -3.6186485290527344, -2.7439913749694824, -1.8693344593048096, -0.9946775436401367, -0.12002038955688477, 0.7546367645263672, 1.629293441772461, 2.503950595855713, 3.378607749938965, 4.253264904022217, 5.127922058105469, 6.0025787353515625, 6.8772358894348145, 7.751893043518066, 8.62654972076416, 9.50120735168457, 10.375864028930664, 11.250520706176758, 12.125178337097168, 12.999835014343262, 13.874492645263672, 14.749149322509766, 15.62380599975586, 16.498462677001953, 17.373119354248047, 18.24777603149414, 19.122432708740234, 19.997089385986328, 20.871747970581055, 21.74640464782715, 22.621061325073242, 23.495718002319336, 24.370376586914062]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 9.0, 8.0, 5.0, 7.0, 15.0, 12.0, 19.0, 25.0, 30.0, 23.0, 20.0, 36.0, 43.0, 36.0, 48.0, 29.0, 33.0, 42.0, 35.0, 46.0, 40.0, 40.0, 50.0, 41.0, 40.0, 30.0, 31.0, 27.0, 19.0, 23.0, 30.0, 11.0, 20.0, 7.0, 13.0, 11.0, 8.0, 1.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.73747634887695, -31.653339385986328, -30.569204330444336, -29.48506736755371, -28.40093231201172, -27.316795349121094, -26.23265838623047, -25.148521423339844, -24.06438636779785, -22.980249404907227, -21.896114349365234, -20.81197738647461, -19.727840423583984, -18.643705368041992, -17.559568405151367, -16.475433349609375, -15.39129638671875, -14.307160377502441, -13.223024368286133, -12.138887405395508, -11.0547513961792, -9.97061538696289, -8.886478424072266, -7.802342414855957, -6.718206405639648, -5.63407039642334, -4.549933910369873, -3.4657976627349854, -2.3816614151000977, -1.297525405883789, -0.21338891983032227, 0.8707475662231445, 1.9548873901367188, 3.0390236377716064, 4.123159885406494, 5.207296371459961, 6.2914323806762695, 7.375568389892578, 8.459705352783203, 9.543841361999512, 10.62797737121582, 11.712113380432129, 12.796249389648438, 13.880386352539062, 14.964522361755371, 16.04865837097168, 17.132795333862305, 18.216930389404297, 19.301067352294922, 20.385204315185547, 21.46933937072754, 22.553476333618164, 23.637611389160156, 24.72174835205078, 25.805885314941406, 26.89002227783203, 27.974157333374023, 29.05829429626465, 30.14242935180664, 31.226566314697266, 32.31070327758789, 33.39483642578125, 34.478973388671875, 35.5631103515625, 36.647247314453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 13.0, 22.0, 30.0, 44.0, 41.0, 93.0, 115.0, 206.0, 301.0, 493.0, 817.0, 1377.0, 2310.0, 4009.0, 6763.0, 12256.0, 22502.0, 40070.0, 70428.0, 114805.0, 166864.0, 190421.0, 159066.0, 106773.0, 64861.0, 36580.0, 20516.0, 11512.0, 6324.0, 3565.0, 2123.0, 1210.0, 775.0, 470.0, 283.0, 191.0, 108.0, 62.0, 50.0, 29.0, 25.0, 22.0, 3.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.3125, -11.920654296875, -11.52880859375, -11.136962890625, -10.7451171875, -10.353271484375, -9.96142578125, -9.569580078125, -9.177734375, -8.785888671875, -8.39404296875, -8.002197265625, -7.6103515625, -7.218505859375, -6.82666015625, -6.434814453125, -6.04296875, -5.651123046875, -5.25927734375, -4.867431640625, -4.4755859375, -4.083740234375, -3.69189453125, -3.300048828125, -2.908203125, -2.516357421875, -2.12451171875, -1.732666015625, -1.3408203125, -0.948974609375, -0.55712890625, -0.165283203125, 0.2265625, 0.618408203125, 1.01025390625, 1.402099609375, 1.7939453125, 2.185791015625, 2.57763671875, 2.969482421875, 3.361328125, 3.753173828125, 4.14501953125, 4.536865234375, 4.9287109375, 5.320556640625, 5.71240234375, 6.104248046875, 6.49609375, 6.887939453125, 7.27978515625, 7.671630859375, 8.0634765625, 8.455322265625, 8.84716796875, 9.239013671875, 9.630859375, 10.022705078125, 10.41455078125, 10.806396484375, 11.1982421875, 11.590087890625, 11.98193359375, 12.373779296875, 12.765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 12.0, 4.0, 10.0, 4.0, 11.0, 14.0, 20.0, 18.0, 29.0, 21.0, 19.0, 35.0, 30.0, 35.0, 32.0, 47.0, 39.0, 47.0, 44.0, 40.0, 50.0, 51.0, 49.0, 44.0, 29.0, 33.0, 36.0, 28.0, 21.0, 25.0, 19.0, 22.0, 13.0, 14.0, 11.0, 9.0, 9.0, 4.0, 9.0, 4.0, 6.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -31.90185546875, -30.7412109375, -29.58056640625, -28.419921875, -27.25927734375, -26.0986328125, -24.93798828125, -23.77734375, -22.61669921875, -21.4560546875, -20.29541015625, -19.134765625, -17.97412109375, -16.8134765625, -15.65283203125, -14.4921875, -13.33154296875, -12.1708984375, -11.01025390625, -9.849609375, -8.68896484375, -7.5283203125, -6.36767578125, -5.20703125, -4.04638671875, -2.8857421875, -1.72509765625, -0.564453125, 0.59619140625, 1.7568359375, 2.91748046875, 4.078125, 5.23876953125, 6.3994140625, 7.56005859375, 8.720703125, 9.88134765625, 11.0419921875, 12.20263671875, 13.36328125, 14.52392578125, 15.6845703125, 16.84521484375, 18.005859375, 19.16650390625, 20.3271484375, 21.48779296875, 22.6484375, 23.80908203125, 24.9697265625, 26.13037109375, 27.291015625, 28.45166015625, 29.6123046875, 30.77294921875, 31.93359375, 33.09423828125, 34.2548828125, 35.41552734375, 36.576171875, 37.73681640625, 38.8974609375, 40.05810546875, 41.21875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 8.0, 8.0, 15.0, 18.0, 23.0, 42.0, 68.0, 118.0, 174.0, 290.0, 474.0, 710.0, 1274.0, 2254.0, 4166.0, 7545.0, 14091.0, 27569.0, 52371.0, 97072.0, 160767.0, 207476.0, 190280.0, 128108.0, 72031.0, 38642.0, 19676.0, 10379.0, 5675.0, 2969.0, 1774.0, 968.0, 570.0, 374.0, 199.0, 139.0, 84.0, 52.0, 46.0, 24.0, 22.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.0535888671875, -7.763427734375, -7.4732666015625, -7.18310546875, -6.8929443359375, -6.602783203125, -6.3126220703125, -6.0224609375, -5.7322998046875, -5.442138671875, -5.1519775390625, -4.86181640625, -4.5716552734375, -4.281494140625, -3.9913330078125, -3.701171875, -3.4110107421875, -3.120849609375, -2.8306884765625, -2.54052734375, -2.2503662109375, -1.960205078125, -1.6700439453125, -1.3798828125, -1.0897216796875, -0.799560546875, -0.5093994140625, -0.21923828125, 0.0709228515625, 0.361083984375, 0.6512451171875, 0.94140625, 1.2315673828125, 1.521728515625, 1.8118896484375, 2.10205078125, 2.3922119140625, 2.682373046875, 2.9725341796875, 3.2626953125, 3.5528564453125, 3.843017578125, 4.1331787109375, 4.42333984375, 4.7135009765625, 5.003662109375, 5.2938232421875, 5.583984375, 5.8741455078125, 6.164306640625, 6.4544677734375, 6.74462890625, 7.0347900390625, 7.324951171875, 7.6151123046875, 7.9052734375, 8.1954345703125, 8.485595703125, 8.7757568359375, 9.06591796875, 9.3560791015625, 9.646240234375, 9.9364013671875, 10.2265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 7.0, 15.0, 18.0, 16.0, 13.0, 18.0, 28.0, 27.0, 27.0, 32.0, 30.0, 42.0, 36.0, 32.0, 38.0, 41.0, 50.0, 43.0, 40.0, 41.0, 42.0, 44.0, 27.0, 36.0, 23.0, 29.0, 21.0, 28.0, 15.0, 18.0, 23.0, 20.0, 12.0, 15.0, 12.0, 3.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.453125, -20.741943359375, -20.03076171875, -19.319580078125, -18.6083984375, -17.897216796875, -17.18603515625, -16.474853515625, -15.763671875, -15.052490234375, -14.34130859375, -13.630126953125, -12.9189453125, -12.207763671875, -11.49658203125, -10.785400390625, -10.07421875, -9.363037109375, -8.65185546875, -7.940673828125, -7.2294921875, -6.518310546875, -5.80712890625, -5.095947265625, -4.384765625, -3.673583984375, -2.96240234375, -2.251220703125, -1.5400390625, -0.828857421875, -0.11767578125, 0.593505859375, 1.3046875, 2.015869140625, 2.72705078125, 3.438232421875, 4.1494140625, 4.860595703125, 5.57177734375, 6.282958984375, 6.994140625, 7.705322265625, 8.41650390625, 9.127685546875, 9.8388671875, 10.550048828125, 11.26123046875, 11.972412109375, 12.68359375, 13.394775390625, 14.10595703125, 14.817138671875, 15.5283203125, 16.239501953125, 16.95068359375, 17.661865234375, 18.373046875, 19.084228515625, 19.79541015625, 20.506591796875, 21.2177734375, 21.928955078125, 22.64013671875, 23.351318359375, 24.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 6.0, 9.0, 15.0, 17.0, 44.0, 57.0, 66.0, 100.0, 140.0, 186.0, 284.0, 418.0, 551.0, 862.0, 1234.0, 1883.0, 2988.0, 5102.0, 8777.0, 16503.0, 34912.0, 82220.0, 202588.0, 332736.0, 201034.0, 82058.0, 34636.0, 16544.0, 8658.0, 5033.0, 3054.0, 1875.0, 1221.0, 845.0, 567.0, 428.0, 260.0, 203.0, 144.0, 89.0, 64.0, 47.0, 26.0, 22.0, 8.0, 17.0, 11.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.529296875, -3.41357421875, -3.2978515625, -3.18212890625, -3.06640625, -2.95068359375, -2.8349609375, -2.71923828125, -2.603515625, -2.48779296875, -2.3720703125, -2.25634765625, -2.140625, -2.02490234375, -1.9091796875, -1.79345703125, -1.677734375, -1.56201171875, -1.4462890625, -1.33056640625, -1.21484375, -1.09912109375, -0.9833984375, -0.86767578125, -0.751953125, -0.63623046875, -0.5205078125, -0.40478515625, -0.2890625, -0.17333984375, -0.0576171875, 0.05810546875, 0.173828125, 0.28955078125, 0.4052734375, 0.52099609375, 0.63671875, 0.75244140625, 0.8681640625, 0.98388671875, 1.099609375, 1.21533203125, 1.3310546875, 1.44677734375, 1.5625, 1.67822265625, 1.7939453125, 1.90966796875, 2.025390625, 2.14111328125, 2.2568359375, 2.37255859375, 2.48828125, 2.60400390625, 2.7197265625, 2.83544921875, 2.951171875, 3.06689453125, 3.1826171875, 3.29833984375, 3.4140625, 3.52978515625, 3.6455078125, 3.76123046875, 3.876953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 19.0, 14.0, 22.0, 33.0, 72.0, 118.0, 160.0, 156.0, 153.0, 85.0, 58.0, 37.0, 25.0, 14.0, 10.0, 11.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0018568038940429688, -0.00181589275598526, -0.0017749816179275513, -0.0017340704798698425, -0.0016931593418121338, -0.001652248203754425, -0.0016113370656967163, -0.0015704259276390076, -0.0015295147895812988, -0.00148860365152359, -0.0014476925134658813, -0.0014067813754081726, -0.0013658702373504639, -0.0013249590992927551, -0.0012840479612350464, -0.0012431368231773376, -0.001202225685119629, -0.0011613145470619202, -0.0011204034090042114, -0.0010794922709465027, -0.001038581132888794, -0.0009976699948310852, -0.0009567588567733765, -0.0009158477187156677, -0.000874936580657959, -0.0008340254426002502, -0.0007931143045425415, -0.0007522031664848328, -0.000711292028427124, -0.0006703808903694153, -0.0006294697523117065, -0.0005885586142539978, -0.0005476474761962891, -0.0005067363381385803, -0.0004658252000808716, -0.00042491406202316284, -0.0003840029239654541, -0.00034309178590774536, -0.0003021806478500366, -0.0002612695097923279, -0.00022035837173461914, -0.0001794472336769104, -0.00013853609561920166, -9.762495756149292e-05, -5.671381950378418e-05, -1.580268144607544e-05, 2.51084566116333e-05, 6.601959466934204e-05, 0.00010693073272705078, 0.00014784187078475952, 0.00018875300884246826, 0.000229664146900177, 0.00027057528495788574, 0.0003114864230155945, 0.0003523975610733032, 0.00039330869913101196, 0.0004342198371887207, 0.00047513097524642944, 0.0005160421133041382, 0.0005569532513618469, 0.0005978643894195557, 0.0006387755274772644, 0.0006796866655349731, 0.0007205978035926819, 0.0007615089416503906]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 9.0, 24.0, 17.0, 32.0, 50.0, 67.0, 117.0, 156.0, 220.0, 311.0, 423.0, 693.0, 979.0, 1468.0, 2204.0, 3245.0, 4904.0, 7494.0, 11883.0, 19335.0, 32328.0, 54773.0, 93136.0, 149717.0, 197481.0, 175314.0, 116296.0, 69198.0, 40825.0, 24053.0, 14679.0, 9374.0, 5884.0, 3879.0, 2572.0, 1711.0, 1165.0, 801.0, 525.0, 352.0, 249.0, 198.0, 134.0, 102.0, 49.0, 35.0, 36.0, 23.0, 13.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.40625, -4.2628173828125, -4.119384765625, -3.9759521484375, -3.83251953125, -3.6890869140625, -3.545654296875, -3.4022216796875, -3.2587890625, -3.1153564453125, -2.971923828125, -2.8284912109375, -2.68505859375, -2.5416259765625, -2.398193359375, -2.2547607421875, -2.111328125, -1.9678955078125, -1.824462890625, -1.6810302734375, -1.53759765625, -1.3941650390625, -1.250732421875, -1.1072998046875, -0.9638671875, -0.8204345703125, -0.677001953125, -0.5335693359375, -0.39013671875, -0.2467041015625, -0.103271484375, 0.0401611328125, 0.18359375, 0.3270263671875, 0.470458984375, 0.6138916015625, 0.75732421875, 0.9007568359375, 1.044189453125, 1.1876220703125, 1.3310546875, 1.4744873046875, 1.617919921875, 1.7613525390625, 1.90478515625, 2.0482177734375, 2.191650390625, 2.3350830078125, 2.478515625, 2.6219482421875, 2.765380859375, 2.9088134765625, 3.05224609375, 3.1956787109375, 3.339111328125, 3.4825439453125, 3.6259765625, 3.7694091796875, 3.912841796875, 4.0562744140625, 4.19970703125, 4.3431396484375, 4.486572265625, 4.6300048828125, 4.7734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 4.0, 3.0, 7.0, 7.0, 5.0, 10.0, 16.0, 18.0, 13.0, 24.0, 17.0, 27.0, 31.0, 46.0, 51.0, 43.0, 76.0, 54.0, 72.0, 68.0, 62.0, 55.0, 48.0, 48.0, 25.0, 23.0, 28.0, 14.0, 11.0, 14.0, 11.0, 8.0, 8.0, 5.0, 6.0, 6.0, 6.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.369140625, -1.3266143798828125, -1.284088134765625, -1.2415618896484375, -1.19903564453125, -1.1565093994140625, -1.113983154296875, -1.0714569091796875, -1.0289306640625, -0.9864044189453125, -0.943878173828125, -0.9013519287109375, -0.85882568359375, -0.8162994384765625, -0.773773193359375, -0.7312469482421875, -0.688720703125, -0.6461944580078125, -0.603668212890625, -0.5611419677734375, -0.51861572265625, -0.4760894775390625, -0.433563232421875, -0.3910369873046875, -0.3485107421875, -0.3059844970703125, -0.263458251953125, -0.2209320068359375, -0.17840576171875, -0.1358795166015625, -0.093353271484375, -0.0508270263671875, -0.00830078125, 0.0342254638671875, 0.076751708984375, 0.1192779541015625, 0.16180419921875, 0.2043304443359375, 0.246856689453125, 0.2893829345703125, 0.3319091796875, 0.3744354248046875, 0.416961669921875, 0.4594879150390625, 0.50201416015625, 0.5445404052734375, 0.587066650390625, 0.6295928955078125, 0.672119140625, 0.7146453857421875, 0.757171630859375, 0.7996978759765625, 0.84222412109375, 0.8847503662109375, 0.927276611328125, 0.9698028564453125, 1.0123291015625, 1.0548553466796875, 1.097381591796875, 1.1399078369140625, 1.18243408203125, 1.2249603271484375, 1.267486572265625, 1.3100128173828125, 1.3525390625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 2.0, 7.0, 7.0, 4.0, 4.0, 7.0, 8.0, 18.0, 9.0, 17.0, 21.0, 32.0, 30.0, 33.0, 29.0, 41.0, 30.0, 43.0, 42.0, 24.0, 46.0, 34.0, 40.0, 47.0, 40.0, 48.0, 30.0, 48.0, 31.0, 35.0, 27.0, 27.0, 22.0, 15.0, 17.0, 8.0, 12.0, 16.0, 13.0, 8.0, 4.0, 7.0, 6.0, 6.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-31.824756622314453, -30.9390869140625, -30.053415298461914, -29.16774559020996, -28.282075881958008, -27.396404266357422, -26.51073455810547, -25.625064849853516, -24.73939323425293, -23.853723526000977, -22.96805191040039, -22.082382202148438, -21.196712493896484, -20.3110408782959, -19.425371170043945, -18.53969955444336, -17.654029846191406, -16.768360137939453, -15.882689476013184, -14.997018814086914, -14.111348152160645, -13.225677490234375, -12.340007781982422, -11.454337120056152, -10.568668365478516, -9.682997703552246, -8.797327995300293, -7.911657333374023, -7.025986671447754, -6.140316486358643, -5.254646301269531, -4.368975639343262, -3.483304977416992, -2.5976345539093018, -1.7119642496109009, -0.8262939453125, 0.05937647819519043, 0.9450469017028809, 1.8307170867919922, 2.7163877487182617, 3.602057933807373, 4.487728118896484, 5.373398780822754, 6.259068965911865, 7.144739151000977, 8.030409812927246, 8.916080474853516, 9.801750183105469, 10.687420845031738, 11.573091506958008, 12.458761215209961, 13.34443187713623, 14.2301025390625, 15.115772247314453, 16.001441955566406, 16.887113571166992, 17.772783279418945, 18.6584529876709, 19.544124603271484, 20.429794311523438, 21.31546401977539, 22.201135635375977, 23.08680534362793, 23.972476959228516, 24.85814666748047]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 1.0, 5.0, 4.0, 9.0, 7.0, 6.0, 5.0, 11.0, 17.0, 22.0, 19.0, 34.0, 17.0, 25.0, 31.0, 37.0, 44.0, 47.0, 33.0, 34.0, 37.0, 44.0, 33.0, 49.0, 35.0, 55.0, 35.0, 46.0, 29.0, 26.0, 30.0, 21.0, 31.0, 25.0, 13.0, 16.0, 7.0, 12.0, 11.0, 10.0, 3.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.50355529785156, -31.424339294433594, -30.345121383666992, -29.265905380249023, -28.186687469482422, -27.107471466064453, -26.028255462646484, -24.949037551879883, -23.86981964111328, -22.790603637695312, -21.71138572692871, -20.632169723510742, -19.55295181274414, -18.473735809326172, -17.394519805908203, -16.3153018951416, -15.236085891723633, -14.156868934631348, -13.077651977539062, -11.998435974121094, -10.919218063354492, -9.840002059936523, -8.760785102844238, -7.681568145751953, -6.602351188659668, -5.523134231567383, -4.443917274475098, -3.3647007942199707, -2.2854838371276855, -1.2062668800354004, -0.12705039978027344, 0.9521665573120117, 2.031383514404297, 3.110600471496582, 4.189817428588867, 5.269033908843994, 6.348250865936279, 7.4274678230285645, 8.506684303283691, 9.585901260375977, 10.665118217468262, 11.744335174560547, 12.823552131652832, 13.902769088745117, 14.981985092163086, 16.061203002929688, 17.140419006347656, 18.219635009765625, 19.298852920532227, 20.378068923950195, 21.457286834716797, 22.536502838134766, 23.615720748901367, 24.694936752319336, 25.774154663085938, 26.853370666503906, 27.932586669921875, 29.011802673339844, 30.091020584106445, 31.170236587524414, 32.249454498291016, 33.328670501708984, 34.40788650512695, 35.48710632324219, 36.566322326660156]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 10.0, 17.0, 33.0, 46.0, 57.0, 139.0, 212.0, 251.0, 403.0, 600.0, 932.0, 1410.0, 2157.0, 3335.0, 4874.0, 7318.0, 10556.0, 15587.0, 21969.0, 30119.0, 40230.0, 52326.0, 65091.0, 77601.0, 87027.0, 93436.0, 93597.0, 88491.0, 79700.0, 67422.0, 54437.0, 43155.0, 31506.0, 23136.0, 16459.0, 11373.0, 7797.0, 5389.0, 3450.0, 2431.0, 1521.0, 993.0, 646.0, 450.0, 323.0, 174.0, 141.0, 81.0, 42.0, 37.0, 20.0, 16.0, 10.0, 4.0, 0.0, 8.0, 4.0], "bins": [-22.53125, -21.850341796875, -21.16943359375, -20.488525390625, -19.8076171875, -19.126708984375, -18.44580078125, -17.764892578125, -17.083984375, -16.403076171875, -15.72216796875, -15.041259765625, -14.3603515625, -13.679443359375, -12.99853515625, -12.317626953125, -11.63671875, -10.955810546875, -10.27490234375, -9.593994140625, -8.9130859375, -8.232177734375, -7.55126953125, -6.870361328125, -6.189453125, -5.508544921875, -4.82763671875, -4.146728515625, -3.4658203125, -2.784912109375, -2.10400390625, -1.423095703125, -0.7421875, -0.061279296875, 0.61962890625, 1.300537109375, 1.9814453125, 2.662353515625, 3.34326171875, 4.024169921875, 4.705078125, 5.385986328125, 6.06689453125, 6.747802734375, 7.4287109375, 8.109619140625, 8.79052734375, 9.471435546875, 10.15234375, 10.833251953125, 11.51416015625, 12.195068359375, 12.8759765625, 13.556884765625, 14.23779296875, 14.918701171875, 15.599609375, 16.280517578125, 16.96142578125, 17.642333984375, 18.3232421875, 19.004150390625, 19.68505859375, 20.365966796875, 21.046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 9.0, 17.0, 11.0, 18.0, 21.0, 17.0, 24.0, 31.0, 33.0, 31.0, 39.0, 36.0, 33.0, 38.0, 35.0, 41.0, 43.0, 40.0, 41.0, 33.0, 31.0, 38.0, 37.0, 29.0, 29.0, 30.0, 19.0, 30.0, 22.0, 12.0, 20.0, 10.0, 10.0, 6.0, 6.0, 2.0, 10.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.78125, -28.80126953125, -27.8212890625, -26.84130859375, -25.861328125, -24.88134765625, -23.9013671875, -22.92138671875, -21.94140625, -20.96142578125, -19.9814453125, -19.00146484375, -18.021484375, -17.04150390625, -16.0615234375, -15.08154296875, -14.1015625, -13.12158203125, -12.1416015625, -11.16162109375, -10.181640625, -9.20166015625, -8.2216796875, -7.24169921875, -6.26171875, -5.28173828125, -4.3017578125, -3.32177734375, -2.341796875, -1.36181640625, -0.3818359375, 0.59814453125, 1.578125, 2.55810546875, 3.5380859375, 4.51806640625, 5.498046875, 6.47802734375, 7.4580078125, 8.43798828125, 9.41796875, 10.39794921875, 11.3779296875, 12.35791015625, 13.337890625, 14.31787109375, 15.2978515625, 16.27783203125, 17.2578125, 18.23779296875, 19.2177734375, 20.19775390625, 21.177734375, 22.15771484375, 23.1376953125, 24.11767578125, 25.09765625, 26.07763671875, 27.0576171875, 28.03759765625, 29.017578125, 29.99755859375, 30.9775390625, 31.95751953125, 32.9375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 5.0, 14.0, 21.0, 26.0, 25.0, 88.0, 130.0, 184.0, 289.0, 432.0, 708.0, 1128.0, 1835.0, 2725.0, 4332.0, 6603.0, 9826.0, 15006.0, 21760.0, 30546.0, 42490.0, 56592.0, 71149.0, 85340.0, 95525.0, 101181.0, 99270.0, 91537.0, 79408.0, 64011.0, 49646.0, 36597.0, 26208.0, 18160.0, 12443.0, 8090.0, 5524.0, 3462.0, 2297.0, 1398.0, 942.0, 580.0, 383.0, 233.0, 168.0, 90.0, 54.0, 49.0, 16.0, 19.0, 5.0, 9.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.109375, -22.3330078125, -21.556640625, -20.7802734375, -20.00390625, -19.2275390625, -18.451171875, -17.6748046875, -16.8984375, -16.1220703125, -15.345703125, -14.5693359375, -13.79296875, -13.0166015625, -12.240234375, -11.4638671875, -10.6875, -9.9111328125, -9.134765625, -8.3583984375, -7.58203125, -6.8056640625, -6.029296875, -5.2529296875, -4.4765625, -3.7001953125, -2.923828125, -2.1474609375, -1.37109375, -0.5947265625, 0.181640625, 0.9580078125, 1.734375, 2.5107421875, 3.287109375, 4.0634765625, 4.83984375, 5.6162109375, 6.392578125, 7.1689453125, 7.9453125, 8.7216796875, 9.498046875, 10.2744140625, 11.05078125, 11.8271484375, 12.603515625, 13.3798828125, 14.15625, 14.9326171875, 15.708984375, 16.4853515625, 17.26171875, 18.0380859375, 18.814453125, 19.5908203125, 20.3671875, 21.1435546875, 21.919921875, 22.6962890625, 23.47265625, 24.2490234375, 25.025390625, 25.8017578125, 26.578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 4.0, 11.0, 2.0, 10.0, 16.0, 9.0, 11.0, 15.0, 22.0, 28.0, 22.0, 31.0, 20.0, 29.0, 23.0, 35.0, 27.0, 42.0, 33.0, 38.0, 48.0, 25.0, 40.0, 46.0, 39.0, 33.0, 37.0, 35.0, 35.0, 31.0, 27.0, 25.0, 27.0, 19.0, 11.0, 26.0, 15.0, 11.0, 11.0, 6.0, 4.0, 4.0, 4.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.6220703125, -17.962890625, -17.3037109375, -16.64453125, -15.9853515625, -15.326171875, -14.6669921875, -14.0078125, -13.3486328125, -12.689453125, -12.0302734375, -11.37109375, -10.7119140625, -10.052734375, -9.3935546875, -8.734375, -8.0751953125, -7.416015625, -6.7568359375, -6.09765625, -5.4384765625, -4.779296875, -4.1201171875, -3.4609375, -2.8017578125, -2.142578125, -1.4833984375, -0.82421875, -0.1650390625, 0.494140625, 1.1533203125, 1.8125, 2.4716796875, 3.130859375, 3.7900390625, 4.44921875, 5.1083984375, 5.767578125, 6.4267578125, 7.0859375, 7.7451171875, 8.404296875, 9.0634765625, 9.72265625, 10.3818359375, 11.041015625, 11.7001953125, 12.359375, 13.0185546875, 13.677734375, 14.3369140625, 14.99609375, 15.6552734375, 16.314453125, 16.9736328125, 17.6328125, 18.2919921875, 18.951171875, 19.6103515625, 20.26953125, 20.9287109375, 21.587890625, 22.2470703125, 22.90625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 2.0, 7.0, 15.0, 20.0, 38.0, 34.0, 63.0, 76.0, 121.0, 204.0, 341.0, 500.0, 827.0, 1379.0, 2357.0, 4477.0, 9272.0, 21494.0, 52216.0, 123762.0, 231871.0, 268864.0, 182349.0, 84570.0, 34505.0, 14589.0, 6460.0, 3396.0, 1859.0, 1063.0, 657.0, 407.0, 281.0, 150.0, 132.0, 73.0, 45.0, 26.0, 20.0, 13.0, 11.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.765625, -24.0634765625, -23.361328125, -22.6591796875, -21.95703125, -21.2548828125, -20.552734375, -19.8505859375, -19.1484375, -18.4462890625, -17.744140625, -17.0419921875, -16.33984375, -15.6376953125, -14.935546875, -14.2333984375, -13.53125, -12.8291015625, -12.126953125, -11.4248046875, -10.72265625, -10.0205078125, -9.318359375, -8.6162109375, -7.9140625, -7.2119140625, -6.509765625, -5.8076171875, -5.10546875, -4.4033203125, -3.701171875, -2.9990234375, -2.296875, -1.5947265625, -0.892578125, -0.1904296875, 0.51171875, 1.2138671875, 1.916015625, 2.6181640625, 3.3203125, 4.0224609375, 4.724609375, 5.4267578125, 6.12890625, 6.8310546875, 7.533203125, 8.2353515625, 8.9375, 9.6396484375, 10.341796875, 11.0439453125, 11.74609375, 12.4482421875, 13.150390625, 13.8525390625, 14.5546875, 15.2568359375, 15.958984375, 16.6611328125, 17.36328125, 18.0654296875, 18.767578125, 19.4697265625, 20.171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 8.0, 13.0, 13.0, 10.0, 27.0, 28.0, 39.0, 44.0, 47.0, 67.0, 64.0, 81.0, 59.0, 80.0, 64.0, 70.0, 58.0, 43.0, 34.0, 25.0, 28.0, 23.0, 14.0, 17.0, 11.0, 7.0, 3.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018367767333984375, -0.0017850697040557861, -0.0017333626747131348, -0.0016816556453704834, -0.001629948616027832, -0.0015782415866851807, -0.0015265345573425293, -0.001474827527999878, -0.0014231204986572266, -0.0013714134693145752, -0.0013197064399719238, -0.0012679994106292725, -0.001216292381286621, -0.0011645853519439697, -0.0011128783226013184, -0.001061171293258667, -0.0010094642639160156, -0.0009577572345733643, -0.0009060502052307129, -0.0008543431758880615, -0.0008026361465454102, -0.0007509291172027588, -0.0006992220878601074, -0.0006475150585174561, -0.0005958080291748047, -0.0005441009998321533, -0.000492393970489502, -0.0004406869411468506, -0.0003889799118041992, -0.00033727288246154785, -0.0002855658531188965, -0.00023385882377624512, -0.00018215179443359375, -0.00013044476509094238, -7.873773574829102e-05, -2.703070640563965e-05, 2.467632293701172e-05, 7.638335227966309e-05, 0.00012809038162231445, 0.00017979741096496582, 0.0002315044403076172, 0.00028321146965026855, 0.0003349184989929199, 0.0003866255283355713, 0.00043833255767822266, 0.000490039587020874, 0.0005417466163635254, 0.0005934536457061768, 0.0006451606750488281, 0.0006968677043914795, 0.0007485747337341309, 0.0008002817630767822, 0.0008519887924194336, 0.000903695821762085, 0.0009554028511047363, 0.0010071098804473877, 0.001058816909790039, 0.0011105239391326904, 0.0011622309684753418, 0.0012139379978179932, 0.0012656450271606445, 0.001317352056503296, 0.0013690590858459473, 0.0014207661151885986, 0.00147247314453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 6.0, 14.0, 20.0, 26.0, 36.0, 62.0, 73.0, 139.0, 215.0, 322.0, 459.0, 680.0, 1050.0, 1549.0, 2364.0, 3803.0, 6120.0, 9759.0, 15717.0, 26101.0, 41600.0, 64423.0, 94072.0, 124207.0, 143367.0, 142286.0, 119838.0, 89428.0, 59488.0, 38281.0, 23715.0, 14480.0, 9069.0, 5557.0, 3573.0, 2274.0, 1494.0, 978.0, 631.0, 428.0, 278.0, 193.0, 132.0, 78.0, 59.0, 34.0, 21.0, 15.0, 19.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.268310546875, -10.90380859375, -10.539306640625, -10.1748046875, -9.810302734375, -9.44580078125, -9.081298828125, -8.716796875, -8.352294921875, -7.98779296875, -7.623291015625, -7.2587890625, -6.894287109375, -6.52978515625, -6.165283203125, -5.80078125, -5.436279296875, -5.07177734375, -4.707275390625, -4.3427734375, -3.978271484375, -3.61376953125, -3.249267578125, -2.884765625, -2.520263671875, -2.15576171875, -1.791259765625, -1.4267578125, -1.062255859375, -0.69775390625, -0.333251953125, 0.03125, 0.395751953125, 0.76025390625, 1.124755859375, 1.4892578125, 1.853759765625, 2.21826171875, 2.582763671875, 2.947265625, 3.311767578125, 3.67626953125, 4.040771484375, 4.4052734375, 4.769775390625, 5.13427734375, 5.498779296875, 5.86328125, 6.227783203125, 6.59228515625, 6.956787109375, 7.3212890625, 7.685791015625, 8.05029296875, 8.414794921875, 8.779296875, 9.143798828125, 9.50830078125, 9.872802734375, 10.2373046875, 10.601806640625, 10.96630859375, 11.330810546875, 11.6953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 12.0, 11.0, 12.0, 17.0, 18.0, 23.0, 25.0, 30.0, 31.0, 34.0, 43.0, 54.0, 47.0, 57.0, 52.0, 38.0, 46.0, 59.0, 50.0, 41.0, 44.0, 47.0, 35.0, 23.0, 23.0, 16.0, 16.0, 13.0, 9.0, 10.0, 7.0, 6.0, 2.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.5546875, -5.401123046875, -5.24755859375, -5.093994140625, -4.9404296875, -4.786865234375, -4.63330078125, -4.479736328125, -4.326171875, -4.172607421875, -4.01904296875, -3.865478515625, -3.7119140625, -3.558349609375, -3.40478515625, -3.251220703125, -3.09765625, -2.944091796875, -2.79052734375, -2.636962890625, -2.4833984375, -2.329833984375, -2.17626953125, -2.022705078125, -1.869140625, -1.715576171875, -1.56201171875, -1.408447265625, -1.2548828125, -1.101318359375, -0.94775390625, -0.794189453125, -0.640625, -0.487060546875, -0.33349609375, -0.179931640625, -0.0263671875, 0.127197265625, 0.28076171875, 0.434326171875, 0.587890625, 0.741455078125, 0.89501953125, 1.048583984375, 1.2021484375, 1.355712890625, 1.50927734375, 1.662841796875, 1.81640625, 1.969970703125, 2.12353515625, 2.277099609375, 2.4306640625, 2.584228515625, 2.73779296875, 2.891357421875, 3.044921875, 3.198486328125, 3.35205078125, 3.505615234375, 3.6591796875, 3.812744140625, 3.96630859375, 4.119873046875, 4.2734375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 7.0, 10.0, 8.0, 14.0, 14.0, 24.0, 31.0, 35.0, 26.0, 41.0, 36.0, 35.0, 60.0, 46.0, 55.0, 49.0, 35.0, 58.0, 47.0, 60.0, 40.0, 36.0, 30.0, 40.0, 27.0, 17.0, 19.0, 13.0, 16.0, 10.0, 10.0, 7.0, 12.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-37.054561614990234, -36.048763275146484, -35.04296112060547, -34.03716278076172, -33.03136444091797, -32.02556610107422, -31.019763946533203, -30.013965606689453, -29.008167266845703, -28.00236701965332, -26.99656867980957, -25.990768432617188, -24.984970092773438, -23.979169845581055, -22.973369598388672, -21.967571258544922, -20.96177101135254, -19.955970764160156, -18.950172424316406, -17.944372177124023, -16.938573837280273, -15.93277359008789, -14.926974296569824, -13.921175003051758, -12.915375709533691, -11.909576416015625, -10.903777122497559, -9.897977828979492, -8.89217758178711, -7.886378765106201, -6.880578994750977, -5.87477970123291, -4.868980407714844, -3.8631811141967773, -2.857381582260132, -1.8515820503234863, -0.8457827568054199, 0.16001653671264648, 1.165816307067871, 2.1716156005859375, 3.177414894104004, 4.18321418762207, 5.189013481140137, 6.194813251495361, 7.200612545013428, 8.206411361694336, 9.212211608886719, 10.218010902404785, 11.223810195922852, 12.229609489440918, 13.235408782958984, 14.241209030151367, 15.247007369995117, 16.2528076171875, 17.25860595703125, 18.264406204223633, 19.270206451416016, 20.2760066986084, 21.28180503845215, 22.28760528564453, 23.29340362548828, 24.299203872680664, 25.305004119873047, 26.310802459716797, 27.316600799560547]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 2.0, 5.0, 5.0, 14.0, 11.0, 17.0, 8.0, 15.0, 24.0, 14.0, 19.0, 23.0, 30.0, 21.0, 28.0, 33.0, 41.0, 37.0, 50.0, 49.0, 44.0, 36.0, 43.0, 42.0, 40.0, 39.0, 36.0, 24.0, 35.0, 33.0, 26.0, 30.0, 16.0, 15.0, 15.0, 16.0, 14.0, 9.0, 6.0, 7.0, 8.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-35.0855827331543, -33.9887580871582, -32.89193344116211, -31.79511070251465, -30.698287963867188, -29.601463317871094, -28.504638671875, -27.40781593322754, -26.310993194580078, -25.214168548583984, -24.117345809936523, -23.02052116394043, -21.92369842529297, -20.826873779296875, -19.73004913330078, -18.63322639465332, -17.536401748657227, -16.439577102661133, -15.342754364013672, -14.245929718017578, -13.149106979370117, -12.052282333374023, -10.955458641052246, -9.858634948730469, -8.761811256408691, -7.664987564086914, -6.568163871765137, -5.471339702606201, -4.374516010284424, -3.2776923179626465, -2.180868148803711, -1.0840444564819336, 0.01277923583984375, 1.1096030473709106, 2.2064268589019775, 3.303250789642334, 4.400074481964111, 5.496898174285889, 6.593722343444824, 7.690546035766602, 8.787369728088379, 9.884193420410156, 10.981017112731934, 12.077840805053711, 13.174665451049805, 14.271488189697266, 15.36831283569336, 16.465137481689453, 17.561960220336914, 18.658784866333008, 19.75560760498047, 20.852432250976562, 21.949254989624023, 23.046079635620117, 24.142902374267578, 25.239727020263672, 26.336551666259766, 27.43337631225586, 28.53019905090332, 29.627023696899414, 30.723846435546875, 31.82067108154297, 32.91749572753906, 34.014320373535156, 35.111141204833984]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 11.0, 22.0, 26.0, 52.0, 92.0, 139.0, 275.0, 431.0, 762.0, 1225.0, 2251.0, 3741.0, 6377.0, 10697.0, 17823.0, 29778.0, 48909.0, 78669.0, 123691.0, 187390.0, 271230.0, 366086.0, 451836.0, 507107.0, 506536.0, 451042.0, 360783.0, 266089.0, 184077.0, 121390.0, 76712.0, 47350.0, 28844.0, 17522.0, 10337.0, 6128.0, 3652.0, 2098.0, 1260.0, 756.0, 458.0, 282.0, 148.0, 86.0, 47.0, 27.0, 23.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.786865234375, -22.02685546875, -21.266845703125, -20.5068359375, -19.746826171875, -18.98681640625, -18.226806640625, -17.466796875, -16.706787109375, -15.94677734375, -15.186767578125, -14.4267578125, -13.666748046875, -12.90673828125, -12.146728515625, -11.38671875, -10.626708984375, -9.86669921875, -9.106689453125, -8.3466796875, -7.586669921875, -6.82666015625, -6.066650390625, -5.306640625, -4.546630859375, -3.78662109375, -3.026611328125, -2.2666015625, -1.506591796875, -0.74658203125, 0.013427734375, 0.7734375, 1.533447265625, 2.29345703125, 3.053466796875, 3.8134765625, 4.573486328125, 5.33349609375, 6.093505859375, 6.853515625, 7.613525390625, 8.37353515625, 9.133544921875, 9.8935546875, 10.653564453125, 11.41357421875, 12.173583984375, 12.93359375, 13.693603515625, 14.45361328125, 15.213623046875, 15.9736328125, 16.733642578125, 17.49365234375, 18.253662109375, 19.013671875, 19.773681640625, 20.53369140625, 21.293701171875, 22.0537109375, 22.813720703125, 23.57373046875, 24.333740234375, 25.09375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 10.0, 14.0, 10.0, 8.0, 14.0, 20.0, 14.0, 18.0, 19.0, 21.0, 28.0, 33.0, 31.0, 26.0, 40.0, 36.0, 37.0, 56.0, 44.0, 50.0, 39.0, 45.0, 44.0, 36.0, 30.0, 32.0, 44.0, 21.0, 26.0, 24.0, 21.0, 26.0, 13.0, 13.0, 10.0, 10.0, 5.0, 6.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.453125, -30.562744140625, -29.67236328125, -28.781982421875, -27.8916015625, -27.001220703125, -26.11083984375, -25.220458984375, -24.330078125, -23.439697265625, -22.54931640625, -21.658935546875, -20.7685546875, -19.878173828125, -18.98779296875, -18.097412109375, -17.20703125, -16.316650390625, -15.42626953125, -14.535888671875, -13.6455078125, -12.755126953125, -11.86474609375, -10.974365234375, -10.083984375, -9.193603515625, -8.30322265625, -7.412841796875, -6.5224609375, -5.632080078125, -4.74169921875, -3.851318359375, -2.9609375, -2.070556640625, -1.18017578125, -0.289794921875, 0.6005859375, 1.490966796875, 2.38134765625, 3.271728515625, 4.162109375, 5.052490234375, 5.94287109375, 6.833251953125, 7.7236328125, 8.614013671875, 9.50439453125, 10.394775390625, 11.28515625, 12.175537109375, 13.06591796875, 13.956298828125, 14.8466796875, 15.737060546875, 16.62744140625, 17.517822265625, 18.408203125, 19.298583984375, 20.18896484375, 21.079345703125, 21.9697265625, 22.860107421875, 23.75048828125, 24.640869140625, 25.53125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 3.0, 15.0, 30.0, 40.0, 65.0, 114.0, 157.0, 290.0, 488.0, 759.0, 1288.0, 2045.0, 3232.0, 5286.0, 8156.0, 12683.0, 19413.0, 29535.0, 43795.0, 63950.0, 90407.0, 126574.0, 168791.0, 218043.0, 271050.0, 320028.0, 359007.0, 379377.0, 376799.0, 353851.0, 314721.0, 263808.0, 211216.0, 162102.0, 120669.0, 86585.0, 60118.0, 41101.0, 27670.0, 18379.0, 11908.0, 7569.0, 4943.0, 3112.0, 1918.0, 1203.0, 773.0, 459.0, 260.0, 195.0, 110.0, 72.0, 58.0, 25.0, 21.0, 9.0, 9.0, 8.0, 1.0, 0.0, 2.0], "bins": [-18.9375, -18.3251953125, -17.712890625, -17.1005859375, -16.48828125, -15.8759765625, -15.263671875, -14.6513671875, -14.0390625, -13.4267578125, -12.814453125, -12.2021484375, -11.58984375, -10.9775390625, -10.365234375, -9.7529296875, -9.140625, -8.5283203125, -7.916015625, -7.3037109375, -6.69140625, -6.0791015625, -5.466796875, -4.8544921875, -4.2421875, -3.6298828125, -3.017578125, -2.4052734375, -1.79296875, -1.1806640625, -0.568359375, 0.0439453125, 0.65625, 1.2685546875, 1.880859375, 2.4931640625, 3.10546875, 3.7177734375, 4.330078125, 4.9423828125, 5.5546875, 6.1669921875, 6.779296875, 7.3916015625, 8.00390625, 8.6162109375, 9.228515625, 9.8408203125, 10.453125, 11.0654296875, 11.677734375, 12.2900390625, 12.90234375, 13.5146484375, 14.126953125, 14.7392578125, 15.3515625, 15.9638671875, 16.576171875, 17.1884765625, 17.80078125, 18.4130859375, 19.025390625, 19.6376953125, 20.25]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 8.0, 5.0, 6.0, 8.0, 16.0, 14.0, 13.0, 20.0, 27.0, 19.0, 44.0, 54.0, 50.0, 63.0, 74.0, 100.0, 95.0, 107.0, 129.0, 137.0, 163.0, 143.0, 161.0, 184.0, 173.0, 188.0, 188.0, 166.0, 175.0, 174.0, 148.0, 145.0, 152.0, 133.0, 121.0, 102.0, 93.0, 79.0, 60.0, 74.0, 54.0, 40.0, 38.0, 31.0, 19.0, 14.0, 17.0, 12.0, 10.0, 9.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-10.375, -10.029296875, -9.68359375, -9.337890625, -8.9921875, -8.646484375, -8.30078125, -7.955078125, -7.609375, -7.263671875, -6.91796875, -6.572265625, -6.2265625, -5.880859375, -5.53515625, -5.189453125, -4.84375, -4.498046875, -4.15234375, -3.806640625, -3.4609375, -3.115234375, -2.76953125, -2.423828125, -2.078125, -1.732421875, -1.38671875, -1.041015625, -0.6953125, -0.349609375, -0.00390625, 0.341796875, 0.6875, 1.033203125, 1.37890625, 1.724609375, 2.0703125, 2.416015625, 2.76171875, 3.107421875, 3.453125, 3.798828125, 4.14453125, 4.490234375, 4.8359375, 5.181640625, 5.52734375, 5.873046875, 6.21875, 6.564453125, 6.91015625, 7.255859375, 7.6015625, 7.947265625, 8.29296875, 8.638671875, 8.984375, 9.330078125, 9.67578125, 10.021484375, 10.3671875, 10.712890625, 11.05859375, 11.404296875, 11.75]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 8.0, 11.0, 8.0, 15.0, 21.0, 25.0, 22.0, 30.0, 31.0, 34.0, 28.0, 48.0, 36.0, 42.0, 37.0, 37.0, 58.0, 46.0, 46.0, 37.0, 42.0, 34.0, 42.0, 36.0, 33.0, 26.0, 26.0, 12.0, 22.0, 14.0, 21.0, 11.0, 13.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-28.06747817993164, -27.208215713500977, -26.34895133972168, -25.489688873291016, -24.63042449951172, -23.771162033081055, -22.91189956665039, -22.052635192871094, -21.193370819091797, -20.334108352661133, -19.474843978881836, -18.615581512451172, -17.756317138671875, -16.89705467224121, -16.037792205810547, -15.17852783203125, -14.319265365600586, -13.460001945495605, -12.600738525390625, -11.741476058959961, -10.882211685180664, -10.02294921875, -9.16368579864502, -8.304422378540039, -7.445158958435059, -6.585895538330078, -5.726632118225098, -4.867369174957275, -4.008105754852295, -3.1488423347473145, -2.289579391479492, -1.4303159713745117, -0.5710506439208984, 0.2882126569747925, 1.1474759578704834, 2.0067391395568848, 2.8660025596618652, 3.7252659797668457, 4.584528923034668, 5.443792343139648, 6.303055763244629, 7.162319183349609, 8.02158260345459, 8.88084602355957, 9.740108489990234, 10.599372863769531, 11.458635330200195, 12.317898750305176, 13.177162170410156, 14.036425590515137, 14.895689010620117, 15.754951477050781, 16.614215850830078, 17.473478317260742, 18.332740783691406, 19.192005157470703, 20.05126953125, 20.910531997680664, 21.76979637145996, 22.629058837890625, 23.488323211669922, 24.347585678100586, 25.20684814453125, 26.066112518310547, 26.92537498474121]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 10.0, 12.0, 16.0, 13.0, 15.0, 20.0, 26.0, 22.0, 19.0, 23.0, 29.0, 34.0, 33.0, 41.0, 53.0, 41.0, 46.0, 46.0, 28.0, 40.0, 43.0, 36.0, 41.0, 38.0, 42.0, 22.0, 23.0, 27.0, 16.0, 20.0, 19.0, 19.0, 13.0, 17.0, 12.0, 10.0, 7.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-30.571224212646484, -29.551654815673828, -28.532087326049805, -27.51251792907715, -26.492950439453125, -25.47338104248047, -24.453811645507812, -23.434242248535156, -22.414674758911133, -21.395105361938477, -20.375537872314453, -19.355968475341797, -18.33639907836914, -17.316831588745117, -16.29726219177246, -15.277693748474121, -14.258125305175781, -13.238556861877441, -12.218988418579102, -11.199419021606445, -10.179850578308105, -9.160282135009766, -8.14071273803711, -7.1211442947387695, -6.10157585144043, -5.08200740814209, -4.062438488006592, -3.042869806289673, -2.023301124572754, -1.003732681274414, 0.015836238861083984, 1.035405158996582, 2.0549697875976562, 3.074538469314575, 4.094107151031494, 5.113676071166992, 6.133244514465332, 7.152812957763672, 8.172382354736328, 9.191950798034668, 10.211519241333008, 11.231087684631348, 12.250656127929688, 13.270225524902344, 14.289793968200684, 15.309362411499023, 16.32893180847168, 17.348499298095703, 18.36806869506836, 19.387638092041016, 20.40720558166504, 21.426774978637695, 22.44634246826172, 23.465911865234375, 24.48548126220703, 25.505050659179688, 26.52461814880371, 27.544187545776367, 28.56375503540039, 29.583324432373047, 30.602893829345703, 31.622461318969727, 32.64202880859375, 33.661598205566406, 34.68116760253906]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 10.0, 11.0, 21.0, 43.0, 67.0, 141.0, 211.0, 365.0, 552.0, 1050.0, 1674.0, 2961.0, 4611.0, 7658.0, 12484.0, 19685.0, 31316.0, 49527.0, 74296.0, 104274.0, 132962.0, 146877.0, 134860.0, 107550.0, 76971.0, 51402.0, 32873.0, 21136.0, 12891.0, 7849.0, 4751.0, 3021.0, 1829.0, 1067.0, 613.0, 379.0, 206.0, 141.0, 90.0, 57.0, 30.0, 17.0, 14.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.8203125, -8.5789794921875, -8.337646484375, -8.0963134765625, -7.85498046875, -7.6136474609375, -7.372314453125, -7.1309814453125, -6.8896484375, -6.6483154296875, -6.406982421875, -6.1656494140625, -5.92431640625, -5.6829833984375, -5.441650390625, -5.2003173828125, -4.958984375, -4.7176513671875, -4.476318359375, -4.2349853515625, -3.99365234375, -3.7523193359375, -3.510986328125, -3.2696533203125, -3.0283203125, -2.7869873046875, -2.545654296875, -2.3043212890625, -2.06298828125, -1.8216552734375, -1.580322265625, -1.3389892578125, -1.09765625, -0.8563232421875, -0.614990234375, -0.3736572265625, -0.13232421875, 0.1090087890625, 0.350341796875, 0.5916748046875, 0.8330078125, 1.0743408203125, 1.315673828125, 1.5570068359375, 1.79833984375, 2.0396728515625, 2.281005859375, 2.5223388671875, 2.763671875, 3.0050048828125, 3.246337890625, 3.4876708984375, 3.72900390625, 3.9703369140625, 4.211669921875, 4.4530029296875, 4.6943359375, 4.9356689453125, 5.177001953125, 5.4183349609375, 5.65966796875, 5.9010009765625, 6.142333984375, 6.3836669921875, 6.625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 7.0, 17.0, 20.0, 12.0, 18.0, 17.0, 25.0, 25.0, 27.0, 32.0, 37.0, 32.0, 33.0, 41.0, 37.0, 37.0, 54.0, 38.0, 42.0, 40.0, 38.0, 35.0, 37.0, 42.0, 33.0, 32.0, 22.0, 26.0, 18.0, 22.0, 19.0, 14.0, 16.0, 7.0, 10.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.46875, -31.39794921875, -30.3271484375, -29.25634765625, -28.185546875, -27.11474609375, -26.0439453125, -24.97314453125, -23.90234375, -22.83154296875, -21.7607421875, -20.68994140625, -19.619140625, -18.54833984375, -17.4775390625, -16.40673828125, -15.3359375, -14.26513671875, -13.1943359375, -12.12353515625, -11.052734375, -9.98193359375, -8.9111328125, -7.84033203125, -6.76953125, -5.69873046875, -4.6279296875, -3.55712890625, -2.486328125, -1.41552734375, -0.3447265625, 0.72607421875, 1.796875, 2.86767578125, 3.9384765625, 5.00927734375, 6.080078125, 7.15087890625, 8.2216796875, 9.29248046875, 10.36328125, 11.43408203125, 12.5048828125, 13.57568359375, 14.646484375, 15.71728515625, 16.7880859375, 17.85888671875, 18.9296875, 20.00048828125, 21.0712890625, 22.14208984375, 23.212890625, 24.28369140625, 25.3544921875, 26.42529296875, 27.49609375, 28.56689453125, 29.6376953125, 30.70849609375, 31.779296875, 32.85009765625, 33.9208984375, 34.99169921875, 36.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 7.0, 18.0, 37.0, 39.0, 65.0, 118.0, 185.0, 344.0, 544.0, 1020.0, 1756.0, 3340.0, 6209.0, 11754.0, 22525.0, 41792.0, 76088.0, 126670.0, 179112.0, 194965.0, 156227.0, 101156.0, 58162.0, 31001.0, 16516.0, 8583.0, 4554.0, 2480.0, 1354.0, 785.0, 430.0, 266.0, 167.0, 102.0, 57.0, 40.0, 25.0, 18.0, 11.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1171875, -6.88201904296875, -6.6468505859375, -6.41168212890625, -6.176513671875, -5.94134521484375, -5.7061767578125, -5.47100830078125, -5.23583984375, -5.00067138671875, -4.7655029296875, -4.53033447265625, -4.295166015625, -4.05999755859375, -3.8248291015625, -3.58966064453125, -3.3544921875, -3.11932373046875, -2.8841552734375, -2.64898681640625, -2.413818359375, -2.17864990234375, -1.9434814453125, -1.70831298828125, -1.47314453125, -1.23797607421875, -1.0028076171875, -0.76763916015625, -0.532470703125, -0.29730224609375, -0.0621337890625, 0.17303466796875, 0.408203125, 0.64337158203125, 0.8785400390625, 1.11370849609375, 1.348876953125, 1.58404541015625, 1.8192138671875, 2.05438232421875, 2.28955078125, 2.52471923828125, 2.7598876953125, 2.99505615234375, 3.230224609375, 3.46539306640625, 3.7005615234375, 3.93572998046875, 4.1708984375, 4.40606689453125, 4.6412353515625, 4.87640380859375, 5.111572265625, 5.34674072265625, 5.5819091796875, 5.81707763671875, 6.05224609375, 6.28741455078125, 6.5225830078125, 6.75775146484375, 6.992919921875, 7.22808837890625, 7.4632568359375, 7.69842529296875, 7.93359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 8.0, 8.0, 12.0, 8.0, 16.0, 21.0, 18.0, 16.0, 30.0, 24.0, 31.0, 28.0, 31.0, 35.0, 36.0, 45.0, 51.0, 47.0, 36.0, 57.0, 42.0, 50.0, 39.0, 48.0, 38.0, 39.0, 25.0, 16.0, 29.0, 19.0, 15.0, 13.0, 10.0, 15.0, 8.0, 11.0, 2.0, 3.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.147216796875, -21.38818359375, -20.629150390625, -19.8701171875, -19.111083984375, -18.35205078125, -17.593017578125, -16.833984375, -16.074951171875, -15.31591796875, -14.556884765625, -13.7978515625, -13.038818359375, -12.27978515625, -11.520751953125, -10.76171875, -10.002685546875, -9.24365234375, -8.484619140625, -7.7255859375, -6.966552734375, -6.20751953125, -5.448486328125, -4.689453125, -3.930419921875, -3.17138671875, -2.412353515625, -1.6533203125, -0.894287109375, -0.13525390625, 0.623779296875, 1.3828125, 2.141845703125, 2.90087890625, 3.659912109375, 4.4189453125, 5.177978515625, 5.93701171875, 6.696044921875, 7.455078125, 8.214111328125, 8.97314453125, 9.732177734375, 10.4912109375, 11.250244140625, 12.00927734375, 12.768310546875, 13.52734375, 14.286376953125, 15.04541015625, 15.804443359375, 16.5634765625, 17.322509765625, 18.08154296875, 18.840576171875, 19.599609375, 20.358642578125, 21.11767578125, 21.876708984375, 22.6357421875, 23.394775390625, 24.15380859375, 24.912841796875, 25.671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 15.0, 13.0, 16.0, 25.0, 39.0, 34.0, 35.0, 83.0, 110.0, 144.0, 190.0, 271.0, 459.0, 618.0, 990.0, 1561.0, 2779.0, 4893.0, 9479.0, 19836.0, 46339.0, 116502.0, 268672.0, 312474.0, 151571.0, 60400.0, 25081.0, 11606.0, 5868.0, 3160.0, 1856.0, 1076.0, 714.0, 492.0, 335.0, 217.0, 147.0, 128.0, 78.0, 68.0, 48.0, 28.0, 17.0, 24.0, 15.0, 9.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.87109375, -2.781768798828125, -2.69244384765625, -2.603118896484375, -2.5137939453125, -2.424468994140625, -2.33514404296875, -2.245819091796875, -2.156494140625, -2.067169189453125, -1.97784423828125, -1.888519287109375, -1.7991943359375, -1.709869384765625, -1.62054443359375, -1.531219482421875, -1.44189453125, -1.352569580078125, -1.26324462890625, -1.173919677734375, -1.0845947265625, -0.995269775390625, -0.90594482421875, -0.816619873046875, -0.727294921875, -0.637969970703125, -0.54864501953125, -0.459320068359375, -0.3699951171875, -0.280670166015625, -0.19134521484375, -0.102020263671875, -0.0126953125, 0.076629638671875, 0.16595458984375, 0.255279541015625, 0.3446044921875, 0.433929443359375, 0.52325439453125, 0.612579345703125, 0.701904296875, 0.791229248046875, 0.88055419921875, 0.969879150390625, 1.0592041015625, 1.148529052734375, 1.23785400390625, 1.327178955078125, 1.41650390625, 1.505828857421875, 1.59515380859375, 1.684478759765625, 1.7738037109375, 1.863128662109375, 1.95245361328125, 2.041778564453125, 2.131103515625, 2.220428466796875, 2.30975341796875, 2.399078369140625, 2.4884033203125, 2.577728271484375, 2.66705322265625, 2.756378173828125, 2.845703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 1.0, 6.0, 11.0, 9.0, 10.0, 15.0, 19.0, 22.0, 29.0, 29.0, 44.0, 51.0, 52.0, 73.0, 77.0, 82.0, 73.0, 76.0, 63.0, 57.0, 37.0, 50.0, 28.0, 25.0, 13.0, 10.0, 11.0, 4.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00042939186096191406, -0.00041761621832847595, -0.00040584057569503784, -0.00039406493306159973, -0.0003822892904281616, -0.0003705136477947235, -0.0003587380051612854, -0.0003469623625278473, -0.0003351867198944092, -0.00032341107726097107, -0.00031163543462753296, -0.00029985979199409485, -0.00028808414936065674, -0.00027630850672721863, -0.0002645328640937805, -0.0002527572214603424, -0.0002409815788269043, -0.0002292059361934662, -0.00021743029356002808, -0.00020565465092658997, -0.00019387900829315186, -0.00018210336565971375, -0.00017032772302627563, -0.00015855208039283752, -0.00014677643775939941, -0.0001350007951259613, -0.0001232251524925232, -0.00011144950985908508, -9.967386722564697e-05, -8.789822459220886e-05, -7.612258195877075e-05, -6.434693932533264e-05, -5.257129669189453e-05, -4.079565405845642e-05, -2.902001142501831e-05, -1.72443687915802e-05, -5.46872615814209e-06, 6.3069164752960205e-06, 1.808255910873413e-05, 2.985820174217224e-05, 4.163384437561035e-05, 5.340948700904846e-05, 6.518512964248657e-05, 7.696077227592468e-05, 8.873641490936279e-05, 0.0001005120575428009, 0.00011228770017623901, 0.00012406334280967712, 0.00013583898544311523, 0.00014761462807655334, 0.00015939027070999146, 0.00017116591334342957, 0.00018294155597686768, 0.00019471719861030579, 0.0002064928412437439, 0.000218268483877182, 0.00023004412651062012, 0.00024181976914405823, 0.00025359541177749634, 0.00026537105441093445, 0.00027714669704437256, 0.00028892233967781067, 0.0003006979823112488, 0.0003124736249446869, 0.000324249267578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 10.0, 6.0, 11.0, 13.0, 21.0, 33.0, 46.0, 59.0, 86.0, 83.0, 159.0, 228.0, 342.0, 468.0, 661.0, 972.0, 1347.0, 2018.0, 3084.0, 4873.0, 7765.0, 12549.0, 21151.0, 37565.0, 68089.0, 121573.0, 195052.0, 217249.0, 150890.0, 86279.0, 47539.0, 26492.0, 15289.0, 9181.0, 5785.0, 3682.0, 2503.0, 1607.0, 1184.0, 756.0, 537.0, 393.0, 298.0, 198.0, 138.0, 96.0, 58.0, 48.0, 32.0, 19.0, 9.0, 10.0, 8.0, 7.0, 6.0, 2.0], "bins": [-4.2421875, -4.121673583984375, -4.00115966796875, -3.880645751953125, -3.7601318359375, -3.639617919921875, -3.51910400390625, -3.398590087890625, -3.278076171875, -3.157562255859375, -3.03704833984375, -2.916534423828125, -2.7960205078125, -2.675506591796875, -2.55499267578125, -2.434478759765625, -2.31396484375, -2.193450927734375, -2.07293701171875, -1.952423095703125, -1.8319091796875, -1.711395263671875, -1.59088134765625, -1.470367431640625, -1.349853515625, -1.229339599609375, -1.10882568359375, -0.988311767578125, -0.8677978515625, -0.747283935546875, -0.62677001953125, -0.506256103515625, -0.3857421875, -0.265228271484375, -0.14471435546875, -0.024200439453125, 0.0963134765625, 0.216827392578125, 0.33734130859375, 0.457855224609375, 0.578369140625, 0.698883056640625, 0.81939697265625, 0.939910888671875, 1.0604248046875, 1.180938720703125, 1.30145263671875, 1.421966552734375, 1.54248046875, 1.662994384765625, 1.78350830078125, 1.904022216796875, 2.0245361328125, 2.145050048828125, 2.26556396484375, 2.386077880859375, 2.506591796875, 2.627105712890625, 2.74761962890625, 2.868133544921875, 2.9886474609375, 3.109161376953125, 3.22967529296875, 3.350189208984375, 3.470703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 10.0, 13.0, 20.0, 20.0, 27.0, 39.0, 40.0, 51.0, 62.0, 66.0, 81.0, 80.0, 82.0, 69.0, 61.0, 44.0, 54.0, 34.0, 25.0, 26.0, 13.0, 17.0, 14.0, 9.0, 3.0, 13.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.427734375, -1.379791259765625, -1.33184814453125, -1.283905029296875, -1.2359619140625, -1.188018798828125, -1.14007568359375, -1.092132568359375, -1.044189453125, -0.996246337890625, -0.94830322265625, -0.900360107421875, -0.8524169921875, -0.804473876953125, -0.75653076171875, -0.708587646484375, -0.66064453125, -0.612701416015625, -0.56475830078125, -0.516815185546875, -0.4688720703125, -0.420928955078125, -0.37298583984375, -0.325042724609375, -0.277099609375, -0.229156494140625, -0.18121337890625, -0.133270263671875, -0.0853271484375, -0.037384033203125, 0.01055908203125, 0.058502197265625, 0.1064453125, 0.154388427734375, 0.20233154296875, 0.250274658203125, 0.2982177734375, 0.346160888671875, 0.39410400390625, 0.442047119140625, 0.489990234375, 0.537933349609375, 0.58587646484375, 0.633819580078125, 0.6817626953125, 0.729705810546875, 0.77764892578125, 0.825592041015625, 0.87353515625, 0.921478271484375, 0.96942138671875, 1.017364501953125, 1.0653076171875, 1.113250732421875, 1.16119384765625, 1.209136962890625, 1.257080078125, 1.305023193359375, 1.35296630859375, 1.400909423828125, 1.4488525390625, 1.496795654296875, 1.54473876953125, 1.592681884765625, 1.640625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 10.0, 7.0, 7.0, 7.0, 11.0, 9.0, 19.0, 20.0, 28.0, 22.0, 31.0, 38.0, 39.0, 38.0, 46.0, 36.0, 39.0, 45.0, 52.0, 34.0, 51.0, 47.0, 38.0, 40.0, 34.0, 46.0, 25.0, 29.0, 32.0, 20.0, 14.0, 14.0, 21.0, 13.0, 5.0, 11.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-29.735157012939453, -28.855043411254883, -27.974929809570312, -27.094816207885742, -26.214702606201172, -25.3345890045166, -24.45447540283203, -23.57436180114746, -22.69424819946289, -21.81413459777832, -20.93402099609375, -20.05390739440918, -19.17379379272461, -18.29368019104004, -17.41356658935547, -16.5334529876709, -15.653340339660645, -14.773226737976074, -13.893113136291504, -13.012999534606934, -12.132885932922363, -11.25277328491211, -10.372659683227539, -9.492546081542969, -8.612432479858398, -7.732318878173828, -6.852205276489258, -5.9720916748046875, -5.091978073120117, -4.211864948272705, -3.3317513465881348, -2.4516377449035645, -1.571523666381836, -0.6914101243019104, 0.18870341777801514, 1.068816900253296, 1.9489305019378662, 2.8290438652038574, 3.7091574668884277, 4.589271068572998, 5.469384670257568, 6.349498271942139, 7.229611873626709, 8.109724998474121, 8.989838600158691, 9.869952201843262, 10.750065803527832, 11.630179405212402, 12.510293006896973, 13.390406608581543, 14.270520210266113, 15.150633811950684, 16.030746459960938, 16.910860061645508, 17.790973663330078, 18.67108726501465, 19.55120086669922, 20.43131446838379, 21.31142807006836, 22.19154167175293, 23.0716552734375, 23.95176887512207, 24.83188247680664, 25.71199607849121, 26.59210968017578]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 8.0, 8.0, 13.0, 16.0, 12.0, 12.0, 20.0, 27.0, 22.0, 21.0, 19.0, 33.0, 33.0, 28.0, 38.0, 49.0, 47.0, 37.0, 53.0, 26.0, 41.0, 47.0, 36.0, 37.0, 43.0, 35.0, 33.0, 21.0, 22.0, 20.0, 21.0, 18.0, 17.0, 20.0, 14.0, 11.0, 9.0, 7.0, 12.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-30.27671241760254, -29.27250862121582, -28.268306732177734, -27.264102935791016, -26.259899139404297, -25.25569725036621, -24.251493453979492, -23.247291564941406, -22.243087768554688, -21.23888397216797, -20.234682083129883, -19.230478286743164, -18.226276397705078, -17.22207260131836, -16.21786880493164, -15.213665962219238, -14.209463119506836, -13.205260276794434, -12.201057434082031, -11.196853637695312, -10.19265079498291, -9.188447952270508, -8.184244155883789, -7.180041313171387, -6.175838470458984, -5.171635627746582, -4.1674323081970215, -3.16322922706604, -2.1590261459350586, -1.1548233032226562, -0.1506199836730957, 0.8535833358764648, 1.8577842712402344, 2.861987352371216, 3.8661904335021973, 4.870393753051758, 5.87459659576416, 6.8787994384765625, 7.883002758026123, 8.887206077575684, 9.891408920288086, 10.895611763000488, 11.89981460571289, 12.90401840209961, 13.908221244812012, 14.912424087524414, 15.916627883911133, 16.92082977294922, 17.925033569335938, 18.929237365722656, 19.933439254760742, 20.93764305114746, 21.941844940185547, 22.946048736572266, 23.950252532958984, 24.954456329345703, 25.95865821838379, 26.962862014770508, 27.967063903808594, 28.971267700195312, 29.97547149658203, 30.979673385620117, 31.983877182006836, 32.98807907104492, 33.99228286743164]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 7.0, 14.0, 21.0, 34.0, 62.0, 76.0, 133.0, 215.0, 335.0, 537.0, 763.0, 1244.0, 2032.0, 3066.0, 4731.0, 7131.0, 10785.0, 15793.0, 22746.0, 31818.0, 43320.0, 55669.0, 69277.0, 81762.0, 91040.0, 96755.0, 95439.0, 88750.0, 78096.0, 65223.0, 51544.0, 39279.0, 28948.0, 20526.0, 14074.0, 9506.0, 6247.0, 4141.0, 2628.0, 1757.0, 1114.0, 671.0, 448.0, 303.0, 177.0, 102.0, 90.0, 43.0, 23.0, 20.0, 17.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-20.703125, -20.052978515625, -19.40283203125, -18.752685546875, -18.1025390625, -17.452392578125, -16.80224609375, -16.152099609375, -15.501953125, -14.851806640625, -14.20166015625, -13.551513671875, -12.9013671875, -12.251220703125, -11.60107421875, -10.950927734375, -10.30078125, -9.650634765625, -9.00048828125, -8.350341796875, -7.7001953125, -7.050048828125, -6.39990234375, -5.749755859375, -5.099609375, -4.449462890625, -3.79931640625, -3.149169921875, -2.4990234375, -1.848876953125, -1.19873046875, -0.548583984375, 0.1015625, 0.751708984375, 1.40185546875, 2.052001953125, 2.7021484375, 3.352294921875, 4.00244140625, 4.652587890625, 5.302734375, 5.952880859375, 6.60302734375, 7.253173828125, 7.9033203125, 8.553466796875, 9.20361328125, 9.853759765625, 10.50390625, 11.154052734375, 11.80419921875, 12.454345703125, 13.1044921875, 13.754638671875, 14.40478515625, 15.054931640625, 15.705078125, 16.355224609375, 17.00537109375, 17.655517578125, 18.3056640625, 18.955810546875, 19.60595703125, 20.256103515625, 20.90625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 14.0, 15.0, 11.0, 16.0, 16.0, 21.0, 18.0, 26.0, 26.0, 29.0, 18.0, 33.0, 39.0, 42.0, 45.0, 50.0, 51.0, 40.0, 43.0, 37.0, 36.0, 37.0, 28.0, 38.0, 36.0, 27.0, 24.0, 22.0, 33.0, 26.0, 18.0, 12.0, 13.0, 16.0, 6.0, 8.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.953125, -29.938232421875, -28.92333984375, -27.908447265625, -26.8935546875, -25.878662109375, -24.86376953125, -23.848876953125, -22.833984375, -21.819091796875, -20.80419921875, -19.789306640625, -18.7744140625, -17.759521484375, -16.74462890625, -15.729736328125, -14.71484375, -13.699951171875, -12.68505859375, -11.670166015625, -10.6552734375, -9.640380859375, -8.62548828125, -7.610595703125, -6.595703125, -5.580810546875, -4.56591796875, -3.551025390625, -2.5361328125, -1.521240234375, -0.50634765625, 0.508544921875, 1.5234375, 2.538330078125, 3.55322265625, 4.568115234375, 5.5830078125, 6.597900390625, 7.61279296875, 8.627685546875, 9.642578125, 10.657470703125, 11.67236328125, 12.687255859375, 13.7021484375, 14.717041015625, 15.73193359375, 16.746826171875, 17.76171875, 18.776611328125, 19.79150390625, 20.806396484375, 21.8212890625, 22.836181640625, 23.85107421875, 24.865966796875, 25.880859375, 26.895751953125, 27.91064453125, 28.925537109375, 29.9404296875, 30.955322265625, 31.97021484375, 32.985107421875, 34.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 14.0, 31.0, 34.0, 72.0, 96.0, 189.0, 324.0, 508.0, 889.0, 1456.0, 2438.0, 4093.0, 6356.0, 10204.0, 16118.0, 24820.0, 37724.0, 53766.0, 71963.0, 91136.0, 106023.0, 114890.0, 113265.0, 101870.0, 85214.0, 65899.0, 47194.0, 33198.0, 21692.0, 14237.0, 8679.0, 5519.0, 3498.0, 2050.0, 1252.0, 711.0, 420.0, 280.0, 165.0, 97.0, 60.0, 35.0, 14.0, 19.0, 11.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.421875, -23.6298828125, -22.837890625, -22.0458984375, -21.25390625, -20.4619140625, -19.669921875, -18.8779296875, -18.0859375, -17.2939453125, -16.501953125, -15.7099609375, -14.91796875, -14.1259765625, -13.333984375, -12.5419921875, -11.75, -10.9580078125, -10.166015625, -9.3740234375, -8.58203125, -7.7900390625, -6.998046875, -6.2060546875, -5.4140625, -4.6220703125, -3.830078125, -3.0380859375, -2.24609375, -1.4541015625, -0.662109375, 0.1298828125, 0.921875, 1.7138671875, 2.505859375, 3.2978515625, 4.08984375, 4.8818359375, 5.673828125, 6.4658203125, 7.2578125, 8.0498046875, 8.841796875, 9.6337890625, 10.42578125, 11.2177734375, 12.009765625, 12.8017578125, 13.59375, 14.3857421875, 15.177734375, 15.9697265625, 16.76171875, 17.5537109375, 18.345703125, 19.1376953125, 19.9296875, 20.7216796875, 21.513671875, 22.3056640625, 23.09765625, 23.8896484375, 24.681640625, 25.4736328125, 26.265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 7.0, 11.0, 7.0, 7.0, 7.0, 19.0, 19.0, 14.0, 26.0, 12.0, 34.0, 19.0, 33.0, 30.0, 38.0, 32.0, 44.0, 34.0, 26.0, 30.0, 43.0, 46.0, 49.0, 38.0, 33.0, 44.0, 39.0, 26.0, 26.0, 29.0, 21.0, 26.0, 19.0, 15.0, 15.0, 19.0, 9.0, 7.0, 6.0, 7.0, 6.0, 7.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0], "bins": [-22.828125, -22.19921875, -21.5703125, -20.94140625, -20.3125, -19.68359375, -19.0546875, -18.42578125, -17.796875, -17.16796875, -16.5390625, -15.91015625, -15.28125, -14.65234375, -14.0234375, -13.39453125, -12.765625, -12.13671875, -11.5078125, -10.87890625, -10.25, -9.62109375, -8.9921875, -8.36328125, -7.734375, -7.10546875, -6.4765625, -5.84765625, -5.21875, -4.58984375, -3.9609375, -3.33203125, -2.703125, -2.07421875, -1.4453125, -0.81640625, -0.1875, 0.44140625, 1.0703125, 1.69921875, 2.328125, 2.95703125, 3.5859375, 4.21484375, 4.84375, 5.47265625, 6.1015625, 6.73046875, 7.359375, 7.98828125, 8.6171875, 9.24609375, 9.875, 10.50390625, 11.1328125, 11.76171875, 12.390625, 13.01953125, 13.6484375, 14.27734375, 14.90625, 15.53515625, 16.1640625, 16.79296875, 17.421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 11.0, 11.0, 25.0, 29.0, 43.0, 56.0, 77.0, 113.0, 146.0, 235.0, 353.0, 594.0, 1069.0, 1849.0, 3391.0, 6785.0, 14911.0, 35909.0, 94753.0, 221059.0, 308475.0, 209476.0, 87716.0, 33695.0, 13806.0, 6460.0, 3187.0, 1666.0, 1017.0, 588.0, 333.0, 232.0, 124.0, 85.0, 53.0, 48.0, 40.0, 27.0, 21.0, 20.0, 9.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.953125, -25.10107421875, -24.2490234375, -23.39697265625, -22.544921875, -21.69287109375, -20.8408203125, -19.98876953125, -19.13671875, -18.28466796875, -17.4326171875, -16.58056640625, -15.728515625, -14.87646484375, -14.0244140625, -13.17236328125, -12.3203125, -11.46826171875, -10.6162109375, -9.76416015625, -8.912109375, -8.06005859375, -7.2080078125, -6.35595703125, -5.50390625, -4.65185546875, -3.7998046875, -2.94775390625, -2.095703125, -1.24365234375, -0.3916015625, 0.46044921875, 1.3125, 2.16455078125, 3.0166015625, 3.86865234375, 4.720703125, 5.57275390625, 6.4248046875, 7.27685546875, 8.12890625, 8.98095703125, 9.8330078125, 10.68505859375, 11.537109375, 12.38916015625, 13.2412109375, 14.09326171875, 14.9453125, 15.79736328125, 16.6494140625, 17.50146484375, 18.353515625, 19.20556640625, 20.0576171875, 20.90966796875, 21.76171875, 22.61376953125, 23.4658203125, 24.31787109375, 25.169921875, 26.02197265625, 26.8740234375, 27.72607421875, 28.578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 17.0, 14.0, 23.0, 27.0, 42.0, 45.0, 76.0, 46.0, 85.0, 78.0, 94.0, 83.0, 74.0, 64.0, 58.0, 26.0, 25.0, 21.0, 23.0, 9.0, 12.0, 6.0, 7.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021915435791015625, -0.0021255016326904297, -0.002059459686279297, -0.001993417739868164, -0.0019273757934570312, -0.0018613338470458984, -0.0017952919006347656, -0.0017292499542236328, -0.0016632080078125, -0.0015971660614013672, -0.0015311241149902344, -0.0014650821685791016, -0.0013990402221679688, -0.001332998275756836, -0.0012669563293457031, -0.0012009143829345703, -0.0011348724365234375, -0.0010688304901123047, -0.0010027885437011719, -0.0009367465972900391, -0.0008707046508789062, -0.0008046627044677734, -0.0007386207580566406, -0.0006725788116455078, -0.000606536865234375, -0.0005404949188232422, -0.0004744529724121094, -0.00040841102600097656, -0.00034236907958984375, -0.00027632713317871094, -0.00021028518676757812, -0.0001442432403564453, -7.82012939453125e-05, -1.2159347534179688e-05, 5.3882598876953125e-05, 0.00011992454528808594, 0.00018596649169921875, 0.00025200843811035156, 0.0003180503845214844, 0.0003840923309326172, 0.00045013427734375, 0.0005161762237548828, 0.0005822181701660156, 0.0006482601165771484, 0.0007143020629882812, 0.0007803440093994141, 0.0008463859558105469, 0.0009124279022216797, 0.0009784698486328125, 0.0010445117950439453, 0.0011105537414550781, 0.001176595687866211, 0.0012426376342773438, 0.0013086795806884766, 0.0013747215270996094, 0.0014407634735107422, 0.001506805419921875, 0.0015728473663330078, 0.0016388893127441406, 0.0017049312591552734, 0.0017709732055664062, 0.001837015151977539, 0.0019030570983886719, 0.0019690990447998047, 0.0020351409912109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 18.0, 16.0, 23.0, 29.0, 38.0, 55.0, 69.0, 100.0, 144.0, 148.0, 233.0, 340.0, 447.0, 746.0, 1159.0, 2358.0, 4948.0, 11285.0, 27418.0, 66821.0, 151477.0, 253333.0, 254785.0, 153953.0, 68304.0, 27825.0, 11439.0, 4971.0, 2315.0, 1278.0, 763.0, 443.0, 321.0, 248.0, 169.0, 132.0, 106.0, 71.0, 64.0, 39.0, 34.0, 24.0, 13.0, 12.0, 3.0, 8.0, 6.0, 6.0, 3.0, 3.0], "bins": [-27.5, -26.736328125, -25.97265625, -25.208984375, -24.4453125, -23.681640625, -22.91796875, -22.154296875, -21.390625, -20.626953125, -19.86328125, -19.099609375, -18.3359375, -17.572265625, -16.80859375, -16.044921875, -15.28125, -14.517578125, -13.75390625, -12.990234375, -12.2265625, -11.462890625, -10.69921875, -9.935546875, -9.171875, -8.408203125, -7.64453125, -6.880859375, -6.1171875, -5.353515625, -4.58984375, -3.826171875, -3.0625, -2.298828125, -1.53515625, -0.771484375, -0.0078125, 0.755859375, 1.51953125, 2.283203125, 3.046875, 3.810546875, 4.57421875, 5.337890625, 6.1015625, 6.865234375, 7.62890625, 8.392578125, 9.15625, 9.919921875, 10.68359375, 11.447265625, 12.2109375, 12.974609375, 13.73828125, 14.501953125, 15.265625, 16.029296875, 16.79296875, 17.556640625, 18.3203125, 19.083984375, 19.84765625, 20.611328125, 21.375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 15.0, 13.0, 20.0, 14.0, 27.0, 31.0, 41.0, 52.0, 54.0, 79.0, 71.0, 68.0, 68.0, 80.0, 72.0, 69.0, 38.0, 46.0, 27.0, 34.0, 17.0, 19.0, 13.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.5081787109375, -6.258544921875, -6.0089111328125, -5.75927734375, -5.5096435546875, -5.260009765625, -5.0103759765625, -4.7607421875, -4.5111083984375, -4.261474609375, -4.0118408203125, -3.76220703125, -3.5125732421875, -3.262939453125, -3.0133056640625, -2.763671875, -2.5140380859375, -2.264404296875, -2.0147705078125, -1.76513671875, -1.5155029296875, -1.265869140625, -1.0162353515625, -0.7666015625, -0.5169677734375, -0.267333984375, -0.0177001953125, 0.23193359375, 0.4815673828125, 0.731201171875, 0.9808349609375, 1.23046875, 1.4801025390625, 1.729736328125, 1.9793701171875, 2.22900390625, 2.4786376953125, 2.728271484375, 2.9779052734375, 3.2275390625, 3.4771728515625, 3.726806640625, 3.9764404296875, 4.22607421875, 4.4757080078125, 4.725341796875, 4.9749755859375, 5.224609375, 5.4742431640625, 5.723876953125, 5.9735107421875, 6.22314453125, 6.4727783203125, 6.722412109375, 6.9720458984375, 7.2216796875, 7.4713134765625, 7.720947265625, 7.9705810546875, 8.22021484375, 8.4698486328125, 8.719482421875, 8.9691162109375, 9.21875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 9.0, 12.0, 7.0, 6.0, 21.0, 21.0, 30.0, 18.0, 35.0, 26.0, 32.0, 43.0, 41.0, 40.0, 55.0, 53.0, 37.0, 41.0, 47.0, 50.0, 53.0, 41.0, 30.0, 25.0, 31.0, 37.0, 26.0, 19.0, 20.0, 12.0, 16.0, 11.0, 8.0, 10.0, 3.0, 6.0, 8.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.68899917602539, -28.79994010925293, -27.9108829498291, -27.02182388305664, -26.13276481628418, -25.24370574951172, -24.35464859008789, -23.46558952331543, -22.57653045654297, -21.687471389770508, -20.79841423034668, -19.90935516357422, -19.020296096801758, -18.131237030029297, -17.24217987060547, -16.353120803833008, -15.46406364440918, -14.575005531311035, -13.685946464538574, -12.79688835144043, -11.907829284667969, -11.018771171569824, -10.12971305847168, -9.240653991699219, -8.351595878601074, -7.4625372886657715, -6.573478698730469, -5.684420585632324, -4.7953619956970215, -3.9063034057617188, -3.017245292663574, -2.1281867027282715, -1.239126205444336, -0.35006773471832275, 0.5389907360076904, 1.428049087524414, 2.317107677459717, 3.2061662673950195, 4.095224380493164, 4.984282970428467, 5.8733415603637695, 6.762400150299072, 7.651458740234375, 8.54051685333252, 9.429574966430664, 10.318634033203125, 11.20769214630127, 12.096750259399414, 12.985809326171875, 13.87486743927002, 14.76392650604248, 15.652984619140625, 16.542043685913086, 17.431102752685547, 18.320159912109375, 19.209218978881836, 20.098278045654297, 20.987337112426758, 21.876394271850586, 22.765453338623047, 23.654512405395508, 24.54357147216797, 25.432628631591797, 26.321687698364258, 27.210744857788086]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 7.0, 10.0, 16.0, 14.0, 11.0, 25.0, 15.0, 23.0, 30.0, 40.0, 30.0, 41.0, 37.0, 49.0, 36.0, 55.0, 42.0, 41.0, 48.0, 38.0, 45.0, 37.0, 45.0, 34.0, 29.0, 20.0, 30.0, 20.0, 16.0, 23.0, 25.0, 7.0, 14.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.83268737792969, -31.704620361328125, -30.576553344726562, -29.448486328125, -28.320417404174805, -27.192350387573242, -26.06428337097168, -24.936216354370117, -23.808147430419922, -22.68008041381836, -21.552013397216797, -20.423946380615234, -19.29587745666504, -18.167810440063477, -17.039743423461914, -15.911676406860352, -14.783609390258789, -13.655542373657227, -12.527474403381348, -11.399407386779785, -10.271339416503906, -9.143272399902344, -8.015205383300781, -6.8871378898620605, -5.75907039642334, -4.631002902984619, -3.5029356479644775, -2.374868392944336, -1.2468008995056152, -0.11873340606689453, 1.009333610534668, 2.1374011039733887, 3.2654685974121094, 4.39353609085083, 5.521603584289551, 6.649670600891113, 7.777738094329834, 8.905805587768555, 10.033872604370117, 11.16193962097168, 12.290007591247559, 13.418074607849121, 14.546142578125, 15.674209594726562, 16.802276611328125, 17.930343627929688, 19.05841064453125, 20.186479568481445, 21.314546585083008, 22.44261360168457, 23.570680618286133, 24.698749542236328, 25.82681655883789, 26.954883575439453, 28.082950592041016, 29.211017608642578, 30.33908462524414, 31.467151641845703, 32.595218658447266, 33.72328567504883, 34.85135269165039, 35.97942352294922, 37.10749053955078, 38.235557556152344, 39.363624572753906]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 6.0, 12.0, 17.0, 31.0, 52.0, 104.0, 144.0, 227.0, 387.0, 599.0, 893.0, 1458.0, 2378.0, 3892.0, 5840.0, 9503.0, 15062.0, 23837.0, 37163.0, 57320.0, 86289.0, 129044.0, 184690.0, 254244.0, 329482.0, 398577.0, 447319.0, 456187.0, 426556.0, 364133.0, 289105.0, 216000.0, 153390.0, 105205.0, 70105.0, 45635.0, 29094.0, 18421.0, 11825.0, 7433.0, 4666.0, 2960.0, 1842.0, 1148.0, 706.0, 491.0, 314.0, 210.0, 125.0, 53.0, 42.0, 30.0, 21.0, 14.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-19.40625, -18.7646484375, -18.123046875, -17.4814453125, -16.83984375, -16.1982421875, -15.556640625, -14.9150390625, -14.2734375, -13.6318359375, -12.990234375, -12.3486328125, -11.70703125, -11.0654296875, -10.423828125, -9.7822265625, -9.140625, -8.4990234375, -7.857421875, -7.2158203125, -6.57421875, -5.9326171875, -5.291015625, -4.6494140625, -4.0078125, -3.3662109375, -2.724609375, -2.0830078125, -1.44140625, -0.7998046875, -0.158203125, 0.4833984375, 1.125, 1.7666015625, 2.408203125, 3.0498046875, 3.69140625, 4.3330078125, 4.974609375, 5.6162109375, 6.2578125, 6.8994140625, 7.541015625, 8.1826171875, 8.82421875, 9.4658203125, 10.107421875, 10.7490234375, 11.390625, 12.0322265625, 12.673828125, 13.3154296875, 13.95703125, 14.5986328125, 15.240234375, 15.8818359375, 16.5234375, 17.1650390625, 17.806640625, 18.4482421875, 19.08984375, 19.7314453125, 20.373046875, 21.0146484375, 21.65625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 7.0, 7.0, 6.0, 20.0, 15.0, 18.0, 21.0, 22.0, 26.0, 32.0, 35.0, 40.0, 37.0, 41.0, 40.0, 37.0, 60.0, 44.0, 35.0, 51.0, 48.0, 43.0, 39.0, 40.0, 44.0, 27.0, 24.0, 26.0, 21.0, 18.0, 15.0, 10.0, 10.0, 7.0, 5.0, 10.0, 7.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.84375, -24.939453125, -24.03515625, -23.130859375, -22.2265625, -21.322265625, -20.41796875, -19.513671875, -18.609375, -17.705078125, -16.80078125, -15.896484375, -14.9921875, -14.087890625, -13.18359375, -12.279296875, -11.375, -10.470703125, -9.56640625, -8.662109375, -7.7578125, -6.853515625, -5.94921875, -5.044921875, -4.140625, -3.236328125, -2.33203125, -1.427734375, -0.5234375, 0.380859375, 1.28515625, 2.189453125, 3.09375, 3.998046875, 4.90234375, 5.806640625, 6.7109375, 7.615234375, 8.51953125, 9.423828125, 10.328125, 11.232421875, 12.13671875, 13.041015625, 13.9453125, 14.849609375, 15.75390625, 16.658203125, 17.5625, 18.466796875, 19.37109375, 20.275390625, 21.1796875, 22.083984375, 22.98828125, 23.892578125, 24.796875, 25.701171875, 26.60546875, 27.509765625, 28.4140625, 29.318359375, 30.22265625, 31.126953125, 32.03125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 21.0, 48.0, 78.0, 122.0, 221.0, 400.0, 697.0, 1165.0, 2153.0, 3671.0, 6006.0, 10004.0, 16786.0, 26700.0, 42582.0, 65196.0, 97316.0, 141623.0, 195313.0, 259396.0, 324635.0, 381016.0, 418428.0, 425820.0, 403116.0, 353899.0, 290411.0, 225806.0, 166253.0, 117576.0, 79540.0, 52287.0, 33440.0, 21039.0, 12866.0, 7780.0, 4554.0, 2736.0, 1513.0, 895.0, 507.0, 286.0, 174.0, 85.0, 53.0, 36.0, 15.0, 15.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.5625, -20.913818359375, -20.26513671875, -19.616455078125, -18.9677734375, -18.319091796875, -17.67041015625, -17.021728515625, -16.373046875, -15.724365234375, -15.07568359375, -14.427001953125, -13.7783203125, -13.129638671875, -12.48095703125, -11.832275390625, -11.18359375, -10.534912109375, -9.88623046875, -9.237548828125, -8.5888671875, -7.940185546875, -7.29150390625, -6.642822265625, -5.994140625, -5.345458984375, -4.69677734375, -4.048095703125, -3.3994140625, -2.750732421875, -2.10205078125, -1.453369140625, -0.8046875, -0.156005859375, 0.49267578125, 1.141357421875, 1.7900390625, 2.438720703125, 3.08740234375, 3.736083984375, 4.384765625, 5.033447265625, 5.68212890625, 6.330810546875, 6.9794921875, 7.628173828125, 8.27685546875, 8.925537109375, 9.57421875, 10.222900390625, 10.87158203125, 11.520263671875, 12.1689453125, 12.817626953125, 13.46630859375, 14.114990234375, 14.763671875, 15.412353515625, 16.06103515625, 16.709716796875, 17.3583984375, 18.007080078125, 18.65576171875, 19.304443359375, 19.953125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 8.0, 7.0, 13.0, 12.0, 20.0, 36.0, 26.0, 40.0, 42.0, 68.0, 64.0, 93.0, 102.0, 130.0, 142.0, 173.0, 174.0, 175.0, 216.0, 205.0, 203.0, 203.0, 214.0, 207.0, 182.0, 185.0, 174.0, 150.0, 149.0, 131.0, 92.0, 74.0, 73.0, 65.0, 43.0, 41.0, 38.0, 23.0, 32.0, 11.0, 8.0, 6.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.42578125, -10.0546875, -9.68359375, -9.3125, -8.94140625, -8.5703125, -8.19921875, -7.828125, -7.45703125, -7.0859375, -6.71484375, -6.34375, -5.97265625, -5.6015625, -5.23046875, -4.859375, -4.48828125, -4.1171875, -3.74609375, -3.375, -3.00390625, -2.6328125, -2.26171875, -1.890625, -1.51953125, -1.1484375, -0.77734375, -0.40625, -0.03515625, 0.3359375, 0.70703125, 1.078125, 1.44921875, 1.8203125, 2.19140625, 2.5625, 2.93359375, 3.3046875, 3.67578125, 4.046875, 4.41796875, 4.7890625, 5.16015625, 5.53125, 5.90234375, 6.2734375, 6.64453125, 7.015625, 7.38671875, 7.7578125, 8.12890625, 8.5, 8.87109375, 9.2421875, 9.61328125, 9.984375, 10.35546875, 10.7265625, 11.09765625, 11.46875, 11.83984375, 12.2109375, 12.58203125, 12.953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 7.0, 10.0, 12.0, 13.0, 8.0, 20.0, 23.0, 25.0, 35.0, 31.0, 34.0, 32.0, 35.0, 47.0, 54.0, 56.0, 49.0, 51.0, 45.0, 44.0, 38.0, 41.0, 39.0, 31.0, 33.0, 37.0, 25.0, 21.0, 22.0, 14.0, 14.0, 11.0, 9.0, 9.0, 4.0, 2.0, 2.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.171144485473633, -27.296199798583984, -26.421255111694336, -25.546310424804688, -24.671363830566406, -23.796419143676758, -22.92147445678711, -22.04652976989746, -21.171585083007812, -20.296640396118164, -19.421695709228516, -18.546749114990234, -17.671804428100586, -16.796859741210938, -15.921915054321289, -15.04697036743164, -14.172024726867676, -13.297080039978027, -12.422134399414062, -11.547189712524414, -10.672245025634766, -9.797300338745117, -8.922354698181152, -8.047410011291504, -7.172464847564697, -6.297519683837891, -5.422574996948242, -4.5476298332214355, -3.672684907913208, -2.7977399826049805, -1.9227948188781738, -1.0478501319885254, -0.17290496826171875, 0.7020400166511536, 1.5769850015640259, 2.451930046081543, 3.3268749713897705, 4.201819896697998, 5.076765060424805, 5.951709747314453, 6.82665491104126, 7.701600074768066, 8.576544761657715, 9.45149040222168, 10.326435089111328, 11.201379776000977, 12.076324462890625, 12.951269149780273, 13.826214790344238, 14.701159477233887, 15.576105117797852, 16.4510498046875, 17.32599449157715, 18.200939178466797, 19.075885772705078, 19.950828552246094, 20.825775146484375, 21.700719833374023, 22.575664520263672, 23.450611114501953, 24.3255558013916, 25.20050048828125, 26.0754451751709, 26.950389862060547, 27.825334548950195]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 6.0, 5.0, 4.0, 9.0, 4.0, 10.0, 12.0, 20.0, 29.0, 19.0, 24.0, 38.0, 31.0, 35.0, 37.0, 28.0, 41.0, 43.0, 39.0, 31.0, 47.0, 30.0, 48.0, 40.0, 42.0, 38.0, 37.0, 38.0, 28.0, 30.0, 24.0, 28.0, 15.0, 14.0, 14.0, 20.0, 3.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.982175827026367, -26.99736976623535, -26.012563705444336, -25.02775764465332, -24.042951583862305, -23.05814552307129, -22.073341369628906, -21.08853530883789, -20.103729248046875, -19.11892318725586, -18.134117126464844, -17.149311065673828, -16.164505004882812, -15.179698944091797, -14.194893836975098, -13.210087776184082, -12.22528076171875, -11.240474700927734, -10.255668640136719, -9.270862579345703, -8.286056518554688, -7.30125093460083, -6.316445350646973, -5.331639289855957, -4.346833229064941, -3.362027168273926, -2.3772213459014893, -1.3924155235290527, -0.4076094627380371, 0.5771965980529785, 1.562002182006836, 2.5468082427978516, 3.5316162109375, 4.516422271728516, 5.501228332519531, 6.486033916473389, 7.470839977264404, 8.455646514892578, 9.440451622009277, 10.425257682800293, 11.410063743591309, 12.394869804382324, 13.37967586517334, 14.364480972290039, 15.349287033081055, 16.33409309387207, 17.318899154663086, 18.3037052154541, 19.288511276245117, 20.273317337036133, 21.25812339782715, 22.242929458618164, 23.22773551940918, 24.212541580200195, 25.197345733642578, 26.182151794433594, 27.16695785522461, 28.151763916015625, 29.13656997680664, 30.121376037597656, 31.106182098388672, 32.09098815917969, 33.0757942199707, 34.06060028076172, 35.045406341552734]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 10.0, 15.0, 23.0, 31.0, 50.0, 100.0, 141.0, 257.0, 419.0, 685.0, 1056.0, 1786.0, 3033.0, 4950.0, 8032.0, 13047.0, 20710.0, 32809.0, 50343.0, 73863.0, 103498.0, 131335.0, 144496.0, 133459.0, 106505.0, 76105.0, 51664.0, 33642.0, 21790.0, 13594.0, 8291.0, 5017.0, 2998.0, 1923.0, 1137.0, 663.0, 425.0, 208.0, 167.0, 115.0, 61.0, 48.0, 24.0, 14.0, 9.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.64453125, -6.4403076171875, -6.236083984375, -6.0318603515625, -5.82763671875, -5.6234130859375, -5.419189453125, -5.2149658203125, -5.0107421875, -4.8065185546875, -4.602294921875, -4.3980712890625, -4.19384765625, -3.9896240234375, -3.785400390625, -3.5811767578125, -3.376953125, -3.1727294921875, -2.968505859375, -2.7642822265625, -2.56005859375, -2.3558349609375, -2.151611328125, -1.9473876953125, -1.7431640625, -1.5389404296875, -1.334716796875, -1.1304931640625, -0.92626953125, -0.7220458984375, -0.517822265625, -0.3135986328125, -0.109375, 0.0948486328125, 0.299072265625, 0.5032958984375, 0.70751953125, 0.9117431640625, 1.115966796875, 1.3201904296875, 1.5244140625, 1.7286376953125, 1.932861328125, 2.1370849609375, 2.34130859375, 2.5455322265625, 2.749755859375, 2.9539794921875, 3.158203125, 3.3624267578125, 3.566650390625, 3.7708740234375, 3.97509765625, 4.1793212890625, 4.383544921875, 4.5877685546875, 4.7919921875, 4.9962158203125, 5.200439453125, 5.4046630859375, 5.60888671875, 5.8131103515625, 6.017333984375, 6.2215576171875, 6.42578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 2.0, 7.0, 7.0, 9.0, 7.0, 11.0, 20.0, 21.0, 32.0, 32.0, 20.0, 25.0, 37.0, 39.0, 43.0, 35.0, 52.0, 44.0, 32.0, 33.0, 44.0, 38.0, 46.0, 45.0, 42.0, 30.0, 27.0, 22.0, 34.0, 34.0, 23.0, 19.0, 17.0, 9.0, 13.0, 12.0, 6.0, 5.0, 4.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.234375, -29.210205078125, -28.18603515625, -27.161865234375, -26.1376953125, -25.113525390625, -24.08935546875, -23.065185546875, -22.041015625, -21.016845703125, -19.99267578125, -18.968505859375, -17.9443359375, -16.920166015625, -15.89599609375, -14.871826171875, -13.84765625, -12.823486328125, -11.79931640625, -10.775146484375, -9.7509765625, -8.726806640625, -7.70263671875, -6.678466796875, -5.654296875, -4.630126953125, -3.60595703125, -2.581787109375, -1.5576171875, -0.533447265625, 0.49072265625, 1.514892578125, 2.5390625, 3.563232421875, 4.58740234375, 5.611572265625, 6.6357421875, 7.659912109375, 8.68408203125, 9.708251953125, 10.732421875, 11.756591796875, 12.78076171875, 13.804931640625, 14.8291015625, 15.853271484375, 16.87744140625, 17.901611328125, 18.92578125, 19.949951171875, 20.97412109375, 21.998291015625, 23.0224609375, 24.046630859375, 25.07080078125, 26.094970703125, 27.119140625, 28.143310546875, 29.16748046875, 30.191650390625, 31.2158203125, 32.239990234375, 33.26416015625, 34.288330078125, 35.3125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 9.0, 11.0, 5.0, 16.0, 31.0, 43.0, 54.0, 79.0, 139.0, 189.0, 273.0, 471.0, 715.0, 1096.0, 1832.0, 3093.0, 5192.0, 8753.0, 14878.0, 25395.0, 42569.0, 68514.0, 103382.0, 141369.0, 161548.0, 150101.0, 116048.0, 79225.0, 49938.0, 29729.0, 17841.0, 10438.0, 6115.0, 3566.0, 2226.0, 1361.0, 854.0, 505.0, 361.0, 220.0, 133.0, 73.0, 51.0, 39.0, 27.0, 23.0, 14.0, 7.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.89453125, -5.71405029296875, -5.5335693359375, -5.35308837890625, -5.172607421875, -4.99212646484375, -4.8116455078125, -4.63116455078125, -4.45068359375, -4.27020263671875, -4.0897216796875, -3.90924072265625, -3.728759765625, -3.54827880859375, -3.3677978515625, -3.18731689453125, -3.0068359375, -2.82635498046875, -2.6458740234375, -2.46539306640625, -2.284912109375, -2.10443115234375, -1.9239501953125, -1.74346923828125, -1.56298828125, -1.38250732421875, -1.2020263671875, -1.02154541015625, -0.841064453125, -0.66058349609375, -0.4801025390625, -0.29962158203125, -0.119140625, 0.06134033203125, 0.2418212890625, 0.42230224609375, 0.602783203125, 0.78326416015625, 0.9637451171875, 1.14422607421875, 1.32470703125, 1.50518798828125, 1.6856689453125, 1.86614990234375, 2.046630859375, 2.22711181640625, 2.4075927734375, 2.58807373046875, 2.7685546875, 2.94903564453125, 3.1295166015625, 3.30999755859375, 3.490478515625, 3.67095947265625, 3.8514404296875, 4.03192138671875, 4.21240234375, 4.39288330078125, 4.5733642578125, 4.75384521484375, 4.934326171875, 5.11480712890625, 5.2952880859375, 5.47576904296875, 5.65625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 2.0, 7.0, 4.0, 11.0, 9.0, 13.0, 15.0, 20.0, 14.0, 21.0, 26.0, 19.0, 18.0, 37.0, 27.0, 38.0, 33.0, 37.0, 32.0, 35.0, 38.0, 40.0, 37.0, 39.0, 44.0, 40.0, 41.0, 28.0, 24.0, 20.0, 19.0, 17.0, 20.0, 28.0, 24.0, 17.0, 5.0, 15.0, 10.0, 10.0, 11.0, 9.0, 8.0, 8.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-17.953125, -17.397216796875, -16.84130859375, -16.285400390625, -15.7294921875, -15.173583984375, -14.61767578125, -14.061767578125, -13.505859375, -12.949951171875, -12.39404296875, -11.838134765625, -11.2822265625, -10.726318359375, -10.17041015625, -9.614501953125, -9.05859375, -8.502685546875, -7.94677734375, -7.390869140625, -6.8349609375, -6.279052734375, -5.72314453125, -5.167236328125, -4.611328125, -4.055419921875, -3.49951171875, -2.943603515625, -2.3876953125, -1.831787109375, -1.27587890625, -0.719970703125, -0.1640625, 0.391845703125, 0.94775390625, 1.503662109375, 2.0595703125, 2.615478515625, 3.17138671875, 3.727294921875, 4.283203125, 4.839111328125, 5.39501953125, 5.950927734375, 6.5068359375, 7.062744140625, 7.61865234375, 8.174560546875, 8.73046875, 9.286376953125, 9.84228515625, 10.398193359375, 10.9541015625, 11.510009765625, 12.06591796875, 12.621826171875, 13.177734375, 13.733642578125, 14.28955078125, 14.845458984375, 15.4013671875, 15.957275390625, 16.51318359375, 17.069091796875, 17.625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 9.0, 7.0, 16.0, 17.0, 33.0, 46.0, 48.0, 75.0, 122.0, 194.0, 248.0, 407.0, 557.0, 865.0, 1348.0, 2234.0, 3691.0, 6489.0, 11989.0, 22929.0, 47198.0, 98076.0, 197532.0, 272727.0, 191998.0, 94373.0, 45455.0, 22101.0, 11771.0, 6305.0, 3579.0, 2150.0, 1344.0, 878.0, 532.0, 379.0, 254.0, 172.0, 122.0, 87.0, 46.0, 41.0, 34.0, 24.0, 13.0, 14.0, 7.0, 6.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.6533203125, -1.600799560546875, -1.54827880859375, -1.495758056640625, -1.4432373046875, -1.390716552734375, -1.33819580078125, -1.285675048828125, -1.233154296875, -1.180633544921875, -1.12811279296875, -1.075592041015625, -1.0230712890625, -0.970550537109375, -0.91802978515625, -0.865509033203125, -0.81298828125, -0.760467529296875, -0.70794677734375, -0.655426025390625, -0.6029052734375, -0.550384521484375, -0.49786376953125, -0.445343017578125, -0.392822265625, -0.340301513671875, -0.28778076171875, -0.235260009765625, -0.1827392578125, -0.130218505859375, -0.07769775390625, -0.025177001953125, 0.02734375, 0.079864501953125, 0.13238525390625, 0.184906005859375, 0.2374267578125, 0.289947509765625, 0.34246826171875, 0.394989013671875, 0.447509765625, 0.500030517578125, 0.55255126953125, 0.605072021484375, 0.6575927734375, 0.710113525390625, 0.76263427734375, 0.815155029296875, 0.86767578125, 0.920196533203125, 0.97271728515625, 1.025238037109375, 1.0777587890625, 1.130279541015625, 1.18280029296875, 1.235321044921875, 1.287841796875, 1.340362548828125, 1.39288330078125, 1.445404052734375, 1.4979248046875, 1.550445556640625, 1.60296630859375, 1.655487060546875, 1.7080078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 4.0, 11.0, 16.0, 23.0, 22.0, 32.0, 48.0, 60.0, 74.0, 63.0, 71.0, 81.0, 97.0, 76.0, 73.0, 67.0, 39.0, 31.0, 19.0, 24.0, 17.0, 10.0, 10.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003542900085449219, -0.0003448314964771271, -0.0003353729844093323, -0.0003259144723415375, -0.0003164559602737427, -0.0003069974482059479, -0.0002975389361381531, -0.0002880804240703583, -0.0002786219120025635, -0.0002691633999347687, -0.0002597048878669739, -0.0002502463757991791, -0.00024078786373138428, -0.00023132935166358948, -0.00022187083959579468, -0.00021241232752799988, -0.00020295381546020508, -0.00019349530339241028, -0.00018403679132461548, -0.00017457827925682068, -0.00016511976718902588, -0.00015566125512123108, -0.00014620274305343628, -0.00013674423098564148, -0.00012728571891784668, -0.00011782720685005188, -0.00010836869478225708, -9.891018271446228e-05, -8.945167064666748e-05, -7.999315857887268e-05, -7.053464651107788e-05, -6.107613444328308e-05, -5.161762237548828e-05, -4.215911030769348e-05, -3.270059823989868e-05, -2.3242086172103882e-05, -1.3783574104309082e-05, -4.325062036514282e-06, 5.133450031280518e-06, 1.4591962099075317e-05, 2.4050474166870117e-05, 3.350898623466492e-05, 4.296749830245972e-05, 5.2426010370254517e-05, 6.188452243804932e-05, 7.134303450584412e-05, 8.080154657363892e-05, 9.026005864143372e-05, 9.971857070922852e-05, 0.00010917708277702332, 0.00011863559484481812, 0.00012809410691261292, 0.00013755261898040771, 0.00014701113104820251, 0.00015646964311599731, 0.00016592815518379211, 0.00017538666725158691, 0.00018484517931938171, 0.00019430369138717651, 0.0002037622034549713, 0.0002132207155227661, 0.0002226792275905609, 0.0002321377396583557, 0.0002415962517261505, 0.0002510547637939453]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 8.0, 12.0, 17.0, 22.0, 39.0, 59.0, 80.0, 141.0, 198.0, 300.0, 473.0, 691.0, 1090.0, 1702.0, 2720.0, 4225.0, 7127.0, 11796.0, 19962.0, 34124.0, 57665.0, 93364.0, 140401.0, 178348.0, 168999.0, 124219.0, 80708.0, 48532.0, 28751.0, 16768.0, 9991.0, 5867.0, 3699.0, 2315.0, 1433.0, 932.0, 600.0, 388.0, 258.0, 177.0, 115.0, 82.0, 48.0, 39.0, 26.0, 17.0, 5.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.259765625, -2.18878173828125, -2.1177978515625, -2.04681396484375, -1.975830078125, -1.90484619140625, -1.8338623046875, -1.76287841796875, -1.69189453125, -1.62091064453125, -1.5499267578125, -1.47894287109375, -1.407958984375, -1.33697509765625, -1.2659912109375, -1.19500732421875, -1.1240234375, -1.05303955078125, -0.9820556640625, -0.91107177734375, -0.840087890625, -0.76910400390625, -0.6981201171875, -0.62713623046875, -0.55615234375, -0.48516845703125, -0.4141845703125, -0.34320068359375, -0.272216796875, -0.20123291015625, -0.1302490234375, -0.05926513671875, 0.01171875, 0.08270263671875, 0.1536865234375, 0.22467041015625, 0.295654296875, 0.36663818359375, 0.4376220703125, 0.50860595703125, 0.57958984375, 0.65057373046875, 0.7215576171875, 0.79254150390625, 0.863525390625, 0.93450927734375, 1.0054931640625, 1.07647705078125, 1.1474609375, 1.21844482421875, 1.2894287109375, 1.36041259765625, 1.431396484375, 1.50238037109375, 1.5733642578125, 1.64434814453125, 1.71533203125, 1.78631591796875, 1.8572998046875, 1.92828369140625, 1.999267578125, 2.07025146484375, 2.1412353515625, 2.21221923828125, 2.283203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 13.0, 16.0, 22.0, 17.0, 16.0, 17.0, 34.0, 35.0, 39.0, 47.0, 53.0, 68.0, 67.0, 76.0, 47.0, 60.0, 47.0, 43.0, 43.0, 44.0, 24.0, 30.0, 21.0, 22.0, 20.0, 20.0, 8.0, 8.0, 3.0, 5.0, 6.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80419921875, -0.7785415649414062, -0.7528839111328125, -0.7272262573242188, -0.701568603515625, -0.6759109497070312, -0.6502532958984375, -0.6245956420898438, -0.59893798828125, -0.5732803344726562, -0.5476226806640625, -0.5219650268554688, -0.496307373046875, -0.47064971923828125, -0.4449920654296875, -0.41933441162109375, -0.3936767578125, -0.36801910400390625, -0.3423614501953125, -0.31670379638671875, -0.291046142578125, -0.26538848876953125, -0.2397308349609375, -0.21407318115234375, -0.18841552734375, -0.16275787353515625, -0.1371002197265625, -0.11144256591796875, -0.085784912109375, -0.06012725830078125, -0.0344696044921875, -0.00881195068359375, 0.016845703125, 0.04250335693359375, 0.0681610107421875, 0.09381866455078125, 0.119476318359375, 0.14513397216796875, 0.1707916259765625, 0.19644927978515625, 0.22210693359375, 0.24776458740234375, 0.2734222412109375, 0.29907989501953125, 0.324737548828125, 0.35039520263671875, 0.3760528564453125, 0.40171051025390625, 0.4273681640625, 0.45302581787109375, 0.4786834716796875, 0.5043411254882812, 0.529998779296875, 0.5556564331054688, 0.5813140869140625, 0.6069717407226562, 0.63262939453125, 0.6582870483398438, 0.6839447021484375, 0.7096023559570312, 0.735260009765625, 0.7609176635742188, 0.7865753173828125, 0.8122329711914062, 0.837890625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 10.0, 6.0, 7.0, 14.0, 11.0, 16.0, 23.0, 21.0, 26.0, 33.0, 34.0, 22.0, 41.0, 46.0, 34.0, 59.0, 50.0, 52.0, 54.0, 38.0, 48.0, 44.0, 35.0, 45.0, 27.0, 35.0, 27.0, 24.0, 21.0, 23.0, 16.0, 12.0, 6.0, 11.0, 11.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.702054977416992, -26.835445404052734, -25.96883773803711, -25.10222816467285, -24.235618591308594, -23.36901092529297, -22.50240135192871, -21.635791778564453, -20.769184112548828, -19.90257453918457, -19.035966873168945, -18.169357299804688, -17.30274772644043, -16.436138153076172, -15.569530487060547, -14.702920913696289, -13.836311340332031, -12.96970272064209, -12.103093147277832, -11.23648452758789, -10.369874954223633, -9.503266334533691, -8.63665771484375, -7.77004861831665, -6.903439521789551, -6.036830425262451, -5.170221328735352, -4.30361270904541, -3.4370036125183105, -2.570394515991211, -1.7037858963012695, -0.8371767997741699, 0.0294342041015625, 0.8960431814193726, 1.7626521587371826, 2.629261016845703, 3.4958701133728027, 4.362479209899902, 5.229087829589844, 6.095696926116943, 6.962306022644043, 7.828915119171143, 8.695524215698242, 9.562132835388184, 10.428741455078125, 11.295351028442383, 12.161959648132324, 13.028568267822266, 13.895177841186523, 14.761786460876465, 15.628396034240723, 16.495004653930664, 17.361614227294922, 18.228221893310547, 19.094831466674805, 19.961441040039062, 20.828048706054688, 21.694658279418945, 22.56126594543457, 23.427875518798828, 24.294485092163086, 25.161094665527344, 26.02770233154297, 26.894311904907227, 27.760921478271484]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 5.0, 6.0, 6.0, 4.0, 8.0, 5.0, 12.0, 13.0, 17.0, 29.0, 24.0, 22.0, 35.0, 30.0, 38.0, 35.0, 29.0, 42.0, 44.0, 41.0, 29.0, 44.0, 26.0, 53.0, 37.0, 41.0, 41.0, 34.0, 41.0, 25.0, 34.0, 21.0, 27.0, 14.0, 16.0, 14.0, 20.0, 5.0, 7.0, 5.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.886810302734375, -26.911548614501953, -25.93628692626953, -24.961027145385742, -23.98576545715332, -23.0105037689209, -22.035242080688477, -21.059982299804688, -20.084720611572266, -19.109458923339844, -18.134197235107422, -17.158937454223633, -16.18367576599121, -15.208414077758789, -14.233152389526367, -13.257891654968262, -12.28262996673584, -11.307368278503418, -10.332107543945312, -9.35684585571289, -8.381585121154785, -7.406323432922363, -6.4310622215271, -5.455801010131836, -4.480539798736572, -3.5052785873413086, -2.530017375946045, -1.5547559261322021, -0.5794947147369385, 0.3957667350769043, 1.371027946472168, 2.3462891578674316, 3.3215503692626953, 4.296811580657959, 5.272072792053223, 6.2473344802856445, 7.22259521484375, 8.197856903076172, 9.173118591308594, 10.1483793258667, 11.123640060424805, 12.098901748657227, 13.074162483215332, 14.049424171447754, 15.02468490600586, 15.999946594238281, 16.975208282470703, 17.950469970703125, 18.925731658935547, 19.90099334716797, 20.87625503540039, 21.85151481628418, 22.8267765045166, 23.802038192749023, 24.777299880981445, 25.752559661865234, 26.727821350097656, 27.703083038330078, 28.6783447265625, 29.65360450744629, 30.62886619567871, 31.604127883911133, 32.57938766479492, 33.554649353027344, 34.529911041259766]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 12.0, 18.0, 20.0, 39.0, 56.0, 116.0, 202.0, 365.0, 498.0, 835.0, 1360.0, 2183.0, 3644.0, 5735.0, 8549.0, 13061.0, 19754.0, 28568.0, 39736.0, 53563.0, 67967.0, 82391.0, 93808.0, 100386.0, 100984.0, 93909.0, 82688.0, 68557.0, 53299.0, 40306.0, 28945.0, 19851.0, 13465.0, 8687.0, 5581.0, 3654.0, 2219.0, 1366.0, 823.0, 515.0, 312.0, 213.0, 110.0, 84.0, 45.0, 30.0, 21.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-19.59375, -18.981689453125, -18.36962890625, -17.757568359375, -17.1455078125, -16.533447265625, -15.92138671875, -15.309326171875, -14.697265625, -14.085205078125, -13.47314453125, -12.861083984375, -12.2490234375, -11.636962890625, -11.02490234375, -10.412841796875, -9.80078125, -9.188720703125, -8.57666015625, -7.964599609375, -7.3525390625, -6.740478515625, -6.12841796875, -5.516357421875, -4.904296875, -4.292236328125, -3.68017578125, -3.068115234375, -2.4560546875, -1.843994140625, -1.23193359375, -0.619873046875, -0.0078125, 0.604248046875, 1.21630859375, 1.828369140625, 2.4404296875, 3.052490234375, 3.66455078125, 4.276611328125, 4.888671875, 5.500732421875, 6.11279296875, 6.724853515625, 7.3369140625, 7.948974609375, 8.56103515625, 9.173095703125, 9.78515625, 10.397216796875, 11.00927734375, 11.621337890625, 12.2333984375, 12.845458984375, 13.45751953125, 14.069580078125, 14.681640625, 15.293701171875, 15.90576171875, 16.517822265625, 17.1298828125, 17.741943359375, 18.35400390625, 18.966064453125, 19.578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 1.0, 4.0, 9.0, 9.0, 8.0, 13.0, 13.0, 18.0, 16.0, 16.0, 27.0, 25.0, 28.0, 33.0, 38.0, 16.0, 29.0, 43.0, 33.0, 30.0, 32.0, 30.0, 30.0, 47.0, 42.0, 43.0, 26.0, 43.0, 32.0, 37.0, 35.0, 26.0, 18.0, 13.0, 20.0, 18.0, 19.0, 12.0, 10.0, 13.0, 8.0, 8.0, 4.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-27.171875, -26.3017578125, -25.431640625, -24.5615234375, -23.69140625, -22.8212890625, -21.951171875, -21.0810546875, -20.2109375, -19.3408203125, -18.470703125, -17.6005859375, -16.73046875, -15.8603515625, -14.990234375, -14.1201171875, -13.25, -12.3798828125, -11.509765625, -10.6396484375, -9.76953125, -8.8994140625, -8.029296875, -7.1591796875, -6.2890625, -5.4189453125, -4.548828125, -3.6787109375, -2.80859375, -1.9384765625, -1.068359375, -0.1982421875, 0.671875, 1.5419921875, 2.412109375, 3.2822265625, 4.15234375, 5.0224609375, 5.892578125, 6.7626953125, 7.6328125, 8.5029296875, 9.373046875, 10.2431640625, 11.11328125, 11.9833984375, 12.853515625, 13.7236328125, 14.59375, 15.4638671875, 16.333984375, 17.2041015625, 18.07421875, 18.9443359375, 19.814453125, 20.6845703125, 21.5546875, 22.4248046875, 23.294921875, 24.1650390625, 25.03515625, 25.9052734375, 26.775390625, 27.6455078125, 28.515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 17.0, 20.0, 28.0, 57.0, 112.0, 133.0, 234.0, 385.0, 648.0, 1006.0, 1720.0, 2616.0, 4405.0, 6953.0, 10744.0, 16906.0, 24922.0, 36157.0, 50206.0, 66678.0, 84162.0, 97943.0, 106658.0, 107155.0, 100687.0, 86197.0, 71146.0, 54082.0, 39121.0, 27051.0, 18121.0, 11937.0, 7798.0, 4736.0, 3101.0, 1822.0, 1142.0, 684.0, 416.0, 250.0, 147.0, 111.0, 49.0, 37.0, 24.0, 13.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -20.03759765625, -19.3720703125, -18.70654296875, -18.041015625, -17.37548828125, -16.7099609375, -16.04443359375, -15.37890625, -14.71337890625, -14.0478515625, -13.38232421875, -12.716796875, -12.05126953125, -11.3857421875, -10.72021484375, -10.0546875, -9.38916015625, -8.7236328125, -8.05810546875, -7.392578125, -6.72705078125, -6.0615234375, -5.39599609375, -4.73046875, -4.06494140625, -3.3994140625, -2.73388671875, -2.068359375, -1.40283203125, -0.7373046875, -0.07177734375, 0.59375, 1.25927734375, 1.9248046875, 2.59033203125, 3.255859375, 3.92138671875, 4.5869140625, 5.25244140625, 5.91796875, 6.58349609375, 7.2490234375, 7.91455078125, 8.580078125, 9.24560546875, 9.9111328125, 10.57666015625, 11.2421875, 11.90771484375, 12.5732421875, 13.23876953125, 13.904296875, 14.56982421875, 15.2353515625, 15.90087890625, 16.56640625, 17.23193359375, 17.8974609375, 18.56298828125, 19.228515625, 19.89404296875, 20.5595703125, 21.22509765625, 21.890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 14.0, 7.0, 10.0, 17.0, 20.0, 15.0, 26.0, 29.0, 30.0, 27.0, 34.0, 40.0, 30.0, 46.0, 48.0, 32.0, 41.0, 55.0, 32.0, 40.0, 50.0, 47.0, 43.0, 37.0, 34.0, 31.0, 24.0, 23.0, 15.0, 12.0, 15.0, 13.0, 13.0, 3.0, 10.0, 6.0, 3.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.683837890625, -21.03955078125, -20.395263671875, -19.7509765625, -19.106689453125, -18.46240234375, -17.818115234375, -17.173828125, -16.529541015625, -15.88525390625, -15.240966796875, -14.5966796875, -13.952392578125, -13.30810546875, -12.663818359375, -12.01953125, -11.375244140625, -10.73095703125, -10.086669921875, -9.4423828125, -8.798095703125, -8.15380859375, -7.509521484375, -6.865234375, -6.220947265625, -5.57666015625, -4.932373046875, -4.2880859375, -3.643798828125, -2.99951171875, -2.355224609375, -1.7109375, -1.066650390625, -0.42236328125, 0.221923828125, 0.8662109375, 1.510498046875, 2.15478515625, 2.799072265625, 3.443359375, 4.087646484375, 4.73193359375, 5.376220703125, 6.0205078125, 6.664794921875, 7.30908203125, 7.953369140625, 8.59765625, 9.241943359375, 9.88623046875, 10.530517578125, 11.1748046875, 11.819091796875, 12.46337890625, 13.107666015625, 13.751953125, 14.396240234375, 15.04052734375, 15.684814453125, 16.3291015625, 16.973388671875, 17.61767578125, 18.261962890625, 18.90625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 7.0, 13.0, 23.0, 25.0, 31.0, 55.0, 81.0, 136.0, 164.0, 317.0, 474.0, 716.0, 1185.0, 1847.0, 2857.0, 4480.0, 7084.0, 10924.0, 16577.0, 25422.0, 37554.0, 53431.0, 72515.0, 92741.0, 108858.0, 116983.0, 113545.0, 100807.0, 82325.0, 62444.0, 45159.0, 31016.0, 20891.0, 13657.0, 8755.0, 5687.0, 3480.0, 2325.0, 1422.0, 868.0, 605.0, 373.0, 248.0, 157.0, 98.0, 55.0, 38.0, 31.0, 30.0, 12.0, 15.0, 8.0, 6.0, 4.0, 0.0, 2.0], "bins": [-8.75, -8.49072265625, -8.2314453125, -7.97216796875, -7.712890625, -7.45361328125, -7.1943359375, -6.93505859375, -6.67578125, -6.41650390625, -6.1572265625, -5.89794921875, -5.638671875, -5.37939453125, -5.1201171875, -4.86083984375, -4.6015625, -4.34228515625, -4.0830078125, -3.82373046875, -3.564453125, -3.30517578125, -3.0458984375, -2.78662109375, -2.52734375, -2.26806640625, -2.0087890625, -1.74951171875, -1.490234375, -1.23095703125, -0.9716796875, -0.71240234375, -0.453125, -0.19384765625, 0.0654296875, 0.32470703125, 0.583984375, 0.84326171875, 1.1025390625, 1.36181640625, 1.62109375, 1.88037109375, 2.1396484375, 2.39892578125, 2.658203125, 2.91748046875, 3.1767578125, 3.43603515625, 3.6953125, 3.95458984375, 4.2138671875, 4.47314453125, 4.732421875, 4.99169921875, 5.2509765625, 5.51025390625, 5.76953125, 6.02880859375, 6.2880859375, 6.54736328125, 6.806640625, 7.06591796875, 7.3251953125, 7.58447265625, 7.84375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 13.0, 18.0, 9.0, 22.0, 31.0, 26.0, 26.0, 34.0, 35.0, 48.0, 39.0, 46.0, 43.0, 68.0, 68.0, 45.0, 56.0, 41.0, 35.0, 51.0, 34.0, 38.0, 38.0, 27.0, 23.0, 17.0, 15.0, 6.0, 10.0, 11.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011043548583984375, -0.0010685175657272339, -0.0010326802730560303, -0.0009968429803848267, -0.000961005687713623, -0.0009251683950424194, -0.0008893311023712158, -0.0008534938097000122, -0.0008176565170288086, -0.000781819224357605, -0.0007459819316864014, -0.0007101446390151978, -0.0006743073463439941, -0.0006384700536727905, -0.0006026327610015869, -0.0005667954683303833, -0.0005309581756591797, -0.0004951208829879761, -0.00045928359031677246, -0.00042344629764556885, -0.00038760900497436523, -0.0003517717123031616, -0.000315934419631958, -0.0002800971269607544, -0.0002442598342895508, -0.00020842254161834717, -0.00017258524894714355, -0.00013674795627593994, -0.00010091066360473633, -6.507337093353271e-05, -2.92360782623291e-05, 6.601214408874512e-06, 4.2438507080078125e-05, 7.827579975128174e-05, 0.00011411309242248535, 0.00014995038509368896, 0.00018578767776489258, 0.0002216249704360962, 0.0002574622631072998, 0.0002932995557785034, 0.00032913684844970703, 0.00036497414112091064, 0.00040081143379211426, 0.00043664872646331787, 0.0004724860191345215, 0.0005083233118057251, 0.0005441606044769287, 0.0005799978971481323, 0.0006158351898193359, 0.0006516724824905396, 0.0006875097751617432, 0.0007233470678329468, 0.0007591843605041504, 0.000795021653175354, 0.0008308589458465576, 0.0008666962385177612, 0.0009025335311889648, 0.0009383708238601685, 0.0009742081165313721, 0.0010100454092025757, 0.0010458827018737793, 0.001081719994544983, 0.0011175572872161865, 0.0011533945798873901, 0.0011892318725585938]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 8.0, 11.0, 36.0, 42.0, 73.0, 116.0, 169.0, 256.0, 422.0, 688.0, 1123.0, 1719.0, 2927.0, 4481.0, 7265.0, 11526.0, 18202.0, 27438.0, 41024.0, 58157.0, 77677.0, 97068.0, 112483.0, 118529.0, 112901.0, 98422.0, 78738.0, 58384.0, 41475.0, 27866.0, 18245.0, 11597.0, 7382.0, 4650.0, 2816.0, 1734.0, 1115.0, 680.0, 410.0, 252.0, 154.0, 86.0, 82.0, 57.0, 24.0, 17.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.29833984375, -8.0263671875, -7.75439453125, -7.482421875, -7.21044921875, -6.9384765625, -6.66650390625, -6.39453125, -6.12255859375, -5.8505859375, -5.57861328125, -5.306640625, -5.03466796875, -4.7626953125, -4.49072265625, -4.21875, -3.94677734375, -3.6748046875, -3.40283203125, -3.130859375, -2.85888671875, -2.5869140625, -2.31494140625, -2.04296875, -1.77099609375, -1.4990234375, -1.22705078125, -0.955078125, -0.68310546875, -0.4111328125, -0.13916015625, 0.1328125, 0.40478515625, 0.6767578125, 0.94873046875, 1.220703125, 1.49267578125, 1.7646484375, 2.03662109375, 2.30859375, 2.58056640625, 2.8525390625, 3.12451171875, 3.396484375, 3.66845703125, 3.9404296875, 4.21240234375, 4.484375, 4.75634765625, 5.0283203125, 5.30029296875, 5.572265625, 5.84423828125, 6.1162109375, 6.38818359375, 6.66015625, 6.93212890625, 7.2041015625, 7.47607421875, 7.748046875, 8.02001953125, 8.2919921875, 8.56396484375, 8.8359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 5.0, 13.0, 11.0, 13.0, 16.0, 21.0, 22.0, 22.0, 37.0, 23.0, 31.0, 44.0, 42.0, 43.0, 36.0, 53.0, 50.0, 48.0, 39.0, 32.0, 36.0, 43.0, 40.0, 38.0, 29.0, 26.0, 23.0, 24.0, 24.0, 20.0, 17.0, 9.0, 9.0, 9.0, 7.0, 2.0, 9.0, 2.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.583984375, -3.470733642578125, -3.35748291015625, -3.244232177734375, -3.1309814453125, -3.017730712890625, -2.90447998046875, -2.791229248046875, -2.677978515625, -2.564727783203125, -2.45147705078125, -2.338226318359375, -2.2249755859375, -2.111724853515625, -1.99847412109375, -1.885223388671875, -1.77197265625, -1.658721923828125, -1.54547119140625, -1.432220458984375, -1.3189697265625, -1.205718994140625, -1.09246826171875, -0.979217529296875, -0.865966796875, -0.752716064453125, -0.63946533203125, -0.526214599609375, -0.4129638671875, -0.299713134765625, -0.18646240234375, -0.073211669921875, 0.0400390625, 0.153289794921875, 0.26654052734375, 0.379791259765625, 0.4930419921875, 0.606292724609375, 0.71954345703125, 0.832794189453125, 0.946044921875, 1.059295654296875, 1.17254638671875, 1.285797119140625, 1.3990478515625, 1.512298583984375, 1.62554931640625, 1.738800048828125, 1.85205078125, 1.965301513671875, 2.07855224609375, 2.191802978515625, 2.3050537109375, 2.418304443359375, 2.53155517578125, 2.644805908203125, 2.758056640625, 2.871307373046875, 2.98455810546875, 3.097808837890625, 3.2110595703125, 3.324310302734375, 3.43756103515625, 3.550811767578125, 3.6640625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 7.0, 10.0, 7.0, 9.0, 10.0, 10.0, 20.0, 20.0, 25.0, 19.0, 25.0, 34.0, 38.0, 43.0, 48.0, 43.0, 51.0, 41.0, 45.0, 44.0, 44.0, 49.0, 35.0, 44.0, 35.0, 41.0, 32.0, 28.0, 23.0, 20.0, 23.0, 11.0, 19.0, 9.0, 10.0, 5.0, 4.0, 4.0, 9.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.810029983520508, -23.951793670654297, -23.093557357788086, -22.235321044921875, -21.377086639404297, -20.518848419189453, -19.660614013671875, -18.802377700805664, -17.944141387939453, -17.085905075073242, -16.22766876220703, -15.369433403015137, -14.511197090148926, -13.652960777282715, -12.79472541809082, -11.93648910522461, -11.078252792358398, -10.220016479492188, -9.361780166625977, -8.503544807434082, -7.645308494567871, -6.78707218170166, -5.928836345672607, -5.070600509643555, -4.212364196777344, -3.354128122329712, -2.49589204788208, -1.6376559734344482, -0.7794198989868164, 0.07881641387939453, 0.9370522499084473, 1.7952880859375, 2.6535263061523438, 3.5117623805999756, 4.369998455047607, 5.22823429107666, 6.086470603942871, 6.944706916809082, 7.802942752838135, 8.661178588867188, 9.519414901733398, 10.37765121459961, 11.23588752746582, 12.094122886657715, 12.952359199523926, 13.810595512390137, 14.668830871582031, 15.527067184448242, 16.385303497314453, 17.243539810180664, 18.101776123046875, 18.960012435913086, 19.818248748779297, 20.676483154296875, 21.534719467163086, 22.392955780029297, 23.251192092895508, 24.10942840576172, 24.96766471862793, 25.82590103149414, 26.68413543701172, 27.542373657226562, 28.40060806274414, 29.25884437561035, 30.117080688476562]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 4.0, 7.0, 16.0, 17.0, 5.0, 19.0, 16.0, 24.0, 21.0, 28.0, 33.0, 24.0, 29.0, 44.0, 35.0, 41.0, 36.0, 29.0, 39.0, 47.0, 43.0, 38.0, 37.0, 38.0, 37.0, 29.0, 19.0, 37.0, 25.0, 29.0, 20.0, 13.0, 10.0, 15.0, 16.0, 12.0, 12.0, 9.0, 4.0, 5.0, 10.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.888347625732422, -26.984975814819336, -26.081605911254883, -25.178234100341797, -24.27486228942871, -23.371492385864258, -22.468120574951172, -21.56475067138672, -20.661378860473633, -19.758007049560547, -18.854637145996094, -17.951265335083008, -17.047893524169922, -16.14452362060547, -15.241151809692383, -14.337780952453613, -13.434409141540527, -12.531038284301758, -11.627666473388672, -10.724295616149902, -9.820924758911133, -8.917552947998047, -8.014182090759277, -7.110811233520508, -6.20743989944458, -5.304068565368652, -4.400697708129883, -3.497326374053955, -2.5939552783966064, -1.6905841827392578, -0.7872128486633301, 0.11615800857543945, 1.0195293426513672, 1.9229004383087158, 2.8262715339660645, 3.729642868041992, 4.633013725280762, 5.5363850593566895, 6.439756393432617, 7.343127250671387, 8.246498107910156, 9.149868965148926, 10.053240776062012, 10.956611633300781, 11.85998249053955, 12.76335334777832, 13.666725158691406, 14.570096015930176, 15.473467826843262, 16.37683868408203, 17.280210494995117, 18.183582305908203, 19.086952209472656, 19.990324020385742, 20.893695831298828, 21.79706573486328, 22.700437545776367, 23.603809356689453, 24.507179260253906, 25.410551071166992, 26.313922882080078, 27.21729278564453, 28.120664596557617, 29.024036407470703, 29.927406311035156]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 7.0, 20.0, 32.0, 54.0, 72.0, 121.0, 201.0, 357.0, 547.0, 878.0, 1337.0, 2272.0, 3656.0, 5823.0, 9149.0, 14528.0, 22490.0, 34386.0, 52492.0, 77360.0, 112236.0, 158606.0, 214549.0, 279051.0, 341796.0, 393279.0, 421152.0, 416456.0, 383355.0, 328479.0, 264362.0, 201730.0, 146527.0, 103070.0, 70949.0, 46723.0, 30895.0, 20226.0, 12914.0, 8255.0, 5010.0, 3330.0, 2073.0, 1310.0, 779.0, 512.0, 358.0, 200.0, 142.0, 71.0, 45.0, 24.0, 19.0, 11.0, 5.0, 9.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.612548828125, -16.03759765625, -15.462646484375, -14.8876953125, -14.312744140625, -13.73779296875, -13.162841796875, -12.587890625, -12.012939453125, -11.43798828125, -10.863037109375, -10.2880859375, -9.713134765625, -9.13818359375, -8.563232421875, -7.98828125, -7.413330078125, -6.83837890625, -6.263427734375, -5.6884765625, -5.113525390625, -4.53857421875, -3.963623046875, -3.388671875, -2.813720703125, -2.23876953125, -1.663818359375, -1.0888671875, -0.513916015625, 0.06103515625, 0.635986328125, 1.2109375, 1.785888671875, 2.36083984375, 2.935791015625, 3.5107421875, 4.085693359375, 4.66064453125, 5.235595703125, 5.810546875, 6.385498046875, 6.96044921875, 7.535400390625, 8.1103515625, 8.685302734375, 9.26025390625, 9.835205078125, 10.41015625, 10.985107421875, 11.56005859375, 12.135009765625, 12.7099609375, 13.284912109375, 13.85986328125, 14.434814453125, 15.009765625, 15.584716796875, 16.15966796875, 16.734619140625, 17.3095703125, 17.884521484375, 18.45947265625, 19.034423828125, 19.609375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 4.0, 5.0, 10.0, 9.0, 15.0, 15.0, 17.0, 17.0, 21.0, 19.0, 26.0, 23.0, 29.0, 31.0, 31.0, 29.0, 34.0, 30.0, 37.0, 40.0, 44.0, 44.0, 42.0, 31.0, 33.0, 36.0, 27.0, 36.0, 32.0, 31.0, 20.0, 20.0, 17.0, 18.0, 19.0, 15.0, 13.0, 15.0, 11.0, 11.0, 4.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-21.890625, -21.205322265625, -20.52001953125, -19.834716796875, -19.1494140625, -18.464111328125, -17.77880859375, -17.093505859375, -16.408203125, -15.722900390625, -15.03759765625, -14.352294921875, -13.6669921875, -12.981689453125, -12.29638671875, -11.611083984375, -10.92578125, -10.240478515625, -9.55517578125, -8.869873046875, -8.1845703125, -7.499267578125, -6.81396484375, -6.128662109375, -5.443359375, -4.758056640625, -4.07275390625, -3.387451171875, -2.7021484375, -2.016845703125, -1.33154296875, -0.646240234375, 0.0390625, 0.724365234375, 1.40966796875, 2.094970703125, 2.7802734375, 3.465576171875, 4.15087890625, 4.836181640625, 5.521484375, 6.206787109375, 6.89208984375, 7.577392578125, 8.2626953125, 8.947998046875, 9.63330078125, 10.318603515625, 11.00390625, 11.689208984375, 12.37451171875, 13.059814453125, 13.7451171875, 14.430419921875, 15.11572265625, 15.801025390625, 16.486328125, 17.171630859375, 17.85693359375, 18.542236328125, 19.2275390625, 19.912841796875, 20.59814453125, 21.283447265625, 21.96875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 9.0, 12.0, 15.0, 39.0, 55.0, 101.0, 165.0, 303.0, 489.0, 809.0, 1327.0, 2097.0, 3286.0, 5207.0, 8100.0, 12949.0, 19799.0, 29899.0, 44850.0, 64113.0, 90052.0, 124112.0, 163653.0, 210765.0, 258291.0, 303436.0, 339643.0, 360820.0, 363407.0, 346622.0, 315549.0, 271981.0, 223857.0, 176463.0, 135536.0, 99293.0, 70999.0, 49826.0, 33528.0, 22647.0, 14771.0, 9393.0, 6062.0, 3772.0, 2379.0, 1493.0, 921.0, 590.0, 319.0, 211.0, 124.0, 64.0, 31.0, 28.0, 17.0, 9.0, 0.0, 4.0, 0.0, 2.0, 1.0], "bins": [-16.8125, -16.272705078125, -15.73291015625, -15.193115234375, -14.6533203125, -14.113525390625, -13.57373046875, -13.033935546875, -12.494140625, -11.954345703125, -11.41455078125, -10.874755859375, -10.3349609375, -9.795166015625, -9.25537109375, -8.715576171875, -8.17578125, -7.635986328125, -7.09619140625, -6.556396484375, -6.0166015625, -5.476806640625, -4.93701171875, -4.397216796875, -3.857421875, -3.317626953125, -2.77783203125, -2.238037109375, -1.6982421875, -1.158447265625, -0.61865234375, -0.078857421875, 0.4609375, 1.000732421875, 1.54052734375, 2.080322265625, 2.6201171875, 3.159912109375, 3.69970703125, 4.239501953125, 4.779296875, 5.319091796875, 5.85888671875, 6.398681640625, 6.9384765625, 7.478271484375, 8.01806640625, 8.557861328125, 9.09765625, 9.637451171875, 10.17724609375, 10.717041015625, 11.2568359375, 11.796630859375, 12.33642578125, 12.876220703125, 13.416015625, 13.955810546875, 14.49560546875, 15.035400390625, 15.5751953125, 16.114990234375, 16.65478515625, 17.194580078125, 17.734375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 6.0, 8.0, 18.0, 20.0, 21.0, 21.0, 30.0, 37.0, 44.0, 46.0, 65.0, 86.0, 96.0, 102.0, 111.0, 123.0, 131.0, 173.0, 161.0, 156.0, 162.0, 189.0, 183.0, 196.0, 190.0, 170.0, 157.0, 161.0, 140.0, 148.0, 133.0, 112.0, 107.0, 93.0, 83.0, 65.0, 64.0, 53.0, 43.0, 30.0, 38.0, 27.0, 8.0, 13.0, 13.0, 11.0, 9.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5, -9.1822509765625, -8.864501953125, -8.5467529296875, -8.22900390625, -7.9112548828125, -7.593505859375, -7.2757568359375, -6.9580078125, -6.6402587890625, -6.322509765625, -6.0047607421875, -5.68701171875, -5.3692626953125, -5.051513671875, -4.7337646484375, -4.416015625, -4.0982666015625, -3.780517578125, -3.4627685546875, -3.14501953125, -2.8272705078125, -2.509521484375, -2.1917724609375, -1.8740234375, -1.5562744140625, -1.238525390625, -0.9207763671875, -0.60302734375, -0.2852783203125, 0.032470703125, 0.3502197265625, 0.66796875, 0.9857177734375, 1.303466796875, 1.6212158203125, 1.93896484375, 2.2567138671875, 2.574462890625, 2.8922119140625, 3.2099609375, 3.5277099609375, 3.845458984375, 4.1632080078125, 4.48095703125, 4.7987060546875, 5.116455078125, 5.4342041015625, 5.751953125, 6.0697021484375, 6.387451171875, 6.7052001953125, 7.02294921875, 7.3406982421875, 7.658447265625, 7.9761962890625, 8.2939453125, 8.6116943359375, 8.929443359375, 9.2471923828125, 9.56494140625, 9.8826904296875, 10.200439453125, 10.5181884765625, 10.8359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 4.0, 8.0, 12.0, 8.0, 10.0, 11.0, 16.0, 15.0, 17.0, 23.0, 27.0, 22.0, 31.0, 19.0, 29.0, 40.0, 43.0, 36.0, 41.0, 39.0, 40.0, 36.0, 46.0, 39.0, 44.0, 29.0, 31.0, 35.0, 34.0, 31.0, 22.0, 33.0, 21.0, 21.0, 20.0, 13.0, 7.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-24.885677337646484, -24.141450881958008, -23.39722442626953, -22.652997970581055, -21.908771514892578, -21.164546966552734, -20.420320510864258, -19.67609405517578, -18.931867599487305, -18.187641143798828, -17.44341468811035, -16.699188232421875, -15.954962730407715, -15.210736274719238, -14.466510772705078, -13.722284317016602, -12.978057861328125, -12.233831405639648, -11.489604949951172, -10.745379447937012, -10.001152992248535, -9.256926536560059, -8.512701034545898, -7.768474578857422, -7.024248123168945, -6.280021667480469, -5.53579568862915, -4.791569709777832, -4.0473432540893555, -3.303117036819458, -2.5588908195495605, -1.8146648406982422, -1.0704402923583984, -0.326214075088501, 0.4180121421813965, 1.162238359451294, 1.9064645767211914, 2.650690793991089, 3.3949170112609863, 4.139142990112305, 4.883369445800781, 5.627595901489258, 6.371821880340576, 7.1160478591918945, 7.860274314880371, 8.604500770568848, 9.348726272583008, 10.092952728271484, 10.837179183959961, 11.581405639648438, 12.325632095336914, 13.069857597351074, 13.81408405303955, 14.558310508728027, 15.302536010742188, 16.046762466430664, 16.79098892211914, 17.535215377807617, 18.279441833496094, 19.02366828918457, 19.767894744873047, 20.51211929321289, 21.256345748901367, 22.000572204589844, 22.74479866027832]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 4.0, 8.0, 10.0, 6.0, 12.0, 12.0, 17.0, 22.0, 18.0, 27.0, 24.0, 31.0, 40.0, 37.0, 41.0, 40.0, 45.0, 44.0, 38.0, 56.0, 39.0, 42.0, 37.0, 52.0, 35.0, 27.0, 36.0, 24.0, 29.0, 25.0, 13.0, 17.0, 20.0, 19.0, 11.0, 7.0, 6.0, 7.0, 8.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.845184326171875, -28.89992332458496, -27.954662322998047, -27.009403228759766, -26.06414222717285, -25.118881225585938, -24.173622131347656, -23.228361129760742, -22.283100128173828, -21.337839126586914, -20.392578125, -19.44731903076172, -18.502058029174805, -17.55679702758789, -16.61153793334961, -15.666276931762695, -14.721015930175781, -13.775754928588867, -12.83049488067627, -11.885234832763672, -10.939973831176758, -9.994712829589844, -9.049452781677246, -8.104192733764648, -7.158931732177734, -6.2136712074279785, -5.268410682678223, -4.323150157928467, -3.377889633178711, -2.432629108428955, -1.4873685836791992, -0.5421080589294434, 0.4031505584716797, 1.3484110832214355, 2.2936716079711914, 3.2389321327209473, 4.184192657470703, 5.129453182220459, 6.074713706970215, 7.019974231719971, 7.965234756469727, 8.91049575805664, 9.855755805969238, 10.801015853881836, 11.74627685546875, 12.691537857055664, 13.636797904968262, 14.58205795288086, 15.527318954467773, 16.472579956054688, 17.41783905029297, 18.363100051879883, 19.308361053466797, 20.25362205505371, 21.198883056640625, 22.144142150878906, 23.08940315246582, 24.034664154052734, 24.979923248291016, 25.92518424987793, 26.870445251464844, 27.815706253051758, 28.760967254638672, 29.706226348876953, 30.651487350463867]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 6.0, 3.0, 18.0, 25.0, 46.0, 61.0, 96.0, 184.0, 236.0, 445.0, 716.0, 1236.0, 2059.0, 3433.0, 5691.0, 10141.0, 16951.0, 28811.0, 48876.0, 79691.0, 120908.0, 161937.0, 171184.0, 142873.0, 99081.0, 62303.0, 37302.0, 22294.0, 13095.0, 7795.0, 4425.0, 2707.0, 1545.0, 933.0, 552.0, 362.0, 203.0, 108.0, 80.0, 63.0, 33.0, 13.0, 9.0, 10.0, 5.0, 8.0, 3.0, 1.0, 2.0], "bins": [-7.8203125, -7.6103515625, -7.400390625, -7.1904296875, -6.98046875, -6.7705078125, -6.560546875, -6.3505859375, -6.140625, -5.9306640625, -5.720703125, -5.5107421875, -5.30078125, -5.0908203125, -4.880859375, -4.6708984375, -4.4609375, -4.2509765625, -4.041015625, -3.8310546875, -3.62109375, -3.4111328125, -3.201171875, -2.9912109375, -2.78125, -2.5712890625, -2.361328125, -2.1513671875, -1.94140625, -1.7314453125, -1.521484375, -1.3115234375, -1.1015625, -0.8916015625, -0.681640625, -0.4716796875, -0.26171875, -0.0517578125, 0.158203125, 0.3681640625, 0.578125, 0.7880859375, 0.998046875, 1.2080078125, 1.41796875, 1.6279296875, 1.837890625, 2.0478515625, 2.2578125, 2.4677734375, 2.677734375, 2.8876953125, 3.09765625, 3.3076171875, 3.517578125, 3.7275390625, 3.9375, 4.1474609375, 4.357421875, 4.5673828125, 4.77734375, 4.9873046875, 5.197265625, 5.4072265625, 5.6171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 0.0, 3.0, 2.0, 2.0, 8.0, 3.0, 9.0, 2.0, 13.0, 9.0, 13.0, 20.0, 22.0, 32.0, 22.0, 20.0, 28.0, 23.0, 30.0, 31.0, 35.0, 46.0, 46.0, 33.0, 32.0, 45.0, 29.0, 34.0, 45.0, 29.0, 37.0, 40.0, 30.0, 40.0, 20.0, 17.0, 23.0, 13.0, 23.0, 19.0, 9.0, 16.0, 11.0, 9.0, 5.0, 7.0, 5.0, 3.0, 3.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.625, -24.7568359375, -23.888671875, -23.0205078125, -22.15234375, -21.2841796875, -20.416015625, -19.5478515625, -18.6796875, -17.8115234375, -16.943359375, -16.0751953125, -15.20703125, -14.3388671875, -13.470703125, -12.6025390625, -11.734375, -10.8662109375, -9.998046875, -9.1298828125, -8.26171875, -7.3935546875, -6.525390625, -5.6572265625, -4.7890625, -3.9208984375, -3.052734375, -2.1845703125, -1.31640625, -0.4482421875, 0.419921875, 1.2880859375, 2.15625, 3.0244140625, 3.892578125, 4.7607421875, 5.62890625, 6.4970703125, 7.365234375, 8.2333984375, 9.1015625, 9.9697265625, 10.837890625, 11.7060546875, 12.57421875, 13.4423828125, 14.310546875, 15.1787109375, 16.046875, 16.9150390625, 17.783203125, 18.6513671875, 19.51953125, 20.3876953125, 21.255859375, 22.1240234375, 22.9921875, 23.8603515625, 24.728515625, 25.5966796875, 26.46484375, 27.3330078125, 28.201171875, 29.0693359375, 29.9375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 3.0, 5.0, 9.0, 7.0, 19.0, 22.0, 23.0, 41.0, 43.0, 65.0, 102.0, 169.0, 262.0, 365.0, 659.0, 1075.0, 1895.0, 3358.0, 6311.0, 12221.0, 23844.0, 47006.0, 89536.0, 153941.0, 208116.0, 200316.0, 137327.0, 78069.0, 40196.0, 20482.0, 10571.0, 5362.0, 2936.0, 1541.0, 974.0, 601.0, 333.0, 247.0, 162.0, 106.0, 59.0, 45.0, 42.0, 30.0, 15.0, 11.0, 10.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.93359375, -6.71612548828125, -6.4986572265625, -6.28118896484375, -6.063720703125, -5.84625244140625, -5.6287841796875, -5.41131591796875, -5.19384765625, -4.97637939453125, -4.7589111328125, -4.54144287109375, -4.323974609375, -4.10650634765625, -3.8890380859375, -3.67156982421875, -3.4541015625, -3.23663330078125, -3.0191650390625, -2.80169677734375, -2.584228515625, -2.36676025390625, -2.1492919921875, -1.93182373046875, -1.71435546875, -1.49688720703125, -1.2794189453125, -1.06195068359375, -0.844482421875, -0.62701416015625, -0.4095458984375, -0.19207763671875, 0.025390625, 0.24285888671875, 0.4603271484375, 0.67779541015625, 0.895263671875, 1.11273193359375, 1.3302001953125, 1.54766845703125, 1.76513671875, 1.98260498046875, 2.2000732421875, 2.41754150390625, 2.635009765625, 2.85247802734375, 3.0699462890625, 3.28741455078125, 3.5048828125, 3.72235107421875, 3.9398193359375, 4.15728759765625, 4.374755859375, 4.59222412109375, 4.8096923828125, 5.02716064453125, 5.24462890625, 5.46209716796875, 5.6795654296875, 5.89703369140625, 6.114501953125, 6.33197021484375, 6.5494384765625, 6.76690673828125, 6.984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 6.0, 11.0, 9.0, 16.0, 22.0, 22.0, 29.0, 26.0, 28.0, 26.0, 47.0, 32.0, 33.0, 45.0, 50.0, 36.0, 42.0, 43.0, 62.0, 44.0, 38.0, 39.0, 41.0, 36.0, 28.0, 33.0, 28.0, 25.0, 15.0, 18.0, 13.0, 6.0, 6.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.234375, -20.5869140625, -19.939453125, -19.2919921875, -18.64453125, -17.9970703125, -17.349609375, -16.7021484375, -16.0546875, -15.4072265625, -14.759765625, -14.1123046875, -13.46484375, -12.8173828125, -12.169921875, -11.5224609375, -10.875, -10.2275390625, -9.580078125, -8.9326171875, -8.28515625, -7.6376953125, -6.990234375, -6.3427734375, -5.6953125, -5.0478515625, -4.400390625, -3.7529296875, -3.10546875, -2.4580078125, -1.810546875, -1.1630859375, -0.515625, 0.1318359375, 0.779296875, 1.4267578125, 2.07421875, 2.7216796875, 3.369140625, 4.0166015625, 4.6640625, 5.3115234375, 5.958984375, 6.6064453125, 7.25390625, 7.9013671875, 8.548828125, 9.1962890625, 9.84375, 10.4912109375, 11.138671875, 11.7861328125, 12.43359375, 13.0810546875, 13.728515625, 14.3759765625, 15.0234375, 15.6708984375, 16.318359375, 16.9658203125, 17.61328125, 18.2607421875, 18.908203125, 19.5556640625, 20.203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 1.0, 2.0, 6.0, 10.0, 17.0, 12.0, 21.0, 21.0, 51.0, 63.0, 88.0, 136.0, 243.0, 412.0, 790.0, 1579.0, 3860.0, 10827.0, 39644.0, 193204.0, 531684.0, 205454.0, 41569.0, 11202.0, 4050.0, 1676.0, 825.0, 404.0, 250.0, 145.0, 93.0, 59.0, 51.0, 32.0, 16.0, 11.0, 11.0, 15.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.13671875, -3.037200927734375, -2.93768310546875, -2.838165283203125, -2.7386474609375, -2.639129638671875, -2.53961181640625, -2.440093994140625, -2.340576171875, -2.241058349609375, -2.14154052734375, -2.042022705078125, -1.9425048828125, -1.842987060546875, -1.74346923828125, -1.643951416015625, -1.54443359375, -1.444915771484375, -1.34539794921875, -1.245880126953125, -1.1463623046875, -1.046844482421875, -0.94732666015625, -0.847808837890625, -0.748291015625, -0.648773193359375, -0.54925537109375, -0.449737548828125, -0.3502197265625, -0.250701904296875, -0.15118408203125, -0.051666259765625, 0.0478515625, 0.147369384765625, 0.24688720703125, 0.346405029296875, 0.4459228515625, 0.545440673828125, 0.64495849609375, 0.744476318359375, 0.843994140625, 0.943511962890625, 1.04302978515625, 1.142547607421875, 1.2420654296875, 1.341583251953125, 1.44110107421875, 1.540618896484375, 1.64013671875, 1.739654541015625, 1.83917236328125, 1.938690185546875, 2.0382080078125, 2.137725830078125, 2.23724365234375, 2.336761474609375, 2.436279296875, 2.535797119140625, 2.63531494140625, 2.734832763671875, 2.8343505859375, 2.933868408203125, 3.03338623046875, 3.132904052734375, 3.232421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 15.0, 25.0, 24.0, 34.0, 67.0, 90.0, 94.0, 110.0, 113.0, 94.0, 88.0, 65.0, 42.0, 35.0, 30.0, 10.0, 14.0, 12.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004107952117919922, -0.0004003159701824188, -0.00038983672857284546, -0.0003793574869632721, -0.00036887824535369873, -0.00035839900374412537, -0.000347919762134552, -0.00033744052052497864, -0.0003269612789154053, -0.0003164820373058319, -0.00030600279569625854, -0.0002955235540866852, -0.0002850443124771118, -0.00027456507086753845, -0.0002640858292579651, -0.0002536065876483917, -0.00024312734603881836, -0.000232648104429245, -0.00022216886281967163, -0.00021168962121009827, -0.0002012103796005249, -0.00019073113799095154, -0.00018025189638137817, -0.0001697726547718048, -0.00015929341316223145, -0.00014881417155265808, -0.00013833492994308472, -0.00012785568833351135, -0.00011737644672393799, -0.00010689720511436462, -9.641796350479126e-05, -8.59387218952179e-05, -7.545948028564453e-05, -6.498023867607117e-05, -5.45009970664978e-05, -4.402175545692444e-05, -3.3542513847351074e-05, -2.306327223777771e-05, -1.2584030628204346e-05, -2.1047890186309814e-06, 8.374452590942383e-06, 1.8853694200515747e-05, 2.933293581008911e-05, 3.9812177419662476e-05, 5.029141902923584e-05, 6.0770660638809204e-05, 7.124990224838257e-05, 8.172914385795593e-05, 9.22083854675293e-05, 0.00010268762707710266, 0.00011316686868667603, 0.0001236461102962494, 0.00013412535190582275, 0.00014460459351539612, 0.00015508383512496948, 0.00016556307673454285, 0.0001760423183441162, 0.00018652155995368958, 0.00019700080156326294, 0.0002074800431728363, 0.00021795928478240967, 0.00022843852639198303, 0.0002389177680015564, 0.00024939700961112976, 0.0002598762512207031]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 9.0, 13.0, 13.0, 29.0, 42.0, 66.0, 81.0, 130.0, 196.0, 266.0, 442.0, 623.0, 958.0, 1484.0, 2295.0, 3805.0, 6292.0, 11176.0, 20235.0, 38270.0, 73691.0, 140329.0, 227014.0, 225530.0, 138040.0, 72227.0, 37453.0, 19953.0, 11111.0, 6438.0, 3812.0, 2264.0, 1437.0, 940.0, 626.0, 383.0, 273.0, 188.0, 139.0, 88.0, 65.0, 48.0, 20.0, 16.0, 10.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 3.0], "bins": [-2.939453125, -2.855438232421875, -2.77142333984375, -2.687408447265625, -2.6033935546875, -2.519378662109375, -2.43536376953125, -2.351348876953125, -2.267333984375, -2.183319091796875, -2.09930419921875, -2.015289306640625, -1.9312744140625, -1.847259521484375, -1.76324462890625, -1.679229736328125, -1.59521484375, -1.511199951171875, -1.42718505859375, -1.343170166015625, -1.2591552734375, -1.175140380859375, -1.09112548828125, -1.007110595703125, -0.923095703125, -0.839080810546875, -0.75506591796875, -0.671051025390625, -0.5870361328125, -0.503021240234375, -0.41900634765625, -0.334991455078125, -0.2509765625, -0.166961669921875, -0.08294677734375, 0.001068115234375, 0.0850830078125, 0.169097900390625, 0.25311279296875, 0.337127685546875, 0.421142578125, 0.505157470703125, 0.58917236328125, 0.673187255859375, 0.7572021484375, 0.841217041015625, 0.92523193359375, 1.009246826171875, 1.09326171875, 1.177276611328125, 1.26129150390625, 1.345306396484375, 1.4293212890625, 1.513336181640625, 1.59735107421875, 1.681365966796875, 1.765380859375, 1.849395751953125, 1.93341064453125, 2.017425537109375, 2.1014404296875, 2.185455322265625, 2.26947021484375, 2.353485107421875, 2.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 10.0, 10.0, 13.0, 10.0, 25.0, 23.0, 25.0, 39.0, 44.0, 59.0, 66.0, 61.0, 81.0, 91.0, 93.0, 79.0, 59.0, 44.0, 36.0, 37.0, 24.0, 14.0, 13.0, 11.0, 8.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98828125, -0.9605484008789062, -0.9328155517578125, -0.9050827026367188, -0.877349853515625, -0.8496170043945312, -0.8218841552734375, -0.7941513061523438, -0.76641845703125, -0.7386856079101562, -0.7109527587890625, -0.6832199096679688, -0.655487060546875, -0.6277542114257812, -0.6000213623046875, -0.5722885131835938, -0.5445556640625, -0.5168228149414062, -0.4890899658203125, -0.46135711669921875, -0.433624267578125, -0.40589141845703125, -0.3781585693359375, -0.35042572021484375, -0.32269287109375, -0.29496002197265625, -0.2672271728515625, -0.23949432373046875, -0.211761474609375, -0.18402862548828125, -0.1562957763671875, -0.12856292724609375, -0.100830078125, -0.07309722900390625, -0.0453643798828125, -0.01763153076171875, 0.010101318359375, 0.03783416748046875, 0.0655670166015625, 0.09329986572265625, 0.12103271484375, 0.14876556396484375, 0.1764984130859375, 0.20423126220703125, 0.231964111328125, 0.25969696044921875, 0.2874298095703125, 0.31516265869140625, 0.3428955078125, 0.37062835693359375, 0.3983612060546875, 0.42609405517578125, 0.453826904296875, 0.48155975341796875, 0.5092926025390625, 0.5370254516601562, 0.56475830078125, 0.5924911499023438, 0.6202239990234375, 0.6479568481445312, 0.675689697265625, 0.7034225463867188, 0.7311553955078125, 0.7588882446289062, 0.78662109375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 7.0, 5.0, 8.0, 6.0, 9.0, 8.0, 18.0, 13.0, 15.0, 24.0, 23.0, 19.0, 24.0, 26.0, 25.0, 22.0, 42.0, 37.0, 39.0, 38.0, 38.0, 41.0, 42.0, 31.0, 44.0, 38.0, 36.0, 33.0, 31.0, 35.0, 25.0, 22.0, 27.0, 34.0, 20.0, 20.0, 16.0, 15.0, 4.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-23.547218322753906, -22.82798194885254, -22.108747482299805, -21.389511108398438, -20.670276641845703, -19.951040267944336, -19.23180389404297, -18.512569427490234, -17.793333053588867, -17.0740966796875, -16.354862213134766, -15.635625839233398, -14.916390419006348, -14.197154998779297, -13.47791862487793, -12.758683204650879, -12.039447784423828, -11.320212364196777, -10.600976943969727, -9.88174057006836, -9.162505149841309, -8.443269729614258, -7.724033832550049, -7.00479793548584, -6.285562515258789, -5.566327095031738, -4.847091197967529, -4.12785530090332, -3.4086198806762695, -2.6893842220306396, -1.9701485633850098, -1.2509126663208008, -0.5316753387451172, 0.1875603199005127, 0.9067959785461426, 1.6260316371917725, 2.3452672958374023, 3.0645029544830322, 3.783738613128662, 4.502974510192871, 5.222209930419922, 5.941445350646973, 6.660681247711182, 7.379917144775391, 8.099152565002441, 8.818387985229492, 9.53762435913086, 10.25685977935791, 10.976095199584961, 11.695330619812012, 12.414566040039062, 13.13380241394043, 13.85303783416748, 14.572273254394531, 15.291509628295898, 16.010746002197266, 16.72998046875, 17.449216842651367, 18.1684513092041, 18.88768768310547, 19.606922149658203, 20.32615852355957, 21.045394897460938, 21.764629364013672, 22.48386573791504]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 4.0, 8.0, 9.0, 7.0, 12.0, 14.0, 14.0, 21.0, 21.0, 28.0, 22.0, 32.0, 41.0, 36.0, 44.0, 43.0, 40.0, 44.0, 37.0, 58.0, 43.0, 36.0, 43.0, 53.0, 31.0, 26.0, 32.0, 30.0, 26.0, 24.0, 16.0, 15.0, 19.0, 20.0, 11.0, 6.0, 7.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.58525276184082, -28.641803741455078, -27.698352813720703, -26.75490379333496, -25.811452865600586, -24.868003845214844, -23.92455291748047, -22.981103897094727, -22.037654876708984, -21.094205856323242, -20.150754928588867, -19.207305908203125, -18.26385498046875, -17.320405960083008, -16.376956939697266, -15.43350601196289, -14.490055084228516, -13.546605110168457, -12.603155136108398, -11.659706115722656, -10.716255187988281, -9.772806167602539, -8.82935619354248, -7.885906219482422, -6.942456245422363, -5.999006271362305, -5.055556297302246, -4.112106800079346, -3.168656826019287, -2.2252068519592285, -1.2817573547363281, -0.33830738067626953, 0.6051425933837891, 1.548592448234558, 2.492042303085327, 3.4354920387268066, 4.378942012786865, 5.322391986846924, 6.265841484069824, 7.209291458129883, 8.152741432189941, 9.09619140625, 10.039641380310059, 10.983091354370117, 11.92654037475586, 12.869991302490234, 13.813440322875977, 14.756890296936035, 15.700340270996094, 16.643789291381836, 17.58724021911621, 18.530689239501953, 19.474140167236328, 20.41758918762207, 21.361038208007812, 22.304489135742188, 23.247940063476562, 24.191389083862305, 25.13484001159668, 26.078289031982422, 27.021739959716797, 27.96518898010254, 28.90863800048828, 29.852088928222656, 30.7955379486084]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 10.0, 18.0, 15.0, 41.0, 57.0, 102.0, 214.0, 274.0, 429.0, 751.0, 1201.0, 1991.0, 3276.0, 5420.0, 8815.0, 14084.0, 21658.0, 33132.0, 47647.0, 65085.0, 84587.0, 101405.0, 113039.0, 114678.0, 105812.0, 91043.0, 71973.0, 54366.0, 38100.0, 25539.0, 16442.0, 10565.0, 6345.0, 4000.0, 2556.0, 1524.0, 938.0, 601.0, 341.0, 179.0, 128.0, 73.0, 36.0, 26.0, 19.0, 12.0, 1.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0], "bins": [-21.734375, -21.0986328125, -20.462890625, -19.8271484375, -19.19140625, -18.5556640625, -17.919921875, -17.2841796875, -16.6484375, -16.0126953125, -15.376953125, -14.7412109375, -14.10546875, -13.4697265625, -12.833984375, -12.1982421875, -11.5625, -10.9267578125, -10.291015625, -9.6552734375, -9.01953125, -8.3837890625, -7.748046875, -7.1123046875, -6.4765625, -5.8408203125, -5.205078125, -4.5693359375, -3.93359375, -3.2978515625, -2.662109375, -2.0263671875, -1.390625, -0.7548828125, -0.119140625, 0.5166015625, 1.15234375, 1.7880859375, 2.423828125, 3.0595703125, 3.6953125, 4.3310546875, 4.966796875, 5.6025390625, 6.23828125, 6.8740234375, 7.509765625, 8.1455078125, 8.78125, 9.4169921875, 10.052734375, 10.6884765625, 11.32421875, 11.9599609375, 12.595703125, 13.2314453125, 13.8671875, 14.5029296875, 15.138671875, 15.7744140625, 16.41015625, 17.0458984375, 17.681640625, 18.3173828125, 18.953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 9.0, 18.0, 18.0, 12.0, 9.0, 23.0, 19.0, 19.0, 28.0, 36.0, 40.0, 37.0, 25.0, 36.0, 45.0, 51.0, 37.0, 50.0, 41.0, 25.0, 43.0, 41.0, 40.0, 28.0, 27.0, 30.0, 29.0, 15.0, 22.0, 16.0, 12.0, 16.0, 19.0, 17.0, 9.0, 10.0, 4.0, 6.0, 5.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.453125, -25.58984375, -24.7265625, -23.86328125, -23.0, -22.13671875, -21.2734375, -20.41015625, -19.546875, -18.68359375, -17.8203125, -16.95703125, -16.09375, -15.23046875, -14.3671875, -13.50390625, -12.640625, -11.77734375, -10.9140625, -10.05078125, -9.1875, -8.32421875, -7.4609375, -6.59765625, -5.734375, -4.87109375, -4.0078125, -3.14453125, -2.28125, -1.41796875, -0.5546875, 0.30859375, 1.171875, 2.03515625, 2.8984375, 3.76171875, 4.625, 5.48828125, 6.3515625, 7.21484375, 8.078125, 8.94140625, 9.8046875, 10.66796875, 11.53125, 12.39453125, 13.2578125, 14.12109375, 14.984375, 15.84765625, 16.7109375, 17.57421875, 18.4375, 19.30078125, 20.1640625, 21.02734375, 21.890625, 22.75390625, 23.6171875, 24.48046875, 25.34375, 26.20703125, 27.0703125, 27.93359375, 28.796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 8.0, 11.0, 27.0, 25.0, 54.0, 70.0, 109.0, 226.0, 324.0, 528.0, 806.0, 1226.0, 1911.0, 2860.0, 4433.0, 6593.0, 9868.0, 14124.0, 20458.0, 28078.0, 38341.0, 50001.0, 62749.0, 75518.0, 85992.0, 92505.0, 94516.0, 90239.0, 81868.0, 70094.0, 57619.0, 44811.0, 33587.0, 24726.0, 17639.0, 12136.0, 8397.0, 5626.0, 3655.0, 2395.0, 1559.0, 1040.0, 681.0, 414.0, 271.0, 161.0, 107.0, 67.0, 39.0, 23.0, 12.0, 14.0, 6.0, 9.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.046875, -15.51708984375, -14.9873046875, -14.45751953125, -13.927734375, -13.39794921875, -12.8681640625, -12.33837890625, -11.80859375, -11.27880859375, -10.7490234375, -10.21923828125, -9.689453125, -9.15966796875, -8.6298828125, -8.10009765625, -7.5703125, -7.04052734375, -6.5107421875, -5.98095703125, -5.451171875, -4.92138671875, -4.3916015625, -3.86181640625, -3.33203125, -2.80224609375, -2.2724609375, -1.74267578125, -1.212890625, -0.68310546875, -0.1533203125, 0.37646484375, 0.90625, 1.43603515625, 1.9658203125, 2.49560546875, 3.025390625, 3.55517578125, 4.0849609375, 4.61474609375, 5.14453125, 5.67431640625, 6.2041015625, 6.73388671875, 7.263671875, 7.79345703125, 8.3232421875, 8.85302734375, 9.3828125, 9.91259765625, 10.4423828125, 10.97216796875, 11.501953125, 12.03173828125, 12.5615234375, 13.09130859375, 13.62109375, 14.15087890625, 14.6806640625, 15.21044921875, 15.740234375, 16.27001953125, 16.7998046875, 17.32958984375, 17.859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 6.0, 3.0, 6.0, 3.0, 8.0, 11.0, 7.0, 7.0, 17.0, 15.0, 12.0, 12.0, 18.0, 19.0, 31.0, 28.0, 17.0, 27.0, 30.0, 52.0, 36.0, 29.0, 41.0, 34.0, 34.0, 39.0, 33.0, 33.0, 30.0, 32.0, 29.0, 32.0, 23.0, 31.0, 31.0, 21.0, 27.0, 21.0, 20.0, 17.0, 20.0, 14.0, 9.0, 5.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.2109375, -13.7237548828125, -13.236572265625, -12.7493896484375, -12.26220703125, -11.7750244140625, -11.287841796875, -10.8006591796875, -10.3134765625, -9.8262939453125, -9.339111328125, -8.8519287109375, -8.36474609375, -7.8775634765625, -7.390380859375, -6.9031982421875, -6.416015625, -5.9288330078125, -5.441650390625, -4.9544677734375, -4.46728515625, -3.9801025390625, -3.492919921875, -3.0057373046875, -2.5185546875, -2.0313720703125, -1.544189453125, -1.0570068359375, -0.56982421875, -0.0826416015625, 0.404541015625, 0.8917236328125, 1.37890625, 1.8660888671875, 2.353271484375, 2.8404541015625, 3.32763671875, 3.8148193359375, 4.302001953125, 4.7891845703125, 5.2763671875, 5.7635498046875, 6.250732421875, 6.7379150390625, 7.22509765625, 7.7122802734375, 8.199462890625, 8.6866455078125, 9.173828125, 9.6610107421875, 10.148193359375, 10.6353759765625, 11.12255859375, 11.6097412109375, 12.096923828125, 12.5841064453125, 13.0712890625, 13.5584716796875, 14.045654296875, 14.5328369140625, 15.02001953125, 15.5072021484375, 15.994384765625, 16.4815673828125, 16.96875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 2.0, 11.0, 15.0, 15.0, 23.0, 21.0, 42.0, 43.0, 68.0, 115.0, 173.0, 270.0, 383.0, 622.0, 989.0, 1529.0, 2431.0, 3876.0, 6316.0, 10211.0, 16339.0, 25581.0, 39117.0, 57199.0, 78405.0, 99622.0, 117047.0, 123452.0, 117505.0, 100895.0, 79236.0, 57337.0, 39648.0, 25832.0, 16662.0, 10224.0, 6470.0, 4072.0, 2408.0, 1490.0, 1009.0, 601.0, 409.0, 257.0, 181.0, 115.0, 82.0, 69.0, 46.0, 29.0, 19.0, 11.0, 8.0, 7.0, 4.0, 9.0, 2.0, 1.0], "bins": [-8.125, -7.882568359375, -7.64013671875, -7.397705078125, -7.1552734375, -6.912841796875, -6.67041015625, -6.427978515625, -6.185546875, -5.943115234375, -5.70068359375, -5.458251953125, -5.2158203125, -4.973388671875, -4.73095703125, -4.488525390625, -4.24609375, -4.003662109375, -3.76123046875, -3.518798828125, -3.2763671875, -3.033935546875, -2.79150390625, -2.549072265625, -2.306640625, -2.064208984375, -1.82177734375, -1.579345703125, -1.3369140625, -1.094482421875, -0.85205078125, -0.609619140625, -0.3671875, -0.124755859375, 0.11767578125, 0.360107421875, 0.6025390625, 0.844970703125, 1.08740234375, 1.329833984375, 1.572265625, 1.814697265625, 2.05712890625, 2.299560546875, 2.5419921875, 2.784423828125, 3.02685546875, 3.269287109375, 3.51171875, 3.754150390625, 3.99658203125, 4.239013671875, 4.4814453125, 4.723876953125, 4.96630859375, 5.208740234375, 5.451171875, 5.693603515625, 5.93603515625, 6.178466796875, 6.4208984375, 6.663330078125, 6.90576171875, 7.148193359375, 7.390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 9.0, 7.0, 8.0, 17.0, 23.0, 14.0, 33.0, 28.0, 43.0, 49.0, 72.0, 80.0, 71.0, 66.0, 59.0, 67.0, 56.0, 53.0, 45.0, 36.0, 36.0, 26.0, 25.0, 18.0, 12.0, 19.0, 8.0, 2.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008840560913085938, -0.0008467435836791992, -0.0008094310760498047, -0.0007721185684204102, -0.0007348060607910156, -0.0006974935531616211, -0.0006601810455322266, -0.000622868537902832, -0.0005855560302734375, -0.000548243522644043, -0.0005109310150146484, -0.0004736185073852539, -0.0004363059997558594, -0.00039899349212646484, -0.0003616809844970703, -0.0003243684768676758, -0.00028705596923828125, -0.0002497434616088867, -0.0002124309539794922, -0.00017511844635009766, -0.00013780593872070312, -0.0001004934310913086, -6.318092346191406e-05, -2.586841583251953e-05, 1.1444091796875e-05, 4.875659942626953e-05, 8.606910705566406e-05, 0.0001233816146850586, 0.00016069412231445312, 0.00019800662994384766, 0.0002353191375732422, 0.0002726316452026367, 0.00030994415283203125, 0.0003472566604614258, 0.0003845691680908203, 0.00042188167572021484, 0.0004591941833496094, 0.0004965066909790039, 0.0005338191986083984, 0.000571131706237793, 0.0006084442138671875, 0.000645756721496582, 0.0006830692291259766, 0.0007203817367553711, 0.0007576942443847656, 0.0007950067520141602, 0.0008323192596435547, 0.0008696317672729492, 0.0009069442749023438, 0.0009442567825317383, 0.0009815692901611328, 0.0010188817977905273, 0.0010561943054199219, 0.0010935068130493164, 0.001130819320678711, 0.0011681318283081055, 0.0012054443359375, 0.0012427568435668945, 0.001280069351196289, 0.0013173818588256836, 0.0013546943664550781, 0.0013920068740844727, 0.0014293193817138672, 0.0014666318893432617, 0.0015039443969726562]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 10.0, 15.0, 26.0, 27.0, 34.0, 66.0, 81.0, 150.0, 199.0, 273.0, 455.0, 721.0, 1215.0, 1933.0, 3200.0, 5299.0, 9161.0, 15339.0, 26066.0, 42594.0, 66816.0, 96629.0, 125678.0, 143694.0, 140582.0, 119615.0, 90039.0, 61956.0, 38789.0, 23498.0, 14228.0, 8096.0, 4638.0, 2783.0, 1660.0, 1064.0, 673.0, 416.0, 265.0, 199.0, 130.0, 86.0, 51.0, 37.0, 19.0, 21.0, 11.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.8046875, -8.5, -8.1953125, -7.890625, -7.5859375, -7.28125, -6.9765625, -6.671875, -6.3671875, -6.0625, -5.7578125, -5.453125, -5.1484375, -4.84375, -4.5390625, -4.234375, -3.9296875, -3.625, -3.3203125, -3.015625, -2.7109375, -2.40625, -2.1015625, -1.796875, -1.4921875, -1.1875, -0.8828125, -0.578125, -0.2734375, 0.03125, 0.3359375, 0.640625, 0.9453125, 1.25, 1.5546875, 1.859375, 2.1640625, 2.46875, 2.7734375, 3.078125, 3.3828125, 3.6875, 3.9921875, 4.296875, 4.6015625, 4.90625, 5.2109375, 5.515625, 5.8203125, 6.125, 6.4296875, 6.734375, 7.0390625, 7.34375, 7.6484375, 7.953125, 8.2578125, 8.5625, 8.8671875, 9.171875, 9.4765625, 9.78125, 10.0859375, 10.390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 5.0, 11.0, 9.0, 17.0, 11.0, 26.0, 14.0, 31.0, 32.0, 38.0, 48.0, 66.0, 49.0, 49.0, 43.0, 55.0, 62.0, 48.0, 45.0, 57.0, 44.0, 47.0, 36.0, 35.0, 22.0, 26.0, 20.0, 9.0, 11.0, 4.0, 5.0, 9.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.34375, -4.22564697265625, -4.1075439453125, -3.98944091796875, -3.871337890625, -3.75323486328125, -3.6351318359375, -3.51702880859375, -3.39892578125, -3.28082275390625, -3.1627197265625, -3.04461669921875, -2.926513671875, -2.80841064453125, -2.6903076171875, -2.57220458984375, -2.4541015625, -2.33599853515625, -2.2178955078125, -2.09979248046875, -1.981689453125, -1.86358642578125, -1.7454833984375, -1.62738037109375, -1.50927734375, -1.39117431640625, -1.2730712890625, -1.15496826171875, -1.036865234375, -0.91876220703125, -0.8006591796875, -0.68255615234375, -0.564453125, -0.44635009765625, -0.3282470703125, -0.21014404296875, -0.092041015625, 0.02606201171875, 0.1441650390625, 0.26226806640625, 0.38037109375, 0.49847412109375, 0.6165771484375, 0.73468017578125, 0.852783203125, 0.97088623046875, 1.0889892578125, 1.20709228515625, 1.3251953125, 1.44329833984375, 1.5614013671875, 1.67950439453125, 1.797607421875, 1.91571044921875, 2.0338134765625, 2.15191650390625, 2.27001953125, 2.38812255859375, 2.5062255859375, 2.62432861328125, 2.742431640625, 2.86053466796875, 2.9786376953125, 3.09674072265625, 3.21484375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 10.0, 4.0, 8.0, 16.0, 29.0, 16.0, 19.0, 16.0, 22.0, 28.0, 25.0, 26.0, 29.0, 42.0, 30.0, 33.0, 34.0, 44.0, 38.0, 40.0, 35.0, 38.0, 37.0, 39.0, 40.0, 24.0, 31.0, 29.0, 34.0, 24.0, 23.0, 29.0, 18.0, 10.0, 14.0, 8.0, 3.0, 8.0, 4.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-22.8902530670166, -22.200899124145508, -21.511545181274414, -20.82219123840332, -20.13283920288086, -19.443485260009766, -18.754131317138672, -18.064777374267578, -17.375423431396484, -16.68606948852539, -15.996715545654297, -15.30736255645752, -14.618008613586426, -13.928654670715332, -13.239301681518555, -12.549947738647461, -11.860593795776367, -11.171239852905273, -10.48188591003418, -9.792532920837402, -9.103178977966309, -8.413825035095215, -7.724471569061279, -7.035118103027344, -6.34576416015625, -5.656410217285156, -4.967056751251221, -4.277703285217285, -3.5883493423461914, -2.8989956378936768, -2.209641933441162, -1.5202884674072266, -0.8309345245361328, -0.14158082008361816, 0.5477728843688965, 1.2371265888214111, 1.9264802932739258, 2.6158339977264404, 3.305187702178955, 3.9945411682128906, 4.683895111083984, 5.373249053955078, 6.062602519989014, 6.751955986022949, 7.441309928894043, 8.130663871765137, 8.820016860961914, 9.509370803833008, 10.198724746704102, 10.888078689575195, 11.577432632446289, 12.266785621643066, 12.95613956451416, 13.645493507385254, 14.334846496582031, 15.024200439453125, 15.713554382324219, 16.402908325195312, 17.092262268066406, 17.7816162109375, 18.470970153808594, 19.160322189331055, 19.84967613220215, 20.539030075073242, 21.228384017944336]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 11.0, 12.0, 21.0, 16.0, 17.0, 31.0, 26.0, 26.0, 27.0, 30.0, 37.0, 32.0, 43.0, 47.0, 36.0, 31.0, 45.0, 47.0, 42.0, 44.0, 38.0, 31.0, 33.0, 18.0, 34.0, 26.0, 22.0, 21.0, 19.0, 15.0, 13.0, 12.0, 15.0, 12.0, 8.0, 9.0, 5.0, 6.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-30.595733642578125, -29.736892700195312, -28.8780517578125, -28.019210815429688, -27.160369873046875, -26.301528930664062, -25.44268798828125, -24.583847045898438, -23.725006103515625, -22.866165161132812, -22.00732421875, -21.148483276367188, -20.289642333984375, -19.430801391601562, -18.57196044921875, -17.713119506835938, -16.854278564453125, -15.995437622070312, -15.1365966796875, -14.277755737304688, -13.418914794921875, -12.560073852539062, -11.70123291015625, -10.842391967773438, -9.983551025390625, -9.124710083007812, -8.265869140625, -7.4070281982421875, -6.548187255859375, -5.6893463134765625, -4.83050537109375, -3.9716644287109375, -3.112823486328125, -2.2539825439453125, -1.3951416015625, -0.5363006591796875, 0.322540283203125, 1.1813812255859375, 2.04022216796875, 2.8990631103515625, 3.757904052734375, 4.6167449951171875, 5.4755859375, 6.3344268798828125, 7.193267822265625, 8.052108764648438, 8.91094970703125, 9.769790649414062, 10.628631591796875, 11.487472534179688, 12.3463134765625, 13.205154418945312, 14.063995361328125, 14.922836303710938, 15.78167724609375, 16.640518188476562, 17.499359130859375, 18.358200073242188, 19.217041015625, 20.075881958007812, 20.934722900390625, 21.793563842773438, 22.65240478515625, 23.511245727539062, 24.370086669921875]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 10.0, 15.0, 33.0, 33.0, 77.0, 147.0, 239.0, 410.0, 649.0, 1063.0, 1868.0, 2885.0, 4752.0, 7914.0, 12451.0, 19532.0, 30798.0, 46988.0, 70468.0, 103378.0, 145481.0, 198156.0, 258777.0, 320152.0, 374160.0, 407017.0, 413474.0, 392121.0, 345617.0, 285899.0, 223631.0, 166955.0, 119418.0, 82533.0, 55579.0, 37260.0, 23688.0, 15344.0, 9569.0, 6137.0, 3704.0, 2300.0, 1388.0, 870.0, 541.0, 329.0, 200.0, 124.0, 60.0, 45.0, 25.0, 13.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.453125, -16.89404296875, -16.3349609375, -15.77587890625, -15.216796875, -14.65771484375, -14.0986328125, -13.53955078125, -12.98046875, -12.42138671875, -11.8623046875, -11.30322265625, -10.744140625, -10.18505859375, -9.6259765625, -9.06689453125, -8.5078125, -7.94873046875, -7.3896484375, -6.83056640625, -6.271484375, -5.71240234375, -5.1533203125, -4.59423828125, -4.03515625, -3.47607421875, -2.9169921875, -2.35791015625, -1.798828125, -1.23974609375, -0.6806640625, -0.12158203125, 0.4375, 0.99658203125, 1.5556640625, 2.11474609375, 2.673828125, 3.23291015625, 3.7919921875, 4.35107421875, 4.91015625, 5.46923828125, 6.0283203125, 6.58740234375, 7.146484375, 7.70556640625, 8.2646484375, 8.82373046875, 9.3828125, 9.94189453125, 10.5009765625, 11.06005859375, 11.619140625, 12.17822265625, 12.7373046875, 13.29638671875, 13.85546875, 14.41455078125, 14.9736328125, 15.53271484375, 16.091796875, 16.65087890625, 17.2099609375, 17.76904296875, 18.328125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 7.0, 3.0, 0.0, 13.0, 12.0, 17.0, 15.0, 15.0, 21.0, 17.0, 31.0, 31.0, 35.0, 28.0, 34.0, 42.0, 38.0, 51.0, 40.0, 44.0, 51.0, 43.0, 39.0, 42.0, 48.0, 37.0, 35.0, 22.0, 23.0, 23.0, 27.0, 22.0, 15.0, 8.0, 9.0, 16.0, 12.0, 13.0, 5.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.375, -24.631591796875, -23.88818359375, -23.144775390625, -22.4013671875, -21.657958984375, -20.91455078125, -20.171142578125, -19.427734375, -18.684326171875, -17.94091796875, -17.197509765625, -16.4541015625, -15.710693359375, -14.96728515625, -14.223876953125, -13.48046875, -12.737060546875, -11.99365234375, -11.250244140625, -10.5068359375, -9.763427734375, -9.02001953125, -8.276611328125, -7.533203125, -6.789794921875, -6.04638671875, -5.302978515625, -4.5595703125, -3.816162109375, -3.07275390625, -2.329345703125, -1.5859375, -0.842529296875, -0.09912109375, 0.644287109375, 1.3876953125, 2.131103515625, 2.87451171875, 3.617919921875, 4.361328125, 5.104736328125, 5.84814453125, 6.591552734375, 7.3349609375, 8.078369140625, 8.82177734375, 9.565185546875, 10.30859375, 11.052001953125, 11.79541015625, 12.538818359375, 13.2822265625, 14.025634765625, 14.76904296875, 15.512451171875, 16.255859375, 16.999267578125, 17.74267578125, 18.486083984375, 19.2294921875, 19.972900390625, 20.71630859375, 21.459716796875, 22.203125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 8.0, 8.0, 9.0, 27.0, 32.0, 48.0, 97.0, 167.0, 277.0, 451.0, 702.0, 1195.0, 1954.0, 3066.0, 5116.0, 8076.0, 12138.0, 18792.0, 28054.0, 41098.0, 60693.0, 83926.0, 116178.0, 153474.0, 196726.0, 242176.0, 286282.0, 321213.0, 346613.0, 355392.0, 345181.0, 320176.0, 283002.0, 239975.0, 194712.0, 151090.0, 114010.0, 83248.0, 59130.0, 41418.0, 27693.0, 18474.0, 11953.0, 7737.0, 4736.0, 3008.0, 1952.0, 1118.0, 662.0, 399.0, 243.0, 171.0, 84.0, 49.0, 45.0, 17.0, 13.0, 7.0, 1.0, 3.0, 3.0, 2.0], "bins": [-16.390625, -15.869873046875, -15.34912109375, -14.828369140625, -14.3076171875, -13.786865234375, -13.26611328125, -12.745361328125, -12.224609375, -11.703857421875, -11.18310546875, -10.662353515625, -10.1416015625, -9.620849609375, -9.10009765625, -8.579345703125, -8.05859375, -7.537841796875, -7.01708984375, -6.496337890625, -5.9755859375, -5.454833984375, -4.93408203125, -4.413330078125, -3.892578125, -3.371826171875, -2.85107421875, -2.330322265625, -1.8095703125, -1.288818359375, -0.76806640625, -0.247314453125, 0.2734375, 0.794189453125, 1.31494140625, 1.835693359375, 2.3564453125, 2.877197265625, 3.39794921875, 3.918701171875, 4.439453125, 4.960205078125, 5.48095703125, 6.001708984375, 6.5224609375, 7.043212890625, 7.56396484375, 8.084716796875, 8.60546875, 9.126220703125, 9.64697265625, 10.167724609375, 10.6884765625, 11.209228515625, 11.72998046875, 12.250732421875, 12.771484375, 13.292236328125, 13.81298828125, 14.333740234375, 14.8544921875, 15.375244140625, 15.89599609375, 16.416748046875, 16.9375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 4.0, 5.0, 7.0, 11.0, 12.0, 19.0, 21.0, 20.0, 37.0, 39.0, 53.0, 59.0, 70.0, 85.0, 83.0, 122.0, 111.0, 142.0, 159.0, 171.0, 189.0, 191.0, 183.0, 179.0, 206.0, 195.0, 205.0, 156.0, 168.0, 190.0, 154.0, 128.0, 109.0, 98.0, 65.0, 58.0, 67.0, 59.0, 54.0, 40.0, 33.0, 26.0, 23.0, 21.0, 7.0, 12.0, 5.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-9.859375, -9.541015625, -9.22265625, -8.904296875, -8.5859375, -8.267578125, -7.94921875, -7.630859375, -7.3125, -6.994140625, -6.67578125, -6.357421875, -6.0390625, -5.720703125, -5.40234375, -5.083984375, -4.765625, -4.447265625, -4.12890625, -3.810546875, -3.4921875, -3.173828125, -2.85546875, -2.537109375, -2.21875, -1.900390625, -1.58203125, -1.263671875, -0.9453125, -0.626953125, -0.30859375, 0.009765625, 0.328125, 0.646484375, 0.96484375, 1.283203125, 1.6015625, 1.919921875, 2.23828125, 2.556640625, 2.875, 3.193359375, 3.51171875, 3.830078125, 4.1484375, 4.466796875, 4.78515625, 5.103515625, 5.421875, 5.740234375, 6.05859375, 6.376953125, 6.6953125, 7.013671875, 7.33203125, 7.650390625, 7.96875, 8.287109375, 8.60546875, 8.923828125, 9.2421875, 9.560546875, 9.87890625, 10.197265625, 10.515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 7.0, 8.0, 8.0, 11.0, 10.0, 16.0, 17.0, 21.0, 18.0, 21.0, 17.0, 20.0, 32.0, 33.0, 27.0, 35.0, 31.0, 41.0, 52.0, 40.0, 43.0, 31.0, 43.0, 41.0, 55.0, 41.0, 50.0, 26.0, 25.0, 28.0, 38.0, 27.0, 14.0, 17.0, 13.0, 13.0, 8.0, 4.0, 1.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.20938491821289, -23.411296844482422, -22.613208770751953, -21.81511878967285, -21.017030715942383, -20.218942642211914, -19.420852661132812, -18.622764587402344, -17.824676513671875, -17.026588439941406, -16.228500366210938, -15.430410385131836, -14.632322311401367, -13.834234237670898, -13.036145210266113, -12.238056182861328, -11.43996810913086, -10.64188003540039, -9.843791007995605, -9.04570198059082, -8.247613906860352, -7.449525356292725, -6.651436805725098, -5.853348255157471, -5.055259704589844, -4.257171154022217, -3.45908260345459, -2.660994052886963, -1.862905502319336, -1.064816951751709, -0.26672840118408203, 0.5313601493835449, 1.329446792602539, 2.127535343170166, 2.925623893737793, 3.72371244430542, 4.521800994873047, 5.319889545440674, 6.117978096008301, 6.916066646575928, 7.714155197143555, 8.512243270874023, 9.310332298278809, 10.108421325683594, 10.906509399414062, 11.704597473144531, 12.502686500549316, 13.300775527954102, 14.09886360168457, 14.896951675415039, 15.695040702819824, 16.49312973022461, 17.291217803955078, 18.089305877685547, 18.887393951416016, 19.685483932495117, 20.483572006225586, 21.281660079956055, 22.079750061035156, 22.877838134765625, 23.675926208496094, 24.474014282226562, 25.27210235595703, 26.070192337036133, 26.8682804107666]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1.0, 8.0, 6.0, 10.0, 5.0, 10.0, 10.0, 10.0, 11.0, 21.0, 12.0, 29.0, 34.0, 24.0, 30.0, 36.0, 47.0, 35.0, 48.0, 54.0, 36.0, 32.0, 29.0, 48.0, 38.0, 35.0, 32.0, 38.0, 33.0, 32.0, 31.0, 26.0, 26.0, 18.0, 11.0, 12.0, 14.0, 12.0, 11.0, 12.0, 7.0, 11.0, 4.0, 6.0, 2.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-26.185714721679688, -25.343616485595703, -24.501516342163086, -23.65941619873047, -22.817317962646484, -21.9752197265625, -21.133119583129883, -20.291019439697266, -19.44892120361328, -18.606822967529297, -17.76472282409668, -16.922622680664062, -16.080524444580078, -15.238425254821777, -14.396326065063477, -13.554226875305176, -12.712127685546875, -11.870028495788574, -11.027929306030273, -10.185830116271973, -9.343730926513672, -8.501631736755371, -7.65953254699707, -6.8174333572387695, -5.975334167480469, -5.133234977722168, -4.291135787963867, -3.4490365982055664, -2.6069374084472656, -1.7648382186889648, -0.9227390289306641, -0.08063983917236328, 0.7614574432373047, 1.6035566329956055, 2.4456558227539062, 3.287755012512207, 4.129854202270508, 4.971953392028809, 5.814052581787109, 6.65615177154541, 7.498250961303711, 8.340350151062012, 9.182449340820312, 10.024548530578613, 10.866647720336914, 11.708746910095215, 12.550846099853516, 13.392945289611816, 14.235044479370117, 15.077143669128418, 15.919242858886719, 16.761341094970703, 17.60344123840332, 18.445541381835938, 19.287639617919922, 20.129737854003906, 20.971837997436523, 21.81393814086914, 22.656036376953125, 23.49813461303711, 24.340234756469727, 25.182334899902344, 26.024433135986328, 26.866531372070312, 27.70863151550293]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 9.0, 8.0, 11.0, 14.0, 24.0, 33.0, 48.0, 65.0, 83.0, 136.0, 205.0, 292.0, 363.0, 588.0, 784.0, 1207.0, 1843.0, 2950.0, 4857.0, 8807.0, 15969.0, 31044.0, 62481.0, 121256.0, 203566.0, 234310.0, 167236.0, 91776.0, 45669.0, 23043.0, 12088.0, 6621.0, 3868.0, 2391.0, 1548.0, 1023.0, 701.0, 519.0, 348.0, 239.0, 177.0, 99.0, 83.0, 57.0, 36.0, 26.0, 17.0, 15.0, 15.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.67578125, -7.40435791015625, -7.1329345703125, -6.86151123046875, -6.590087890625, -6.31866455078125, -6.0472412109375, -5.77581787109375, -5.50439453125, -5.23297119140625, -4.9615478515625, -4.69012451171875, -4.418701171875, -4.14727783203125, -3.8758544921875, -3.60443115234375, -3.3330078125, -3.06158447265625, -2.7901611328125, -2.51873779296875, -2.247314453125, -1.97589111328125, -1.7044677734375, -1.43304443359375, -1.16162109375, -0.89019775390625, -0.6187744140625, -0.34735107421875, -0.075927734375, 0.19549560546875, 0.4669189453125, 0.73834228515625, 1.009765625, 1.28118896484375, 1.5526123046875, 1.82403564453125, 2.095458984375, 2.36688232421875, 2.6383056640625, 2.90972900390625, 3.18115234375, 3.45257568359375, 3.7239990234375, 3.99542236328125, 4.266845703125, 4.53826904296875, 4.8096923828125, 5.08111572265625, 5.3525390625, 5.62396240234375, 5.8953857421875, 6.16680908203125, 6.438232421875, 6.70965576171875, 6.9810791015625, 7.25250244140625, 7.52392578125, 7.79534912109375, 8.0667724609375, 8.33819580078125, 8.609619140625, 8.88104248046875, 9.1524658203125, 9.42388916015625, 9.6953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 3.0, 10.0, 10.0, 4.0, 10.0, 14.0, 8.0, 13.0, 10.0, 23.0, 31.0, 25.0, 35.0, 46.0, 36.0, 34.0, 35.0, 39.0, 37.0, 50.0, 43.0, 33.0, 52.0, 43.0, 29.0, 40.0, 33.0, 24.0, 28.0, 27.0, 17.0, 24.0, 22.0, 16.0, 17.0, 16.0, 12.0, 11.0, 10.0, 8.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.703125, -25.81396484375, -24.9248046875, -24.03564453125, -23.146484375, -22.25732421875, -21.3681640625, -20.47900390625, -19.58984375, -18.70068359375, -17.8115234375, -16.92236328125, -16.033203125, -15.14404296875, -14.2548828125, -13.36572265625, -12.4765625, -11.58740234375, -10.6982421875, -9.80908203125, -8.919921875, -8.03076171875, -7.1416015625, -6.25244140625, -5.36328125, -4.47412109375, -3.5849609375, -2.69580078125, -1.806640625, -0.91748046875, -0.0283203125, 0.86083984375, 1.75, 2.63916015625, 3.5283203125, 4.41748046875, 5.306640625, 6.19580078125, 7.0849609375, 7.97412109375, 8.86328125, 9.75244140625, 10.6416015625, 11.53076171875, 12.419921875, 13.30908203125, 14.1982421875, 15.08740234375, 15.9765625, 16.86572265625, 17.7548828125, 18.64404296875, 19.533203125, 20.42236328125, 21.3115234375, 22.20068359375, 23.08984375, 23.97900390625, 24.8681640625, 25.75732421875, 26.646484375, 27.53564453125, 28.4248046875, 29.31396484375, 30.203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 8.0, 7.0, 5.0, 6.0, 15.0, 22.0, 38.0, 44.0, 66.0, 108.0, 139.0, 235.0, 337.0, 709.0, 1272.0, 2683.0, 5841.0, 14309.0, 37961.0, 105699.0, 248703.0, 325237.0, 187677.0, 72356.0, 26196.0, 10156.0, 4243.0, 2028.0, 970.0, 575.0, 322.0, 219.0, 116.0, 75.0, 47.0, 36.0, 25.0, 25.0, 12.0, 11.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.3828125, -10.040283203125, -9.69775390625, -9.355224609375, -9.0126953125, -8.670166015625, -8.32763671875, -7.985107421875, -7.642578125, -7.300048828125, -6.95751953125, -6.614990234375, -6.2724609375, -5.929931640625, -5.58740234375, -5.244873046875, -4.90234375, -4.559814453125, -4.21728515625, -3.874755859375, -3.5322265625, -3.189697265625, -2.84716796875, -2.504638671875, -2.162109375, -1.819580078125, -1.47705078125, -1.134521484375, -0.7919921875, -0.449462890625, -0.10693359375, 0.235595703125, 0.578125, 0.920654296875, 1.26318359375, 1.605712890625, 1.9482421875, 2.290771484375, 2.63330078125, 2.975830078125, 3.318359375, 3.660888671875, 4.00341796875, 4.345947265625, 4.6884765625, 5.031005859375, 5.37353515625, 5.716064453125, 6.05859375, 6.401123046875, 6.74365234375, 7.086181640625, 7.4287109375, 7.771240234375, 8.11376953125, 8.456298828125, 8.798828125, 9.141357421875, 9.48388671875, 9.826416015625, 10.1689453125, 10.511474609375, 10.85400390625, 11.196533203125, 11.5390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 10.0, 6.0, 12.0, 11.0, 6.0, 10.0, 12.0, 10.0, 21.0, 15.0, 27.0, 27.0, 25.0, 30.0, 41.0, 35.0, 31.0, 36.0, 34.0, 38.0, 40.0, 51.0, 36.0, 45.0, 38.0, 35.0, 32.0, 35.0, 33.0, 31.0, 31.0, 27.0, 18.0, 21.0, 20.0, 8.0, 15.0, 7.0, 8.0, 6.0, 6.0, 6.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-20.359375, -19.761474609375, -19.16357421875, -18.565673828125, -17.9677734375, -17.369873046875, -16.77197265625, -16.174072265625, -15.576171875, -14.978271484375, -14.38037109375, -13.782470703125, -13.1845703125, -12.586669921875, -11.98876953125, -11.390869140625, -10.79296875, -10.195068359375, -9.59716796875, -8.999267578125, -8.4013671875, -7.803466796875, -7.20556640625, -6.607666015625, -6.009765625, -5.411865234375, -4.81396484375, -4.216064453125, -3.6181640625, -3.020263671875, -2.42236328125, -1.824462890625, -1.2265625, -0.628662109375, -0.03076171875, 0.567138671875, 1.1650390625, 1.762939453125, 2.36083984375, 2.958740234375, 3.556640625, 4.154541015625, 4.75244140625, 5.350341796875, 5.9482421875, 6.546142578125, 7.14404296875, 7.741943359375, 8.33984375, 8.937744140625, 9.53564453125, 10.133544921875, 10.7314453125, 11.329345703125, 11.92724609375, 12.525146484375, 13.123046875, 13.720947265625, 14.31884765625, 14.916748046875, 15.5146484375, 16.112548828125, 16.71044921875, 17.308349609375, 17.90625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 6.0, 10.0, 19.0, 27.0, 25.0, 44.0, 70.0, 124.0, 193.0, 305.0, 465.0, 848.0, 1408.0, 2835.0, 5667.0, 13717.0, 51693.0, 338792.0, 512880.0, 85694.0, 19174.0, 6888.0, 3375.0, 1787.0, 1003.0, 546.0, 347.0, 198.0, 125.0, 101.0, 62.0, 38.0, 17.0, 17.0, 15.0, 5.0, 10.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.546875, -3.4429931640625, -3.339111328125, -3.2352294921875, -3.13134765625, -3.0274658203125, -2.923583984375, -2.8197021484375, -2.7158203125, -2.6119384765625, -2.508056640625, -2.4041748046875, -2.30029296875, -2.1964111328125, -2.092529296875, -1.9886474609375, -1.884765625, -1.7808837890625, -1.677001953125, -1.5731201171875, -1.46923828125, -1.3653564453125, -1.261474609375, -1.1575927734375, -1.0537109375, -0.9498291015625, -0.845947265625, -0.7420654296875, -0.63818359375, -0.5343017578125, -0.430419921875, -0.3265380859375, -0.22265625, -0.1187744140625, -0.014892578125, 0.0889892578125, 0.19287109375, 0.2967529296875, 0.400634765625, 0.5045166015625, 0.6083984375, 0.7122802734375, 0.816162109375, 0.9200439453125, 1.02392578125, 1.1278076171875, 1.231689453125, 1.3355712890625, 1.439453125, 1.5433349609375, 1.647216796875, 1.7510986328125, 1.85498046875, 1.9588623046875, 2.062744140625, 2.1666259765625, 2.2705078125, 2.3743896484375, 2.478271484375, 2.5821533203125, 2.68603515625, 2.7899169921875, 2.893798828125, 2.9976806640625, 3.1015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 10.0, 8.0, 11.0, 22.0, 26.0, 36.0, 60.0, 73.0, 136.0, 150.0, 133.0, 95.0, 75.0, 40.0, 33.0, 19.0, 7.0, 12.0, 9.0, 7.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002574920654296875, -0.00024781376123428345, -0.0002381354570388794, -0.00022845715284347534, -0.0002187788486480713, -0.00020910054445266724, -0.00019942224025726318, -0.00018974393606185913, -0.00018006563186645508, -0.00017038732767105103, -0.00016070902347564697, -0.00015103071928024292, -0.00014135241508483887, -0.00013167411088943481, -0.00012199580669403076, -0.00011231750249862671, -0.00010263919830322266, -9.29608941078186e-05, -8.328258991241455e-05, -7.36042857170105e-05, -6.392598152160645e-05, -5.424767732620239e-05, -4.456937313079834e-05, -3.489106893539429e-05, -2.5212764739990234e-05, -1.553446054458618e-05, -5.856156349182129e-06, 3.822147846221924e-06, 1.3500452041625977e-05, 2.317875623703003e-05, 3.285706043243408e-05, 4.2535364627838135e-05, 5.221366882324219e-05, 6.189197301864624e-05, 7.157027721405029e-05, 8.124858140945435e-05, 9.09268856048584e-05, 0.00010060518980026245, 0.0001102834939956665, 0.00011996179819107056, 0.0001296401023864746, 0.00013931840658187866, 0.00014899671077728271, 0.00015867501497268677, 0.00016835331916809082, 0.00017803162336349487, 0.00018770992755889893, 0.00019738823175430298, 0.00020706653594970703, 0.00021674484014511108, 0.00022642314434051514, 0.0002361014485359192, 0.00024577975273132324, 0.0002554580569267273, 0.00026513636112213135, 0.0002748146653175354, 0.00028449296951293945, 0.0002941712737083435, 0.00030384957790374756, 0.0003135278820991516, 0.00032320618629455566, 0.0003328844904899597, 0.00034256279468536377, 0.0003522410988807678, 0.0003619194030761719]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 9.0, 4.0, 7.0, 11.0, 17.0, 19.0, 34.0, 42.0, 66.0, 88.0, 117.0, 179.0, 293.0, 392.0, 591.0, 821.0, 1167.0, 1704.0, 2362.0, 3590.0, 5568.0, 8775.0, 15396.0, 29841.0, 65587.0, 153390.0, 295032.0, 245668.0, 112141.0, 48242.0, 23104.0, 12235.0, 7441.0, 4734.0, 3101.0, 2028.0, 1477.0, 982.0, 655.0, 484.0, 350.0, 245.0, 188.0, 109.0, 81.0, 62.0, 39.0, 29.0, 22.0, 19.0, 4.0, 3.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.6875, -2.60028076171875, -2.5130615234375, -2.42584228515625, -2.338623046875, -2.25140380859375, -2.1641845703125, -2.07696533203125, -1.98974609375, -1.90252685546875, -1.8153076171875, -1.72808837890625, -1.640869140625, -1.55364990234375, -1.4664306640625, -1.37921142578125, -1.2919921875, -1.20477294921875, -1.1175537109375, -1.03033447265625, -0.943115234375, -0.85589599609375, -0.7686767578125, -0.68145751953125, -0.59423828125, -0.50701904296875, -0.4197998046875, -0.33258056640625, -0.245361328125, -0.15814208984375, -0.0709228515625, 0.01629638671875, 0.103515625, 0.19073486328125, 0.2779541015625, 0.36517333984375, 0.452392578125, 0.53961181640625, 0.6268310546875, 0.71405029296875, 0.80126953125, 0.88848876953125, 0.9757080078125, 1.06292724609375, 1.150146484375, 1.23736572265625, 1.3245849609375, 1.41180419921875, 1.4990234375, 1.58624267578125, 1.6734619140625, 1.76068115234375, 1.847900390625, 1.93511962890625, 2.0223388671875, 2.10955810546875, 2.19677734375, 2.28399658203125, 2.3712158203125, 2.45843505859375, 2.545654296875, 2.63287353515625, 2.7200927734375, 2.80731201171875, 2.89453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 11.0, 14.0, 11.0, 23.0, 27.0, 40.0, 63.0, 93.0, 107.0, 135.0, 125.0, 86.0, 58.0, 40.0, 28.0, 18.0, 20.0, 16.0, 9.0, 11.0, 9.0, 1.0, 4.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0], "bins": [-1.3076171875, -1.2754058837890625, -1.243194580078125, -1.2109832763671875, -1.17877197265625, -1.1465606689453125, -1.114349365234375, -1.0821380615234375, -1.0499267578125, -1.0177154541015625, -0.985504150390625, -0.9532928466796875, -0.92108154296875, -0.8888702392578125, -0.856658935546875, -0.8244476318359375, -0.792236328125, -0.7600250244140625, -0.727813720703125, -0.6956024169921875, -0.66339111328125, -0.6311798095703125, -0.598968505859375, -0.5667572021484375, -0.5345458984375, -0.5023345947265625, -0.470123291015625, -0.4379119873046875, -0.40570068359375, -0.3734893798828125, -0.341278076171875, -0.3090667724609375, -0.27685546875, -0.2446441650390625, -0.212432861328125, -0.1802215576171875, -0.14801025390625, -0.1157989501953125, -0.083587646484375, -0.0513763427734375, -0.0191650390625, 0.0130462646484375, 0.045257568359375, 0.0774688720703125, 0.10968017578125, 0.1418914794921875, 0.174102783203125, 0.2063140869140625, 0.238525390625, 0.2707366943359375, 0.302947998046875, 0.3351593017578125, 0.36737060546875, 0.3995819091796875, 0.431793212890625, 0.4640045166015625, 0.4962158203125, 0.5284271240234375, 0.560638427734375, 0.5928497314453125, 0.62506103515625, 0.6572723388671875, 0.689483642578125, 0.7216949462890625, 0.75390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 2.0, 4.0, 5.0, 11.0, 9.0, 8.0, 8.0, 14.0, 18.0, 19.0, 21.0, 21.0, 18.0, 17.0, 21.0, 27.0, 35.0, 36.0, 35.0, 32.0, 52.0, 37.0, 36.0, 38.0, 44.0, 42.0, 47.0, 45.0, 45.0, 32.0, 29.0, 22.0, 31.0, 28.0, 26.0, 16.0, 19.0, 14.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.170150756835938, -22.39649200439453, -21.622833251953125, -20.84917640686035, -20.075517654418945, -19.30185890197754, -18.528202056884766, -17.75454330444336, -16.980884552001953, -16.207225799560547, -15.433568000793457, -14.659910202026367, -13.886251449584961, -13.112592697143555, -12.338934898376465, -11.565277099609375, -10.791618347167969, -10.017959594726562, -9.244301795959473, -8.470643997192383, -7.696985244750977, -6.9233269691467285, -6.1496686935424805, -5.376010417938232, -4.602352142333984, -3.8286938667297363, -3.0550355911254883, -2.2813773155212402, -1.5077190399169922, -0.7340607643127441, 0.039597511291503906, 0.813255786895752, 1.5869140625, 2.360572338104248, 3.134230613708496, 3.907888889312744, 4.681547164916992, 5.45520544052124, 6.228863716125488, 7.002521991729736, 7.776180267333984, 8.54983901977539, 9.32349681854248, 10.09715461730957, 10.870813369750977, 11.644472122192383, 12.418129920959473, 13.191787719726562, 13.965446472167969, 14.739105224609375, 15.512763023376465, 16.286420822143555, 17.06007957458496, 17.833738327026367, 18.60739517211914, 19.381053924560547, 20.154712677001953, 20.92837142944336, 21.702030181884766, 22.47568702697754, 23.249345779418945, 24.02300453186035, 24.796661376953125, 25.57032012939453, 26.343978881835938]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 6.0, 10.0, 6.0, 10.0, 9.0, 10.0, 11.0, 18.0, 15.0, 29.0, 29.0, 27.0, 27.0, 41.0, 43.0, 35.0, 44.0, 56.0, 36.0, 37.0, 26.0, 49.0, 34.0, 38.0, 36.0, 31.0, 37.0, 33.0, 31.0, 28.0, 24.0, 19.0, 13.0, 12.0, 10.0, 16.0, 11.0, 11.0, 9.0, 10.0, 4.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-26.323423385620117, -25.48480987548828, -24.646196365356445, -23.80758285522461, -22.96896743774414, -22.130353927612305, -21.29174041748047, -20.453126907348633, -19.614513397216797, -18.77589988708496, -17.937286376953125, -17.098670959472656, -16.26005744934082, -15.421443939208984, -14.582830429077148, -13.744216918945312, -12.90560245513916, -12.066988945007324, -11.228374481201172, -10.389760971069336, -9.5511474609375, -8.712533950805664, -7.873919486999512, -7.035305976867676, -6.196691989898682, -5.3580780029296875, -4.519464492797852, -3.6808505058288574, -2.8422367572784424, -2.0036230087280273, -1.1650090217590332, -0.32639551162719727, 0.5122184753417969, 1.350832223892212, 2.189445972442627, 3.028059959411621, 3.866673707962036, 4.705287456512451, 5.543901443481445, 6.382514953613281, 7.221128940582275, 8.05974292755127, 8.898356437683105, 9.736970901489258, 10.575584411621094, 11.41419792175293, 12.252811431884766, 13.091424942016602, 13.930039405822754, 14.76865291595459, 15.607267379760742, 16.445880889892578, 17.284494400024414, 18.12310791015625, 18.96172332763672, 19.800334930419922, 20.63895034790039, 21.477563858032227, 22.316177368164062, 23.15479278564453, 23.993406295776367, 24.832019805908203, 25.67063331604004, 26.509246826171875, 27.34786033630371]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 9.0, 11.0, 18.0, 22.0, 43.0, 52.0, 74.0, 114.0, 211.0, 318.0, 475.0, 694.0, 1094.0, 1660.0, 2479.0, 3840.0, 5552.0, 8185.0, 11709.0, 16416.0, 22579.0, 30039.0, 39612.0, 50140.0, 61567.0, 71153.0, 80544.0, 85198.0, 86911.0, 84316.0, 77517.0, 68546.0, 57623.0, 47354.0, 36789.0, 27675.0, 20315.0, 14864.0, 10593.0, 7371.0, 4904.0, 3450.0, 2308.0, 1410.0, 1025.0, 638.0, 435.0, 236.0, 177.0, 109.0, 58.0, 51.0, 23.0, 20.0, 24.0, 8.0, 3.0, 5.0, 1.0, 2.0], "bins": [-14.7890625, -14.3319091796875, -13.874755859375, -13.4176025390625, -12.96044921875, -12.5032958984375, -12.046142578125, -11.5889892578125, -11.1318359375, -10.6746826171875, -10.217529296875, -9.7603759765625, -9.30322265625, -8.8460693359375, -8.388916015625, -7.9317626953125, -7.474609375, -7.0174560546875, -6.560302734375, -6.1031494140625, -5.64599609375, -5.1888427734375, -4.731689453125, -4.2745361328125, -3.8173828125, -3.3602294921875, -2.903076171875, -2.4459228515625, -1.98876953125, -1.5316162109375, -1.074462890625, -0.6173095703125, -0.16015625, 0.2969970703125, 0.754150390625, 1.2113037109375, 1.66845703125, 2.1256103515625, 2.582763671875, 3.0399169921875, 3.4970703125, 3.9542236328125, 4.411376953125, 4.8685302734375, 5.32568359375, 5.7828369140625, 6.239990234375, 6.6971435546875, 7.154296875, 7.6114501953125, 8.068603515625, 8.5257568359375, 8.98291015625, 9.4400634765625, 9.897216796875, 10.3543701171875, 10.8115234375, 11.2686767578125, 11.725830078125, 12.1829833984375, 12.64013671875, 13.0972900390625, 13.554443359375, 14.0115966796875, 14.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 3.0, 2.0, 10.0, 7.0, 7.0, 12.0, 11.0, 7.0, 18.0, 21.0, 22.0, 33.0, 31.0, 21.0, 38.0, 34.0, 45.0, 36.0, 41.0, 37.0, 44.0, 39.0, 45.0, 40.0, 33.0, 34.0, 33.0, 26.0, 30.0, 35.0, 29.0, 23.0, 20.0, 22.0, 20.0, 21.0, 6.0, 13.0, 14.0, 5.0, 13.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.609375, -25.748291015625, -24.88720703125, -24.026123046875, -23.1650390625, -22.303955078125, -21.44287109375, -20.581787109375, -19.720703125, -18.859619140625, -17.99853515625, -17.137451171875, -16.2763671875, -15.415283203125, -14.55419921875, -13.693115234375, -12.83203125, -11.970947265625, -11.10986328125, -10.248779296875, -9.3876953125, -8.526611328125, -7.66552734375, -6.804443359375, -5.943359375, -5.082275390625, -4.22119140625, -3.360107421875, -2.4990234375, -1.637939453125, -0.77685546875, 0.084228515625, 0.9453125, 1.806396484375, 2.66748046875, 3.528564453125, 4.3896484375, 5.250732421875, 6.11181640625, 6.972900390625, 7.833984375, 8.695068359375, 9.55615234375, 10.417236328125, 11.2783203125, 12.139404296875, 13.00048828125, 13.861572265625, 14.72265625, 15.583740234375, 16.44482421875, 17.305908203125, 18.1669921875, 19.028076171875, 19.88916015625, 20.750244140625, 21.611328125, 22.472412109375, 23.33349609375, 24.194580078125, 25.0556640625, 25.916748046875, 26.77783203125, 27.638916015625, 28.5]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 24.0, 29.0, 34.0, 61.0, 107.0, 162.0, 235.0, 433.0, 643.0, 978.0, 1659.0, 2520.0, 3748.0, 5635.0, 8370.0, 12309.0, 17531.0, 24684.0, 34007.0, 44932.0, 57390.0, 70304.0, 82045.0, 90693.0, 94507.0, 93042.0, 85888.0, 75195.0, 62454.0, 49902.0, 37954.0, 28192.0, 20194.0, 13992.0, 9848.0, 6513.0, 4350.0, 2912.0, 1792.0, 1189.0, 762.0, 510.0, 306.0, 193.0, 119.0, 78.0, 52.0, 28.0, 13.0, 18.0, 5.0, 6.0, 3.0, 2.0, 3.0], "bins": [-16.796875, -16.29833984375, -15.7998046875, -15.30126953125, -14.802734375, -14.30419921875, -13.8056640625, -13.30712890625, -12.80859375, -12.31005859375, -11.8115234375, -11.31298828125, -10.814453125, -10.31591796875, -9.8173828125, -9.31884765625, -8.8203125, -8.32177734375, -7.8232421875, -7.32470703125, -6.826171875, -6.32763671875, -5.8291015625, -5.33056640625, -4.83203125, -4.33349609375, -3.8349609375, -3.33642578125, -2.837890625, -2.33935546875, -1.8408203125, -1.34228515625, -0.84375, -0.34521484375, 0.1533203125, 0.65185546875, 1.150390625, 1.64892578125, 2.1474609375, 2.64599609375, 3.14453125, 3.64306640625, 4.1416015625, 4.64013671875, 5.138671875, 5.63720703125, 6.1357421875, 6.63427734375, 7.1328125, 7.63134765625, 8.1298828125, 8.62841796875, 9.126953125, 9.62548828125, 10.1240234375, 10.62255859375, 11.12109375, 11.61962890625, 12.1181640625, 12.61669921875, 13.115234375, 13.61376953125, 14.1123046875, 14.61083984375, 15.109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 11.0, 16.0, 18.0, 14.0, 17.0, 21.0, 27.0, 32.0, 23.0, 38.0, 33.0, 43.0, 50.0, 43.0, 50.0, 53.0, 47.0, 37.0, 46.0, 51.0, 37.0, 33.0, 44.0, 32.0, 26.0, 19.0, 23.0, 16.0, 20.0, 11.0, 11.0, 12.0, 9.0, 8.0, 7.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.828125, -16.2333984375, -15.638671875, -15.0439453125, -14.44921875, -13.8544921875, -13.259765625, -12.6650390625, -12.0703125, -11.4755859375, -10.880859375, -10.2861328125, -9.69140625, -9.0966796875, -8.501953125, -7.9072265625, -7.3125, -6.7177734375, -6.123046875, -5.5283203125, -4.93359375, -4.3388671875, -3.744140625, -3.1494140625, -2.5546875, -1.9599609375, -1.365234375, -0.7705078125, -0.17578125, 0.4189453125, 1.013671875, 1.6083984375, 2.203125, 2.7978515625, 3.392578125, 3.9873046875, 4.58203125, 5.1767578125, 5.771484375, 6.3662109375, 6.9609375, 7.5556640625, 8.150390625, 8.7451171875, 9.33984375, 9.9345703125, 10.529296875, 11.1240234375, 11.71875, 12.3134765625, 12.908203125, 13.5029296875, 14.09765625, 14.6923828125, 15.287109375, 15.8818359375, 16.4765625, 17.0712890625, 17.666015625, 18.2607421875, 18.85546875, 19.4501953125, 20.044921875, 20.6396484375, 21.234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 3.0, 3.0, 10.0, 15.0, 15.0, 22.0, 33.0, 39.0, 77.0, 92.0, 117.0, 157.0, 328.0, 455.0, 706.0, 1130.0, 1958.0, 3224.0, 5505.0, 9320.0, 16143.0, 26698.0, 42698.0, 63365.0, 87416.0, 111532.0, 126647.0, 129697.0, 118967.0, 97992.0, 72434.0, 50606.0, 32316.0, 20025.0, 11630.0, 6915.0, 4009.0, 2378.0, 1439.0, 825.0, 563.0, 350.0, 225.0, 145.0, 104.0, 66.0, 56.0, 28.0, 32.0, 16.0, 16.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -6.979736328125, -6.74072265625, -6.501708984375, -6.2626953125, -6.023681640625, -5.78466796875, -5.545654296875, -5.306640625, -5.067626953125, -4.82861328125, -4.589599609375, -4.3505859375, -4.111572265625, -3.87255859375, -3.633544921875, -3.39453125, -3.155517578125, -2.91650390625, -2.677490234375, -2.4384765625, -2.199462890625, -1.96044921875, -1.721435546875, -1.482421875, -1.243408203125, -1.00439453125, -0.765380859375, -0.5263671875, -0.287353515625, -0.04833984375, 0.190673828125, 0.4296875, 0.668701171875, 0.90771484375, 1.146728515625, 1.3857421875, 1.624755859375, 1.86376953125, 2.102783203125, 2.341796875, 2.580810546875, 2.81982421875, 3.058837890625, 3.2978515625, 3.536865234375, 3.77587890625, 4.014892578125, 4.25390625, 4.492919921875, 4.73193359375, 4.970947265625, 5.2099609375, 5.448974609375, 5.68798828125, 5.927001953125, 6.166015625, 6.405029296875, 6.64404296875, 6.883056640625, 7.1220703125, 7.361083984375, 7.60009765625, 7.839111328125, 8.078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 4.0, 10.0, 6.0, 17.0, 21.0, 26.0, 17.0, 27.0, 29.0, 35.0, 41.0, 48.0, 57.0, 54.0, 60.0, 61.0, 62.0, 58.0, 54.0, 40.0, 42.0, 46.0, 36.0, 26.0, 21.0, 17.0, 22.0, 8.0, 10.0, 14.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009469985961914062, -0.0009180232882499695, -0.0008890479803085327, -0.000860072672367096, -0.0008310973644256592, -0.0008021220564842224, -0.0007731467485427856, -0.0007441714406013489, -0.0007151961326599121, -0.0006862208247184753, -0.0006572455167770386, -0.0006282702088356018, -0.000599294900894165, -0.0005703195929527283, -0.0005413442850112915, -0.0005123689770698547, -0.00048339366912841797, -0.0004544183611869812, -0.00042544305324554443, -0.00039646774530410767, -0.0003674924373626709, -0.00033851712942123413, -0.00030954182147979736, -0.0002805665135383606, -0.00025159120559692383, -0.00022261589765548706, -0.0001936405897140503, -0.00016466528177261353, -0.00013568997383117676, -0.00010671466588973999, -7.773935794830322e-05, -4.8764050006866455e-05, -1.9788742065429688e-05, 9.18656587600708e-06, 3.816187381744385e-05, 6.713718175888062e-05, 9.611248970031738e-05, 0.00012508779764175415, 0.00015406310558319092, 0.00018303841352462769, 0.00021201372146606445, 0.00024098902940750122, 0.000269964337348938, 0.00029893964529037476, 0.0003279149532318115, 0.0003568902611732483, 0.00038586556911468506, 0.0004148408770561218, 0.0004438161849975586, 0.00047279149293899536, 0.0005017668008804321, 0.0005307421088218689, 0.0005597174167633057, 0.0005886927247047424, 0.0006176680326461792, 0.000646643340587616, 0.0006756186485290527, 0.0007045939564704895, 0.0007335692644119263, 0.000762544572353363, 0.0007915198802947998, 0.0008204951882362366, 0.0008494704961776733, 0.0008784458041191101, 0.0009074211120605469]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 15.0, 16.0, 17.0, 30.0, 76.0, 105.0, 178.0, 270.0, 461.0, 779.0, 1288.0, 2117.0, 3473.0, 5976.0, 9910.0, 15992.0, 26044.0, 40053.0, 59788.0, 82605.0, 105724.0, 122966.0, 127973.0, 118658.0, 99194.0, 76337.0, 53859.0, 35706.0, 22914.0, 14266.0, 8595.0, 5254.0, 3122.0, 1925.0, 1090.0, 685.0, 422.0, 273.0, 143.0, 101.0, 53.0, 40.0, 27.0, 10.0, 7.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.96484375, -7.71875, -7.47265625, -7.2265625, -6.98046875, -6.734375, -6.48828125, -6.2421875, -5.99609375, -5.75, -5.50390625, -5.2578125, -5.01171875, -4.765625, -4.51953125, -4.2734375, -4.02734375, -3.78125, -3.53515625, -3.2890625, -3.04296875, -2.796875, -2.55078125, -2.3046875, -2.05859375, -1.8125, -1.56640625, -1.3203125, -1.07421875, -0.828125, -0.58203125, -0.3359375, -0.08984375, 0.15625, 0.40234375, 0.6484375, 0.89453125, 1.140625, 1.38671875, 1.6328125, 1.87890625, 2.125, 2.37109375, 2.6171875, 2.86328125, 3.109375, 3.35546875, 3.6015625, 3.84765625, 4.09375, 4.33984375, 4.5859375, 4.83203125, 5.078125, 5.32421875, 5.5703125, 5.81640625, 6.0625, 6.30859375, 6.5546875, 6.80078125, 7.046875, 7.29296875, 7.5390625, 7.78515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 14.0, 13.0, 13.0, 13.0, 19.0, 22.0, 30.0, 35.0, 47.0, 42.0, 74.0, 57.0, 51.0, 51.0, 75.0, 68.0, 44.0, 56.0, 34.0, 31.0, 34.0, 37.0, 35.0, 19.0, 16.0, 14.0, 15.0, 11.0, 3.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314453125, -3.195648193359375, -3.07684326171875, -2.958038330078125, -2.8392333984375, -2.720428466796875, -2.60162353515625, -2.482818603515625, -2.364013671875, -2.245208740234375, -2.12640380859375, -2.007598876953125, -1.8887939453125, -1.769989013671875, -1.65118408203125, -1.532379150390625, -1.41357421875, -1.294769287109375, -1.17596435546875, -1.057159423828125, -0.9383544921875, -0.819549560546875, -0.70074462890625, -0.581939697265625, -0.463134765625, -0.344329833984375, -0.22552490234375, -0.106719970703125, 0.0120849609375, 0.130889892578125, 0.24969482421875, 0.368499755859375, 0.4873046875, 0.606109619140625, 0.72491455078125, 0.843719482421875, 0.9625244140625, 1.081329345703125, 1.20013427734375, 1.318939208984375, 1.437744140625, 1.556549072265625, 1.67535400390625, 1.794158935546875, 1.9129638671875, 2.031768798828125, 2.15057373046875, 2.269378662109375, 2.38818359375, 2.506988525390625, 2.62579345703125, 2.744598388671875, 2.8634033203125, 2.982208251953125, 3.10101318359375, 3.219818115234375, 3.338623046875, 3.457427978515625, 3.57623291015625, 3.695037841796875, 3.8138427734375, 3.932647705078125, 4.05145263671875, 4.170257568359375, 4.2890625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 10.0, 9.0, 14.0, 14.0, 19.0, 18.0, 18.0, 27.0, 23.0, 24.0, 34.0, 31.0, 36.0, 32.0, 42.0, 44.0, 44.0, 48.0, 38.0, 46.0, 56.0, 44.0, 40.0, 44.0, 35.0, 31.0, 27.0, 28.0, 19.0, 24.0, 15.0, 12.0, 10.0, 11.0, 9.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.026466369628906, -24.18355941772461, -23.340654373168945, -22.49774742126465, -21.654842376708984, -20.811935424804688, -19.96902847290039, -19.126121520996094, -18.28321647644043, -17.440309524536133, -16.59740447998047, -15.754497528076172, -14.911591529846191, -14.068685531616211, -13.225778579711914, -12.382872581481934, -11.539966583251953, -10.697060585021973, -9.854154586791992, -9.011247634887695, -8.168341636657715, -7.325435638427734, -6.482529163360596, -5.639622688293457, -4.796716690063477, -3.953810453414917, -3.1109042167663574, -2.267997980117798, -1.4250917434692383, -0.5821857452392578, 0.26072072982788086, 1.1036272048950195, 1.9465351104736328, 2.7894413471221924, 3.632347583770752, 4.475254058837891, 5.318160057067871, 6.161066055297852, 7.00397253036499, 7.846879005432129, 8.68978500366211, 9.53269100189209, 10.37559700012207, 11.218503952026367, 12.061409950256348, 12.904315948486328, 13.747222900390625, 14.590128898620605, 15.433034896850586, 16.275941848754883, 17.118846893310547, 17.961753845214844, 18.80466079711914, 19.647565841674805, 20.4904727935791, 21.333377838134766, 22.176284790039062, 23.01919174194336, 23.862096786499023, 24.70500373840332, 25.547908782958984, 26.39081573486328, 27.233722686767578, 28.076629638671875, 28.91953468322754]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 8.0, 9.0, 2.0, 6.0, 8.0, 12.0, 11.0, 21.0, 15.0, 22.0, 18.0, 21.0, 39.0, 38.0, 37.0, 27.0, 28.0, 35.0, 36.0, 34.0, 39.0, 31.0, 50.0, 45.0, 36.0, 35.0, 31.0, 34.0, 26.0, 24.0, 27.0, 21.0, 27.0, 18.0, 17.0, 14.0, 14.0, 10.0, 14.0, 8.0, 9.0, 11.0, 6.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.079917907714844, -23.278287887573242, -22.47665786743164, -21.67502784729004, -20.873397827148438, -20.07176971435547, -19.270139694213867, -18.468509674072266, -17.666879653930664, -16.865249633789062, -16.06361961364746, -15.261990547180176, -14.460360527038574, -13.658730506896973, -12.857101440429688, -12.055471420288086, -11.253841400146484, -10.452211380004883, -9.650581359863281, -8.848952293395996, -8.047322273254395, -7.245692253112793, -6.44406270980835, -5.642433166503906, -4.840803146362305, -4.039173126220703, -3.2375435829162598, -2.4359138011932373, -1.6342840194702148, -0.8326539993286133, -0.031024456024169922, 0.7706050872802734, 1.572235107421875, 2.3738648891448975, 3.17549467086792, 3.9771244525909424, 4.778754234313965, 5.580384254455566, 6.38201379776001, 7.183643341064453, 7.985273361206055, 8.786903381347656, 9.588533401489258, 10.390162467956543, 11.191792488098145, 11.993422508239746, 12.795051574707031, 13.596681594848633, 14.398311614990234, 15.199941635131836, 16.001571655273438, 16.80320167541504, 17.60483169555664, 18.40645980834961, 19.20808982849121, 20.009719848632812, 20.811349868774414, 21.612979888916016, 22.414609909057617, 23.21623992919922, 24.017868041992188, 24.819499969482422, 25.62112808227539, 26.422758102416992, 27.224388122558594]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 15.0, 11.0, 19.0, 49.0, 87.0, 151.0, 261.0, 558.0, 853.0, 1459.0, 2455.0, 4219.0, 6808.0, 11619.0, 18463.0, 29620.0, 45870.0, 69602.0, 102628.0, 146208.0, 199866.0, 261583.0, 323799.0, 375414.0, 410932.0, 415791.0, 393196.0, 346669.0, 286609.0, 223445.0, 165663.0, 118044.0, 81390.0, 54492.0, 35954.0, 22746.0, 14524.0, 8930.0, 5569.0, 3479.0, 2083.0, 1288.0, 786.0, 456.0, 246.0, 145.0, 94.0, 60.0, 42.0, 18.0, 13.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.875, -17.302490234375, -16.72998046875, -16.157470703125, -15.5849609375, -15.012451171875, -14.43994140625, -13.867431640625, -13.294921875, -12.722412109375, -12.14990234375, -11.577392578125, -11.0048828125, -10.432373046875, -9.85986328125, -9.287353515625, -8.71484375, -8.142333984375, -7.56982421875, -6.997314453125, -6.4248046875, -5.852294921875, -5.27978515625, -4.707275390625, -4.134765625, -3.562255859375, -2.98974609375, -2.417236328125, -1.8447265625, -1.272216796875, -0.69970703125, -0.127197265625, 0.4453125, 1.017822265625, 1.59033203125, 2.162841796875, 2.7353515625, 3.307861328125, 3.88037109375, 4.452880859375, 5.025390625, 5.597900390625, 6.17041015625, 6.742919921875, 7.3154296875, 7.887939453125, 8.46044921875, 9.032958984375, 9.60546875, 10.177978515625, 10.75048828125, 11.322998046875, 11.8955078125, 12.468017578125, 13.04052734375, 13.613037109375, 14.185546875, 14.758056640625, 15.33056640625, 15.903076171875, 16.4755859375, 17.048095703125, 17.62060546875, 18.193115234375, 18.765625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 9.0, 12.0, 17.0, 18.0, 27.0, 20.0, 21.0, 21.0, 28.0, 28.0, 37.0, 31.0, 40.0, 31.0, 33.0, 42.0, 31.0, 45.0, 38.0, 38.0, 35.0, 34.0, 31.0, 30.0, 23.0, 18.0, 25.0, 21.0, 27.0, 19.0, 28.0, 20.0, 12.0, 10.0, 12.0, 10.0, 8.0, 10.0, 4.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0], "bins": [-19.4375, -18.802978515625, -18.16845703125, -17.533935546875, -16.8994140625, -16.264892578125, -15.63037109375, -14.995849609375, -14.361328125, -13.726806640625, -13.09228515625, -12.457763671875, -11.8232421875, -11.188720703125, -10.55419921875, -9.919677734375, -9.28515625, -8.650634765625, -8.01611328125, -7.381591796875, -6.7470703125, -6.112548828125, -5.47802734375, -4.843505859375, -4.208984375, -3.574462890625, -2.93994140625, -2.305419921875, -1.6708984375, -1.036376953125, -0.40185546875, 0.232666015625, 0.8671875, 1.501708984375, 2.13623046875, 2.770751953125, 3.4052734375, 4.039794921875, 4.67431640625, 5.308837890625, 5.943359375, 6.577880859375, 7.21240234375, 7.846923828125, 8.4814453125, 9.115966796875, 9.75048828125, 10.385009765625, 11.01953125, 11.654052734375, 12.28857421875, 12.923095703125, 13.5576171875, 14.192138671875, 14.82666015625, 15.461181640625, 16.095703125, 16.730224609375, 17.36474609375, 17.999267578125, 18.6337890625, 19.268310546875, 19.90283203125, 20.537353515625, 21.171875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 11.0, 22.0, 28.0, 71.0, 121.0, 163.0, 302.0, 528.0, 962.0, 1598.0, 2725.0, 4555.0, 7244.0, 11673.0, 18836.0, 29233.0, 43836.0, 65638.0, 93710.0, 129577.0, 173174.0, 221807.0, 270559.0, 316738.0, 351335.0, 369940.0, 369272.0, 347899.0, 312081.0, 267355.0, 216958.0, 168628.0, 126759.0, 91230.0, 62903.0, 42591.0, 27752.0, 18077.0, 11193.0, 7027.0, 4246.0, 2515.0, 1407.0, 840.0, 493.0, 281.0, 188.0, 88.0, 46.0, 35.0, 13.0, 15.0, 4.0, 1.0, 2.0, 2.0, 4.0], "bins": [-18.375, -17.8173828125, -17.259765625, -16.7021484375, -16.14453125, -15.5869140625, -15.029296875, -14.4716796875, -13.9140625, -13.3564453125, -12.798828125, -12.2412109375, -11.68359375, -11.1259765625, -10.568359375, -10.0107421875, -9.453125, -8.8955078125, -8.337890625, -7.7802734375, -7.22265625, -6.6650390625, -6.107421875, -5.5498046875, -4.9921875, -4.4345703125, -3.876953125, -3.3193359375, -2.76171875, -2.2041015625, -1.646484375, -1.0888671875, -0.53125, 0.0263671875, 0.583984375, 1.1416015625, 1.69921875, 2.2568359375, 2.814453125, 3.3720703125, 3.9296875, 4.4873046875, 5.044921875, 5.6025390625, 6.16015625, 6.7177734375, 7.275390625, 7.8330078125, 8.390625, 8.9482421875, 9.505859375, 10.0634765625, 10.62109375, 11.1787109375, 11.736328125, 12.2939453125, 12.8515625, 13.4091796875, 13.966796875, 14.5244140625, 15.08203125, 15.6396484375, 16.197265625, 16.7548828125, 17.3125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 11.0, 12.0, 23.0, 27.0, 25.0, 48.0, 54.0, 62.0, 70.0, 75.0, 85.0, 104.0, 139.0, 137.0, 161.0, 175.0, 182.0, 183.0, 204.0, 228.0, 221.0, 209.0, 204.0, 187.0, 163.0, 161.0, 144.0, 139.0, 118.0, 102.0, 91.0, 63.0, 53.0, 44.0, 37.0, 36.0, 26.0, 16.0, 10.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6171875, -11.2637939453125, -10.910400390625, -10.5570068359375, -10.20361328125, -9.8502197265625, -9.496826171875, -9.1434326171875, -8.7900390625, -8.4366455078125, -8.083251953125, -7.7298583984375, -7.37646484375, -7.0230712890625, -6.669677734375, -6.3162841796875, -5.962890625, -5.6094970703125, -5.256103515625, -4.9027099609375, -4.54931640625, -4.1959228515625, -3.842529296875, -3.4891357421875, -3.1357421875, -2.7823486328125, -2.428955078125, -2.0755615234375, -1.72216796875, -1.3687744140625, -1.015380859375, -0.6619873046875, -0.30859375, 0.0447998046875, 0.398193359375, 0.7515869140625, 1.10498046875, 1.4583740234375, 1.811767578125, 2.1651611328125, 2.5185546875, 2.8719482421875, 3.225341796875, 3.5787353515625, 3.93212890625, 4.2855224609375, 4.638916015625, 4.9923095703125, 5.345703125, 5.6990966796875, 6.052490234375, 6.4058837890625, 6.75927734375, 7.1126708984375, 7.466064453125, 7.8194580078125, 8.1728515625, 8.5262451171875, 8.879638671875, 9.2330322265625, 9.58642578125, 9.9398193359375, 10.293212890625, 10.6466064453125, 11.0]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 11.0, 9.0, 14.0, 11.0, 9.0, 14.0, 17.0, 18.0, 26.0, 22.0, 30.0, 19.0, 31.0, 44.0, 27.0, 41.0, 42.0, 34.0, 43.0, 39.0, 34.0, 37.0, 47.0, 33.0, 37.0, 41.0, 29.0, 28.0, 29.0, 28.0, 24.0, 27.0, 21.0, 19.0, 7.0, 11.0, 7.0, 9.0, 7.0, 6.0, 1.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-24.317245483398438, -23.54956817626953, -22.781890869140625, -22.014211654663086, -21.24653434753418, -20.478857040405273, -19.711177825927734, -18.943500518798828, -18.175823211669922, -17.408145904541016, -16.64046859741211, -15.87278938293457, -15.105112075805664, -14.337434768676758, -13.569756507873535, -12.802078247070312, -12.034400939941406, -11.2667236328125, -10.499045372009277, -9.731367111206055, -8.963689804077148, -8.196012496948242, -7.4283342361450195, -6.660656452178955, -5.892978668212891, -5.125300884246826, -4.357623100280762, -3.5899453163146973, -2.822267532348633, -2.0545897483825684, -1.286911964416504, -0.5192341804504395, 0.248443603515625, 1.0161213874816895, 1.783799171447754, 2.5514769554138184, 3.319154739379883, 4.086832523345947, 4.854510307312012, 5.622188091278076, 6.389865875244141, 7.157543659210205, 7.9252214431762695, 8.692899703979492, 9.460577011108398, 10.228254318237305, 10.995932579040527, 11.76361083984375, 12.531288146972656, 13.298965454101562, 14.066643714904785, 14.834321975708008, 15.601999282836914, 16.36967658996582, 17.13735580444336, 17.905033111572266, 18.672710418701172, 19.440387725830078, 20.208065032958984, 20.975744247436523, 21.74342155456543, 22.511098861694336, 23.278778076171875, 24.04645538330078, 24.814132690429688]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 7.0, 3.0, 7.0, 13.0, 11.0, 14.0, 18.0, 15.0, 15.0, 19.0, 24.0, 26.0, 20.0, 31.0, 26.0, 32.0, 27.0, 37.0, 35.0, 28.0, 22.0, 40.0, 43.0, 38.0, 35.0, 38.0, 30.0, 40.0, 27.0, 32.0, 36.0, 20.0, 23.0, 27.0, 20.0, 22.0, 14.0, 14.0, 16.0, 8.0, 7.0, 9.0, 3.0, 6.0, 7.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.114910125732422, -19.35466766357422, -18.594425201416016, -17.834184646606445, -17.073942184448242, -16.31369972229004, -15.553458213806152, -14.793216705322266, -14.032974243164062, -13.27273178100586, -12.512490272521973, -11.752248764038086, -10.992006301879883, -10.23176383972168, -9.471522331237793, -8.711280822753906, -7.951038360595703, -7.190796375274658, -6.430554389953613, -5.670312404632568, -4.910070419311523, -4.1498284339904785, -3.3895864486694336, -2.6293444633483887, -1.8691024780273438, -1.1088604927062988, -0.3486185073852539, 0.411623477935791, 1.171865463256836, 1.9321074485778809, 2.692349433898926, 3.4525914192199707, 4.212831497192383, 4.973073482513428, 5.733315467834473, 6.493557453155518, 7.2537994384765625, 8.014041900634766, 8.774283409118652, 9.534524917602539, 10.294767379760742, 11.055009841918945, 11.815251350402832, 12.575492858886719, 13.335735321044922, 14.095977783203125, 14.856219291687012, 15.616460800170898, 16.3767032623291, 17.136945724487305, 17.897186279296875, 18.657428741455078, 19.41767120361328, 20.177913665771484, 20.938156127929688, 21.698396682739258, 22.45863914489746, 23.218881607055664, 23.979122161865234, 24.739364624023438, 25.49960708618164, 26.259849548339844, 27.020092010498047, 27.780332565307617, 28.54057502746582]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 16.0, 22.0, 52.0, 51.0, 87.0, 140.0, 208.0, 325.0, 510.0, 776.0, 1367.0, 2104.0, 3350.0, 5560.0, 8904.0, 15059.0, 24586.0, 38956.0, 61213.0, 90505.0, 125096.0, 149291.0, 147492.0, 123407.0, 89917.0, 60001.0, 38085.0, 23626.0, 14501.0, 9079.0, 5461.0, 3331.0, 1989.0, 1242.0, 788.0, 502.0, 336.0, 202.0, 143.0, 82.0, 61.0, 32.0, 36.0, 22.0, 14.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -4.0128173828125, -3.869384765625, -3.7259521484375, -3.58251953125, -3.4390869140625, -3.295654296875, -3.1522216796875, -3.0087890625, -2.8653564453125, -2.721923828125, -2.5784912109375, -2.43505859375, -2.2916259765625, -2.148193359375, -2.0047607421875, -1.861328125, -1.7178955078125, -1.574462890625, -1.4310302734375, -1.28759765625, -1.1441650390625, -1.000732421875, -0.8572998046875, -0.7138671875, -0.5704345703125, -0.427001953125, -0.2835693359375, -0.14013671875, 0.0032958984375, 0.146728515625, 0.2901611328125, 0.43359375, 0.5770263671875, 0.720458984375, 0.8638916015625, 1.00732421875, 1.1507568359375, 1.294189453125, 1.4376220703125, 1.5810546875, 1.7244873046875, 1.867919921875, 2.0113525390625, 2.15478515625, 2.2982177734375, 2.441650390625, 2.5850830078125, 2.728515625, 2.8719482421875, 3.015380859375, 3.1588134765625, 3.30224609375, 3.4456787109375, 3.589111328125, 3.7325439453125, 3.8759765625, 4.0194091796875, 4.162841796875, 4.3062744140625, 4.44970703125, 4.5931396484375, 4.736572265625, 4.8800048828125, 5.0234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 13.0, 10.0, 6.0, 12.0, 11.0, 20.0, 12.0, 18.0, 24.0, 28.0, 16.0, 33.0, 23.0, 34.0, 31.0, 30.0, 34.0, 40.0, 35.0, 45.0, 43.0, 34.0, 44.0, 33.0, 37.0, 31.0, 33.0, 27.0, 36.0, 28.0, 28.0, 11.0, 17.0, 25.0, 18.0, 13.0, 13.0, 6.0, 6.0, 4.0, 8.0, 3.0, 7.0, 7.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.921875, -21.0908203125, -20.259765625, -19.4287109375, -18.59765625, -17.7666015625, -16.935546875, -16.1044921875, -15.2734375, -14.4423828125, -13.611328125, -12.7802734375, -11.94921875, -11.1181640625, -10.287109375, -9.4560546875, -8.625, -7.7939453125, -6.962890625, -6.1318359375, -5.30078125, -4.4697265625, -3.638671875, -2.8076171875, -1.9765625, -1.1455078125, -0.314453125, 0.5166015625, 1.34765625, 2.1787109375, 3.009765625, 3.8408203125, 4.671875, 5.5029296875, 6.333984375, 7.1650390625, 7.99609375, 8.8271484375, 9.658203125, 10.4892578125, 11.3203125, 12.1513671875, 12.982421875, 13.8134765625, 14.64453125, 15.4755859375, 16.306640625, 17.1376953125, 17.96875, 18.7998046875, 19.630859375, 20.4619140625, 21.29296875, 22.1240234375, 22.955078125, 23.7861328125, 24.6171875, 25.4482421875, 26.279296875, 27.1103515625, 27.94140625, 28.7724609375, 29.603515625, 30.4345703125, 31.265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 11.0, 7.0, 15.0, 23.0, 32.0, 50.0, 96.0, 135.0, 229.0, 361.0, 616.0, 1012.0, 1826.0, 3333.0, 6029.0, 11109.0, 21149.0, 40296.0, 74519.0, 128882.0, 188704.0, 204594.0, 156131.0, 95907.0, 53042.0, 27855.0, 14677.0, 7981.0, 4303.0, 2323.0, 1368.0, 785.0, 444.0, 270.0, 182.0, 95.0, 60.0, 39.0, 19.0, 19.0, 11.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.49609375, -5.3079833984375, -5.119873046875, -4.9317626953125, -4.74365234375, -4.5555419921875, -4.367431640625, -4.1793212890625, -3.9912109375, -3.8031005859375, -3.614990234375, -3.4268798828125, -3.23876953125, -3.0506591796875, -2.862548828125, -2.6744384765625, -2.486328125, -2.2982177734375, -2.110107421875, -1.9219970703125, -1.73388671875, -1.5457763671875, -1.357666015625, -1.1695556640625, -0.9814453125, -0.7933349609375, -0.605224609375, -0.4171142578125, -0.22900390625, -0.0408935546875, 0.147216796875, 0.3353271484375, 0.5234375, 0.7115478515625, 0.899658203125, 1.0877685546875, 1.27587890625, 1.4639892578125, 1.652099609375, 1.8402099609375, 2.0283203125, 2.2164306640625, 2.404541015625, 2.5926513671875, 2.78076171875, 2.9688720703125, 3.156982421875, 3.3450927734375, 3.533203125, 3.7213134765625, 3.909423828125, 4.0975341796875, 4.28564453125, 4.4737548828125, 4.661865234375, 4.8499755859375, 5.0380859375, 5.2261962890625, 5.414306640625, 5.6024169921875, 5.79052734375, 5.9786376953125, 6.166748046875, 6.3548583984375, 6.54296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 6.0, 10.0, 11.0, 6.0, 16.0, 17.0, 16.0, 26.0, 27.0, 21.0, 25.0, 32.0, 31.0, 36.0, 39.0, 44.0, 25.0, 41.0, 40.0, 43.0, 35.0, 39.0, 44.0, 45.0, 38.0, 35.0, 23.0, 37.0, 23.0, 22.0, 19.0, 15.0, 23.0, 13.0, 14.0, 14.0, 7.0, 11.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.625, -17.06689453125, -16.5087890625, -15.95068359375, -15.392578125, -14.83447265625, -14.2763671875, -13.71826171875, -13.16015625, -12.60205078125, -12.0439453125, -11.48583984375, -10.927734375, -10.36962890625, -9.8115234375, -9.25341796875, -8.6953125, -8.13720703125, -7.5791015625, -7.02099609375, -6.462890625, -5.90478515625, -5.3466796875, -4.78857421875, -4.23046875, -3.67236328125, -3.1142578125, -2.55615234375, -1.998046875, -1.43994140625, -0.8818359375, -0.32373046875, 0.234375, 0.79248046875, 1.3505859375, 1.90869140625, 2.466796875, 3.02490234375, 3.5830078125, 4.14111328125, 4.69921875, 5.25732421875, 5.8154296875, 6.37353515625, 6.931640625, 7.48974609375, 8.0478515625, 8.60595703125, 9.1640625, 9.72216796875, 10.2802734375, 10.83837890625, 11.396484375, 11.95458984375, 12.5126953125, 13.07080078125, 13.62890625, 14.18701171875, 14.7451171875, 15.30322265625, 15.861328125, 16.41943359375, 16.9775390625, 17.53564453125, 18.09375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 9.0, 19.0, 28.0, 28.0, 46.0, 61.0, 74.0, 124.0, 155.0, 217.0, 327.0, 457.0, 710.0, 1044.0, 1753.0, 2711.0, 4366.0, 7682.0, 14728.0, 31291.0, 72272.0, 168199.0, 293914.0, 239643.0, 113444.0, 47621.0, 21769.0, 10540.0, 5733.0, 3410.0, 2010.0, 1287.0, 855.0, 565.0, 425.0, 268.0, 205.0, 151.0, 94.0, 79.0, 66.0, 37.0, 34.0, 26.0, 20.0, 15.0, 10.0, 5.0, 10.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1123046875, -1.076141357421875, -1.03997802734375, -1.003814697265625, -0.9676513671875, -0.931488037109375, -0.89532470703125, -0.859161376953125, -0.822998046875, -0.786834716796875, -0.75067138671875, -0.714508056640625, -0.6783447265625, -0.642181396484375, -0.60601806640625, -0.569854736328125, -0.53369140625, -0.497528076171875, -0.46136474609375, -0.425201416015625, -0.3890380859375, -0.352874755859375, -0.31671142578125, -0.280548095703125, -0.244384765625, -0.208221435546875, -0.17205810546875, -0.135894775390625, -0.0997314453125, -0.063568115234375, -0.02740478515625, 0.008758544921875, 0.044921875, 0.081085205078125, 0.11724853515625, 0.153411865234375, 0.1895751953125, 0.225738525390625, 0.26190185546875, 0.298065185546875, 0.334228515625, 0.370391845703125, 0.40655517578125, 0.442718505859375, 0.4788818359375, 0.515045166015625, 0.55120849609375, 0.587371826171875, 0.62353515625, 0.659698486328125, 0.69586181640625, 0.732025146484375, 0.7681884765625, 0.804351806640625, 0.84051513671875, 0.876678466796875, 0.912841796875, 0.949005126953125, 0.98516845703125, 1.021331787109375, 1.0574951171875, 1.093658447265625, 1.12982177734375, 1.165985107421875, 1.2021484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 10.0, 10.0, 13.0, 27.0, 29.0, 38.0, 61.0, 84.0, 84.0, 108.0, 101.0, 85.0, 88.0, 71.0, 44.0, 36.0, 24.0, 20.0, 9.0, 8.0, 7.0, 11.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014495849609375, -0.00013921968638896942, -0.00013348087668418884, -0.00012774206697940826, -0.00012200325727462769, -0.00011626444756984711, -0.00011052563786506653, -0.00010478682816028595, -9.904801845550537e-05, -9.330920875072479e-05, -8.757039904594421e-05, -8.183158934116364e-05, -7.609277963638306e-05, -7.035396993160248e-05, -6.46151602268219e-05, -5.887635052204132e-05, -5.313754081726074e-05, -4.7398731112480164e-05, -4.1659921407699585e-05, -3.5921111702919006e-05, -3.0182301998138428e-05, -2.444349229335785e-05, -1.870468258857727e-05, -1.2965872883796692e-05, -7.227063179016113e-06, -1.4882534742355347e-06, 4.250556230545044e-06, 9.989365935325623e-06, 1.57281756401062e-05, 2.146698534488678e-05, 2.720579504966736e-05, 3.294460475444794e-05, 3.8683414459228516e-05, 4.4422224164009094e-05, 5.016103386878967e-05, 5.589984357357025e-05, 6.163865327835083e-05, 6.737746298313141e-05, 7.311627268791199e-05, 7.885508239269257e-05, 8.459389209747314e-05, 9.033270180225372e-05, 9.60715115070343e-05, 0.00010181032121181488, 0.00010754913091659546, 0.00011328794062137604, 0.00011902675032615662, 0.0001247655600309372, 0.00013050436973571777, 0.00013624317944049835, 0.00014198198914527893, 0.0001477207988500595, 0.0001534596085548401, 0.00015919841825962067, 0.00016493722796440125, 0.00017067603766918182, 0.0001764148473739624, 0.00018215365707874298, 0.00018789246678352356, 0.00019363127648830414, 0.00019937008619308472, 0.0002051088958978653, 0.00021084770560264587, 0.00021658651530742645, 0.00022232532501220703]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 7.0, 9.0, 14.0, 18.0, 24.0, 40.0, 69.0, 92.0, 114.0, 152.0, 268.0, 300.0, 466.0, 668.0, 935.0, 1332.0, 1894.0, 2697.0, 4001.0, 5947.0, 8994.0, 14110.0, 22573.0, 37153.0, 62455.0, 105099.0, 163640.0, 198819.0, 159017.0, 100306.0, 59610.0, 35368.0, 21630.0, 13429.0, 8692.0, 5712.0, 3955.0, 2602.0, 1878.0, 1291.0, 934.0, 654.0, 463.0, 321.0, 234.0, 180.0, 116.0, 95.0, 51.0, 43.0, 34.0, 18.0, 16.0, 8.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.271484375, -1.229736328125, -1.18798828125, -1.146240234375, -1.1044921875, -1.062744140625, -1.02099609375, -0.979248046875, -0.9375, -0.895751953125, -0.85400390625, -0.812255859375, -0.7705078125, -0.728759765625, -0.68701171875, -0.645263671875, -0.603515625, -0.561767578125, -0.52001953125, -0.478271484375, -0.4365234375, -0.394775390625, -0.35302734375, -0.311279296875, -0.26953125, -0.227783203125, -0.18603515625, -0.144287109375, -0.1025390625, -0.060791015625, -0.01904296875, 0.022705078125, 0.064453125, 0.106201171875, 0.14794921875, 0.189697265625, 0.2314453125, 0.273193359375, 0.31494140625, 0.356689453125, 0.3984375, 0.440185546875, 0.48193359375, 0.523681640625, 0.5654296875, 0.607177734375, 0.64892578125, 0.690673828125, 0.732421875, 0.774169921875, 0.81591796875, 0.857666015625, 0.8994140625, 0.941162109375, 0.98291015625, 1.024658203125, 1.06640625, 1.108154296875, 1.14990234375, 1.191650390625, 1.2333984375, 1.275146484375, 1.31689453125, 1.358642578125, 1.400390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 6.0, 9.0, 10.0, 8.0, 12.0, 14.0, 19.0, 27.0, 27.0, 38.0, 52.0, 56.0, 60.0, 60.0, 71.0, 68.0, 67.0, 70.0, 39.0, 44.0, 38.0, 25.0, 28.0, 29.0, 18.0, 16.0, 14.0, 14.0, 13.0, 8.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.59130859375, -0.5753898620605469, -0.5594711303710938, -0.5435523986816406, -0.5276336669921875, -0.5117149353027344, -0.49579620361328125, -0.4798774719238281, -0.463958740234375, -0.4480400085449219, -0.43212127685546875, -0.4162025451660156, -0.4002838134765625, -0.3843650817871094, -0.36844635009765625, -0.3525276184082031, -0.33660888671875, -0.3206901550292969, -0.30477142333984375, -0.2888526916503906, -0.2729339599609375, -0.2570152282714844, -0.24109649658203125, -0.22517776489257812, -0.209259033203125, -0.19334030151367188, -0.17742156982421875, -0.16150283813476562, -0.1455841064453125, -0.12966537475585938, -0.11374664306640625, -0.09782791137695312, -0.0819091796875, -0.06599044799804688, -0.05007171630859375, -0.034152984619140625, -0.0182342529296875, -0.002315521240234375, 0.01360321044921875, 0.029521942138671875, 0.045440673828125, 0.061359405517578125, 0.07727813720703125, 0.09319686889648438, 0.1091156005859375, 0.12503433227539062, 0.14095306396484375, 0.15687179565429688, 0.17279052734375, 0.18870925903320312, 0.20462799072265625, 0.22054672241210938, 0.2364654541015625, 0.2523841857910156, 0.26830291748046875, 0.2842216491699219, 0.300140380859375, 0.3160591125488281, 0.33197784423828125, 0.3478965759277344, 0.3638153076171875, 0.3797340393066406, 0.39565277099609375, 0.4115715026855469, 0.427490234375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 4.0, 14.0, 13.0, 10.0, 13.0, 13.0, 23.0, 21.0, 26.0, 21.0, 24.0, 34.0, 23.0, 45.0, 33.0, 35.0, 40.0, 45.0, 34.0, 40.0, 33.0, 39.0, 41.0, 35.0, 43.0, 36.0, 25.0, 32.0, 27.0, 21.0, 29.0, 21.0, 17.0, 16.0, 10.0, 11.0, 8.0, 7.0, 6.0, 2.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.540283203125, -22.78327751159668, -22.02627182006836, -21.26926612854004, -20.51226043701172, -19.7552547454834, -18.998249053955078, -18.24124526977539, -17.484237670898438, -16.727231979370117, -15.970226287841797, -15.213220596313477, -14.456214904785156, -13.699209213256836, -12.942204475402832, -12.185198783874512, -11.428194046020508, -10.671188354492188, -9.914182662963867, -9.157176971435547, -8.400171279907227, -7.6431660652160645, -6.886160850524902, -6.129155158996582, -5.372149467468262, -4.615143775939941, -3.8581383228302, -3.101132869720459, -2.3441271781921387, -1.5871214866638184, -0.8301162719726562, -0.07311058044433594, 0.6838970184326172, 1.440902590751648, 2.1979081630706787, 2.95491361618042, 3.7119193077087402, 4.4689249992370605, 5.225930213928223, 5.982935905456543, 6.739941596984863, 7.496947288513184, 8.253952980041504, 9.010957717895508, 9.767963409423828, 10.524969100952148, 11.281974792480469, 12.038980484008789, 12.79598617553711, 13.55299186706543, 14.30999755859375, 15.06700325012207, 15.82400894165039, 16.58101463317871, 17.33802032470703, 18.09502410888672, 18.852031707763672, 19.609037399291992, 20.366043090820312, 21.123048782348633, 21.880054473876953, 22.637060165405273, 23.394065856933594, 24.15106964111328, 24.9080753326416]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 8.0, 4.0, 6.0, 9.0, 13.0, 14.0, 17.0, 17.0, 13.0, 21.0, 23.0, 24.0, 22.0, 28.0, 29.0, 31.0, 28.0, 32.0, 35.0, 33.0, 19.0, 41.0, 43.0, 39.0, 34.0, 39.0, 32.0, 41.0, 29.0, 24.0, 37.0, 26.0, 21.0, 23.0, 25.0, 19.0, 18.0, 15.0, 14.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.398534774780273, -19.63751983642578, -18.87650489807129, -18.115488052368164, -17.354473114013672, -16.59345817565918, -15.832443237304688, -15.071427345275879, -14.31041145324707, -13.549396514892578, -12.78838062286377, -12.027365684509277, -11.266349792480469, -10.505334854125977, -9.744319915771484, -8.983304023742676, -8.222289085388184, -7.461273670196533, -6.700258255004883, -5.939243316650391, -5.178227424621582, -4.41721248626709, -3.6561970710754395, -2.895181655883789, -2.1341662406921387, -1.3731508255004883, -0.6121355295181274, 0.1488797664642334, 0.9098951816558838, 1.6709105968475342, 2.4319257736206055, 3.192941188812256, 3.9539566040039062, 4.714972019195557, 5.475987434387207, 6.237002372741699, 6.998018264770508, 7.759033203125, 8.520048141479492, 9.2810640335083, 10.04207992553711, 10.803094863891602, 11.56411075592041, 12.325125694274902, 13.086141586303711, 13.847156524658203, 14.608171463012695, 15.369187355041504, 16.130203247070312, 16.891218185424805, 17.652233123779297, 18.413249969482422, 19.174264907836914, 19.935279846191406, 20.6962947845459, 21.45730972290039, 22.218324661254883, 22.979339599609375, 23.740354537963867, 24.501371383666992, 25.262386322021484, 26.023401260375977, 26.78441619873047, 27.545433044433594, 28.306447982788086]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 14.0, 21.0, 20.0, 49.0, 56.0, 80.0, 134.0, 223.0, 378.0, 583.0, 925.0, 1540.0, 2305.0, 3523.0, 5462.0, 7999.0, 11623.0, 16566.0, 23408.0, 31575.0, 42069.0, 53219.0, 64699.0, 76336.0, 84886.0, 90499.0, 90121.0, 85599.0, 77742.0, 66809.0, 55118.0, 43482.0, 32971.0, 24297.0, 17583.0, 12210.0, 8459.0, 5471.0, 3813.0, 2433.0, 1586.0, 959.0, 669.0, 434.0, 235.0, 147.0, 116.0, 53.0, 24.0, 19.0, 15.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.765625, -14.30517578125, -13.8447265625, -13.38427734375, -12.923828125, -12.46337890625, -12.0029296875, -11.54248046875, -11.08203125, -10.62158203125, -10.1611328125, -9.70068359375, -9.240234375, -8.77978515625, -8.3193359375, -7.85888671875, -7.3984375, -6.93798828125, -6.4775390625, -6.01708984375, -5.556640625, -5.09619140625, -4.6357421875, -4.17529296875, -3.71484375, -3.25439453125, -2.7939453125, -2.33349609375, -1.873046875, -1.41259765625, -0.9521484375, -0.49169921875, -0.03125, 0.42919921875, 0.8896484375, 1.35009765625, 1.810546875, 2.27099609375, 2.7314453125, 3.19189453125, 3.65234375, 4.11279296875, 4.5732421875, 5.03369140625, 5.494140625, 5.95458984375, 6.4150390625, 6.87548828125, 7.3359375, 7.79638671875, 8.2568359375, 8.71728515625, 9.177734375, 9.63818359375, 10.0986328125, 10.55908203125, 11.01953125, 11.47998046875, 11.9404296875, 12.40087890625, 12.861328125, 13.32177734375, 13.7822265625, 14.24267578125, 14.703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 10.0, 11.0, 24.0, 14.0, 14.0, 12.0, 20.0, 18.0, 26.0, 28.0, 39.0, 35.0, 33.0, 28.0, 41.0, 42.0, 28.0, 35.0, 37.0, 51.0, 43.0, 33.0, 44.0, 29.0, 28.0, 36.0, 29.0, 20.0, 22.0, 17.0, 22.0, 17.0, 17.0, 15.0, 15.0, 9.0, 9.0, 12.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.71875, -21.89013671875, -21.0615234375, -20.23291015625, -19.404296875, -18.57568359375, -17.7470703125, -16.91845703125, -16.08984375, -15.26123046875, -14.4326171875, -13.60400390625, -12.775390625, -11.94677734375, -11.1181640625, -10.28955078125, -9.4609375, -8.63232421875, -7.8037109375, -6.97509765625, -6.146484375, -5.31787109375, -4.4892578125, -3.66064453125, -2.83203125, -2.00341796875, -1.1748046875, -0.34619140625, 0.482421875, 1.31103515625, 2.1396484375, 2.96826171875, 3.796875, 4.62548828125, 5.4541015625, 6.28271484375, 7.111328125, 7.93994140625, 8.7685546875, 9.59716796875, 10.42578125, 11.25439453125, 12.0830078125, 12.91162109375, 13.740234375, 14.56884765625, 15.3974609375, 16.22607421875, 17.0546875, 17.88330078125, 18.7119140625, 19.54052734375, 20.369140625, 21.19775390625, 22.0263671875, 22.85498046875, 23.68359375, 24.51220703125, 25.3408203125, 26.16943359375, 26.998046875, 27.82666015625, 28.6552734375, 29.48388671875, 30.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 4.0, 7.0, 13.0, 20.0, 33.0, 38.0, 73.0, 107.0, 170.0, 276.0, 439.0, 619.0, 958.0, 1448.0, 2133.0, 3207.0, 4905.0, 6997.0, 10108.0, 14641.0, 20434.0, 28172.0, 37624.0, 48007.0, 59840.0, 72054.0, 81922.0, 88381.0, 90722.0, 87582.0, 80494.0, 70802.0, 59543.0, 47751.0, 36513.0, 27297.0, 20255.0, 14175.0, 9863.0, 6889.0, 4656.0, 3226.0, 2112.0, 1360.0, 899.0, 612.0, 424.0, 269.0, 161.0, 106.0, 83.0, 51.0, 42.0, 15.0, 13.0, 13.0, 4.0, 4.0, 2.0, 1.0], "bins": [-15.0078125, -14.5455322265625, -14.083251953125, -13.6209716796875, -13.15869140625, -12.6964111328125, -12.234130859375, -11.7718505859375, -11.3095703125, -10.8472900390625, -10.385009765625, -9.9227294921875, -9.46044921875, -8.9981689453125, -8.535888671875, -8.0736083984375, -7.611328125, -7.1490478515625, -6.686767578125, -6.2244873046875, -5.76220703125, -5.2999267578125, -4.837646484375, -4.3753662109375, -3.9130859375, -3.4508056640625, -2.988525390625, -2.5262451171875, -2.06396484375, -1.6016845703125, -1.139404296875, -0.6771240234375, -0.21484375, 0.2474365234375, 0.709716796875, 1.1719970703125, 1.63427734375, 2.0965576171875, 2.558837890625, 3.0211181640625, 3.4833984375, 3.9456787109375, 4.407958984375, 4.8702392578125, 5.33251953125, 5.7947998046875, 6.257080078125, 6.7193603515625, 7.181640625, 7.6439208984375, 8.106201171875, 8.5684814453125, 9.03076171875, 9.4930419921875, 9.955322265625, 10.4176025390625, 10.8798828125, 11.3421630859375, 11.804443359375, 12.2667236328125, 12.72900390625, 13.1912841796875, 13.653564453125, 14.1158447265625, 14.578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 8.0, 9.0, 9.0, 13.0, 14.0, 10.0, 11.0, 14.0, 23.0, 18.0, 25.0, 24.0, 21.0, 29.0, 38.0, 36.0, 24.0, 32.0, 40.0, 28.0, 35.0, 37.0, 40.0, 27.0, 31.0, 35.0, 36.0, 31.0, 29.0, 37.0, 25.0, 29.0, 24.0, 23.0, 24.0, 11.0, 15.0, 11.0, 16.0, 6.0, 13.0, 10.0, 4.0, 6.0, 3.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-16.515625, -16.0172119140625, -15.518798828125, -15.0203857421875, -14.52197265625, -14.0235595703125, -13.525146484375, -13.0267333984375, -12.5283203125, -12.0299072265625, -11.531494140625, -11.0330810546875, -10.53466796875, -10.0362548828125, -9.537841796875, -9.0394287109375, -8.541015625, -8.0426025390625, -7.544189453125, -7.0457763671875, -6.54736328125, -6.0489501953125, -5.550537109375, -5.0521240234375, -4.5537109375, -4.0552978515625, -3.556884765625, -3.0584716796875, -2.56005859375, -2.0616455078125, -1.563232421875, -1.0648193359375, -0.56640625, -0.0679931640625, 0.430419921875, 0.9288330078125, 1.42724609375, 1.9256591796875, 2.424072265625, 2.9224853515625, 3.4208984375, 3.9193115234375, 4.417724609375, 4.9161376953125, 5.41455078125, 5.9129638671875, 6.411376953125, 6.9097900390625, 7.408203125, 7.9066162109375, 8.405029296875, 8.9034423828125, 9.40185546875, 9.9002685546875, 10.398681640625, 10.8970947265625, 11.3955078125, 11.8939208984375, 12.392333984375, 12.8907470703125, 13.38916015625, 13.8875732421875, 14.385986328125, 14.8843994140625, 15.3828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 14.0, 21.0, 33.0, 49.0, 71.0, 92.0, 137.0, 226.0, 319.0, 493.0, 854.0, 1181.0, 1868.0, 2826.0, 4347.0, 6344.0, 9771.0, 14107.0, 20584.0, 29003.0, 39876.0, 52445.0, 66200.0, 79296.0, 90381.0, 96900.0, 96999.0, 91734.0, 81617.0, 68056.0, 54374.0, 41532.0, 30106.0, 21317.0, 15210.0, 10179.0, 6829.0, 4557.0, 2930.0, 1967.0, 1271.0, 814.0, 524.0, 395.0, 219.0, 148.0, 95.0, 79.0, 41.0, 42.0, 20.0, 26.0, 10.0, 9.0, 9.0, 3.0, 4.0, 5.0], "bins": [-5.53515625, -5.362548828125, -5.18994140625, -5.017333984375, -4.8447265625, -4.672119140625, -4.49951171875, -4.326904296875, -4.154296875, -3.981689453125, -3.80908203125, -3.636474609375, -3.4638671875, -3.291259765625, -3.11865234375, -2.946044921875, -2.7734375, -2.600830078125, -2.42822265625, -2.255615234375, -2.0830078125, -1.910400390625, -1.73779296875, -1.565185546875, -1.392578125, -1.219970703125, -1.04736328125, -0.874755859375, -0.7021484375, -0.529541015625, -0.35693359375, -0.184326171875, -0.01171875, 0.160888671875, 0.33349609375, 0.506103515625, 0.6787109375, 0.851318359375, 1.02392578125, 1.196533203125, 1.369140625, 1.541748046875, 1.71435546875, 1.886962890625, 2.0595703125, 2.232177734375, 2.40478515625, 2.577392578125, 2.75, 2.922607421875, 3.09521484375, 3.267822265625, 3.4404296875, 3.613037109375, 3.78564453125, 3.958251953125, 4.130859375, 4.303466796875, 4.47607421875, 4.648681640625, 4.8212890625, 4.993896484375, 5.16650390625, 5.339111328125, 5.51171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 1.0, 3.0, 14.0, 9.0, 14.0, 21.0, 25.0, 30.0, 21.0, 33.0, 25.0, 46.0, 37.0, 39.0, 46.0, 48.0, 49.0, 46.0, 60.0, 40.0, 47.0, 44.0, 44.0, 36.0, 36.0, 20.0, 31.0, 23.0, 19.0, 17.0, 16.0, 21.0, 7.0, 11.0, 7.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007042884826660156, -0.0006781965494155884, -0.0006521046161651611, -0.0006260126829147339, -0.0005999207496643066, -0.0005738288164138794, -0.0005477368831634521, -0.0005216449499130249, -0.0004955530166625977, -0.0004694610834121704, -0.00044336915016174316, -0.0004172772169113159, -0.00039118528366088867, -0.0003650933504104614, -0.0003390014171600342, -0.00031290948390960693, -0.0002868175506591797, -0.00026072561740875244, -0.0002346336841583252, -0.00020854175090789795, -0.0001824498176574707, -0.00015635788440704346, -0.0001302659511566162, -0.00010417401790618896, -7.808208465576172e-05, -5.199015140533447e-05, -2.5898218154907227e-05, 1.9371509552001953e-07, 2.6285648345947266e-05, 5.237758159637451e-05, 7.846951484680176e-05, 0.000104561448097229, 0.00013065338134765625, 0.0001567453145980835, 0.00018283724784851074, 0.000208929181098938, 0.00023502111434936523, 0.0002611130475997925, 0.0002872049808502197, 0.00031329691410064697, 0.0003393888473510742, 0.00036548078060150146, 0.0003915727138519287, 0.00041766464710235596, 0.0004437565803527832, 0.00046984851360321045, 0.0004959404468536377, 0.0005220323801040649, 0.0005481243133544922, 0.0005742162466049194, 0.0006003081798553467, 0.0006264001131057739, 0.0006524920463562012, 0.0006785839796066284, 0.0007046759128570557, 0.0007307678461074829, 0.0007568597793579102, 0.0007829517126083374, 0.0008090436458587646, 0.0008351355791091919, 0.0008612275123596191, 0.0008873194456100464, 0.0009134113788604736, 0.0009395033121109009, 0.0009655952453613281]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 16.0, 32.0, 36.0, 47.0, 73.0, 143.0, 186.0, 304.0, 451.0, 687.0, 1108.0, 1627.0, 2585.0, 3990.0, 6101.0, 9616.0, 14365.0, 21375.0, 30958.0, 43028.0, 58411.0, 74361.0, 89505.0, 100723.0, 105712.0, 102670.0, 92494.0, 77680.0, 61838.0, 46505.0, 33456.0, 23200.0, 15622.0, 10432.0, 6703.0, 4429.0, 2872.0, 1877.0, 1183.0, 784.0, 461.0, 307.0, 218.0, 123.0, 88.0, 69.0, 39.0, 20.0, 22.0, 8.0, 6.0, 4.0, 4.0], "bins": [-7.16796875, -6.9666748046875, -6.765380859375, -6.5640869140625, -6.36279296875, -6.1614990234375, -5.960205078125, -5.7589111328125, -5.5576171875, -5.3563232421875, -5.155029296875, -4.9537353515625, -4.75244140625, -4.5511474609375, -4.349853515625, -4.1485595703125, -3.947265625, -3.7459716796875, -3.544677734375, -3.3433837890625, -3.14208984375, -2.9407958984375, -2.739501953125, -2.5382080078125, -2.3369140625, -2.1356201171875, -1.934326171875, -1.7330322265625, -1.53173828125, -1.3304443359375, -1.129150390625, -0.9278564453125, -0.7265625, -0.5252685546875, -0.323974609375, -0.1226806640625, 0.07861328125, 0.2799072265625, 0.481201171875, 0.6824951171875, 0.8837890625, 1.0850830078125, 1.286376953125, 1.4876708984375, 1.68896484375, 1.8902587890625, 2.091552734375, 2.2928466796875, 2.494140625, 2.6954345703125, 2.896728515625, 3.0980224609375, 3.29931640625, 3.5006103515625, 3.701904296875, 3.9031982421875, 4.1044921875, 4.3057861328125, 4.507080078125, 4.7083740234375, 4.90966796875, 5.1109619140625, 5.312255859375, 5.5135498046875, 5.71484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 14.0, 12.0, 17.0, 13.0, 19.0, 33.0, 22.0, 30.0, 43.0, 37.0, 39.0, 41.0, 49.0, 48.0, 59.0, 55.0, 42.0, 50.0, 43.0, 40.0, 39.0, 34.0, 33.0, 25.0, 18.0, 16.0, 18.0, 9.0, 12.0, 16.0, 10.0, 11.0, 6.0, 6.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.134307861328125, -3.03619384765625, -2.938079833984375, -2.8399658203125, -2.741851806640625, -2.64373779296875, -2.545623779296875, -2.447509765625, -2.349395751953125, -2.25128173828125, -2.153167724609375, -2.0550537109375, -1.956939697265625, -1.85882568359375, -1.760711669921875, -1.66259765625, -1.564483642578125, -1.46636962890625, -1.368255615234375, -1.2701416015625, -1.172027587890625, -1.07391357421875, -0.975799560546875, -0.877685546875, -0.779571533203125, -0.68145751953125, -0.583343505859375, -0.4852294921875, -0.387115478515625, -0.28900146484375, -0.190887451171875, -0.0927734375, 0.005340576171875, 0.10345458984375, 0.201568603515625, 0.2996826171875, 0.397796630859375, 0.49591064453125, 0.594024658203125, 0.692138671875, 0.790252685546875, 0.88836669921875, 0.986480712890625, 1.0845947265625, 1.182708740234375, 1.28082275390625, 1.378936767578125, 1.47705078125, 1.575164794921875, 1.67327880859375, 1.771392822265625, 1.8695068359375, 1.967620849609375, 2.06573486328125, 2.163848876953125, 2.261962890625, 2.360076904296875, 2.45819091796875, 2.556304931640625, 2.6544189453125, 2.752532958984375, 2.85064697265625, 2.948760986328125, 3.046875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 8.0, 6.0, 6.0, 8.0, 13.0, 12.0, 12.0, 12.0, 19.0, 25.0, 19.0, 26.0, 20.0, 22.0, 22.0, 37.0, 27.0, 45.0, 40.0, 36.0, 37.0, 41.0, 38.0, 39.0, 23.0, 31.0, 46.0, 41.0, 33.0, 24.0, 32.0, 29.0, 32.0, 17.0, 19.0, 20.0, 13.0, 16.0, 6.0, 9.0, 8.0, 6.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.452224731445312, -20.738773345947266, -20.02532196044922, -19.31186866760254, -18.598417282104492, -17.884965896606445, -17.1715145111084, -16.45806121826172, -15.744609832763672, -15.031158447265625, -14.317706108093262, -13.604254722595215, -12.890802383422852, -12.177350997924805, -11.463899612426758, -10.750447273254395, -10.036995887756348, -9.3235445022583, -8.610092163085938, -7.896640777587891, -7.183188438415527, -6.4697370529174805, -5.756285190582275, -5.04283332824707, -4.329381465911865, -3.61592960357666, -2.902477741241455, -2.189026117324829, -1.475574254989624, -0.762122392654419, -0.04867076873779297, 0.6647810935974121, 1.3782329559326172, 2.0916848182678223, 2.8051366806030273, 3.5185883045196533, 4.2320404052734375, 4.945491790771484, 5.6589436531066895, 6.3723955154418945, 7.0858473777771, 7.799299240112305, 8.512750625610352, 9.226202964782715, 9.939654350280762, 10.653106689453125, 11.366558074951172, 12.080009460449219, 12.793461799621582, 13.506913185119629, 14.220365524291992, 14.933816909790039, 15.647269248962402, 16.360721588134766, 17.074172973632812, 17.78762435913086, 18.501075744628906, 19.214527130126953, 19.927978515625, 20.64143180847168, 21.354883193969727, 22.068334579467773, 22.78178596496582, 23.4952392578125, 24.208690643310547]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 1.0, 11.0, 12.0, 16.0, 19.0, 13.0, 17.0, 31.0, 24.0, 39.0, 24.0, 39.0, 30.0, 34.0, 44.0, 44.0, 48.0, 50.0, 43.0, 40.0, 42.0, 39.0, 38.0, 34.0, 32.0, 29.0, 23.0, 24.0, 23.0, 22.0, 18.0, 12.0, 11.0, 11.0, 13.0, 9.0, 10.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.564584732055664, -25.62040138244629, -24.67621612548828, -23.732032775878906, -22.78784942626953, -21.843666076660156, -20.89948272705078, -19.955297470092773, -19.0111141204834, -18.066930770874023, -17.122745513916016, -16.17856216430664, -15.234378814697266, -14.29019546508789, -13.3460111618042, -12.401826858520508, -11.457643508911133, -10.513460159301758, -9.569275856018066, -8.625091552734375, -7.680908203125, -6.736724376678467, -5.792540550231934, -4.8483567237854, -3.904172897338867, -2.959989070892334, -2.015805244445801, -1.0716214179992676, -0.12743759155273438, 0.8167462348937988, 1.760930061340332, 2.7051138877868652, 3.6492996215820312, 4.5934834480285645, 5.537667274475098, 6.481851100921631, 7.426034927368164, 8.370218276977539, 9.31440258026123, 10.258586883544922, 11.202770233154297, 12.146953582763672, 13.091137886047363, 14.035322189331055, 14.97950553894043, 15.923688888549805, 16.867874145507812, 17.812057495117188, 18.756240844726562, 19.700424194335938, 20.644607543945312, 21.58879280090332, 22.532976150512695, 23.47715950012207, 24.421344757080078, 25.365528106689453, 26.309711456298828, 27.253894805908203, 28.198078155517578, 29.142263412475586, 30.08644676208496, 31.030630111694336, 31.974815368652344, 32.91899871826172, 33.863182067871094]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 24.0, 30.0, 45.0, 82.0, 159.0, 223.0, 437.0, 754.0, 1318.0, 2176.0, 3609.0, 6120.0, 9931.0, 15790.0, 25085.0, 38924.0, 58334.0, 86149.0, 122424.0, 168737.0, 221295.0, 279251.0, 333199.0, 376400.0, 396491.0, 392899.0, 364900.0, 320936.0, 265793.0, 208349.0, 156054.0, 112846.0, 78364.0, 52611.0, 34841.0, 22309.0, 14445.0, 8866.0, 5609.0, 3418.0, 2016.0, 1200.0, 695.0, 455.0, 264.0, 170.0, 110.0, 55.0, 44.0, 16.0, 19.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.783447265625, -17.20751953125, -16.631591796875, -16.0556640625, -15.479736328125, -14.90380859375, -14.327880859375, -13.751953125, -13.176025390625, -12.60009765625, -12.024169921875, -11.4482421875, -10.872314453125, -10.29638671875, -9.720458984375, -9.14453125, -8.568603515625, -7.99267578125, -7.416748046875, -6.8408203125, -6.264892578125, -5.68896484375, -5.113037109375, -4.537109375, -3.961181640625, -3.38525390625, -2.809326171875, -2.2333984375, -1.657470703125, -1.08154296875, -0.505615234375, 0.0703125, 0.646240234375, 1.22216796875, 1.798095703125, 2.3740234375, 2.949951171875, 3.52587890625, 4.101806640625, 4.677734375, 5.253662109375, 5.82958984375, 6.405517578125, 6.9814453125, 7.557373046875, 8.13330078125, 8.709228515625, 9.28515625, 9.861083984375, 10.43701171875, 11.012939453125, 11.5888671875, 12.164794921875, 12.74072265625, 13.316650390625, 13.892578125, 14.468505859375, 15.04443359375, 15.620361328125, 16.1962890625, 16.772216796875, 17.34814453125, 17.924072265625, 18.5]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 8.0, 5.0, 7.0, 10.0, 8.0, 15.0, 14.0, 14.0, 14.0, 15.0, 24.0, 14.0, 35.0, 31.0, 37.0, 36.0, 46.0, 42.0, 49.0, 41.0, 33.0, 33.0, 49.0, 37.0, 39.0, 42.0, 28.0, 32.0, 30.0, 28.0, 25.0, 29.0, 23.0, 19.0, 17.0, 13.0, 12.0, 9.0, 12.0, 7.0, 10.0, 5.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.921875, -19.17138671875, -18.4208984375, -17.67041015625, -16.919921875, -16.16943359375, -15.4189453125, -14.66845703125, -13.91796875, -13.16748046875, -12.4169921875, -11.66650390625, -10.916015625, -10.16552734375, -9.4150390625, -8.66455078125, -7.9140625, -7.16357421875, -6.4130859375, -5.66259765625, -4.912109375, -4.16162109375, -3.4111328125, -2.66064453125, -1.91015625, -1.15966796875, -0.4091796875, 0.34130859375, 1.091796875, 1.84228515625, 2.5927734375, 3.34326171875, 4.09375, 4.84423828125, 5.5947265625, 6.34521484375, 7.095703125, 7.84619140625, 8.5966796875, 9.34716796875, 10.09765625, 10.84814453125, 11.5986328125, 12.34912109375, 13.099609375, 13.85009765625, 14.6005859375, 15.35107421875, 16.1015625, 16.85205078125, 17.6025390625, 18.35302734375, 19.103515625, 19.85400390625, 20.6044921875, 21.35498046875, 22.10546875, 22.85595703125, 23.6064453125, 24.35693359375, 25.107421875, 25.85791015625, 26.6083984375, 27.35888671875, 28.109375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 12.0, 46.0, 53.0, 115.0, 198.0, 416.0, 681.0, 1209.0, 2261.0, 3657.0, 6290.0, 10435.0, 17270.0, 27662.0, 42852.0, 65283.0, 95128.0, 134154.0, 180834.0, 234065.0, 286730.0, 335238.0, 369249.0, 385563.0, 380392.0, 354573.0, 310661.0, 259022.0, 204484.0, 155555.0, 112600.0, 77634.0, 51812.0, 34085.0, 21785.0, 13326.0, 7995.0, 4669.0, 2722.0, 1612.0, 910.0, 438.0, 275.0, 145.0, 86.0, 51.0, 23.0, 13.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.855224609375, -18.24169921875, -17.628173828125, -17.0146484375, -16.401123046875, -15.78759765625, -15.174072265625, -14.560546875, -13.947021484375, -13.33349609375, -12.719970703125, -12.1064453125, -11.492919921875, -10.87939453125, -10.265869140625, -9.65234375, -9.038818359375, -8.42529296875, -7.811767578125, -7.1982421875, -6.584716796875, -5.97119140625, -5.357666015625, -4.744140625, -4.130615234375, -3.51708984375, -2.903564453125, -2.2900390625, -1.676513671875, -1.06298828125, -0.449462890625, 0.1640625, 0.777587890625, 1.39111328125, 2.004638671875, 2.6181640625, 3.231689453125, 3.84521484375, 4.458740234375, 5.072265625, 5.685791015625, 6.29931640625, 6.912841796875, 7.5263671875, 8.139892578125, 8.75341796875, 9.366943359375, 9.98046875, 10.593994140625, 11.20751953125, 11.821044921875, 12.4345703125, 13.048095703125, 13.66162109375, 14.275146484375, 14.888671875, 15.502197265625, 16.11572265625, 16.729248046875, 17.3427734375, 17.956298828125, 18.56982421875, 19.183349609375, 19.796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 10.0, 19.0, 16.0, 19.0, 19.0, 23.0, 26.0, 42.0, 41.0, 40.0, 54.0, 79.0, 83.0, 79.0, 95.0, 151.0, 136.0, 162.0, 156.0, 169.0, 170.0, 182.0, 216.0, 177.0, 189.0, 175.0, 175.0, 151.0, 160.0, 142.0, 118.0, 116.0, 109.0, 84.0, 86.0, 59.0, 77.0, 52.0, 38.0, 38.0, 38.0, 22.0, 16.0, 17.0, 12.0, 10.0, 9.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-10.390625, -10.0684814453125, -9.746337890625, -9.4241943359375, -9.10205078125, -8.7799072265625, -8.457763671875, -8.1356201171875, -7.8134765625, -7.4913330078125, -7.169189453125, -6.8470458984375, -6.52490234375, -6.2027587890625, -5.880615234375, -5.5584716796875, -5.236328125, -4.9141845703125, -4.592041015625, -4.2698974609375, -3.94775390625, -3.6256103515625, -3.303466796875, -2.9813232421875, -2.6591796875, -2.3370361328125, -2.014892578125, -1.6927490234375, -1.37060546875, -1.0484619140625, -0.726318359375, -0.4041748046875, -0.08203125, 0.2401123046875, 0.562255859375, 0.8843994140625, 1.20654296875, 1.5286865234375, 1.850830078125, 2.1729736328125, 2.4951171875, 2.8172607421875, 3.139404296875, 3.4615478515625, 3.78369140625, 4.1058349609375, 4.427978515625, 4.7501220703125, 5.072265625, 5.3944091796875, 5.716552734375, 6.0386962890625, 6.36083984375, 6.6829833984375, 7.005126953125, 7.3272705078125, 7.6494140625, 7.9715576171875, 8.293701171875, 8.6158447265625, 8.93798828125, 9.2601318359375, 9.582275390625, 9.9044189453125, 10.2265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 3.0, 13.0, 12.0, 7.0, 22.0, 15.0, 19.0, 24.0, 20.0, 17.0, 14.0, 30.0, 29.0, 39.0, 33.0, 37.0, 34.0, 43.0, 37.0, 42.0, 37.0, 42.0, 40.0, 40.0, 45.0, 39.0, 24.0, 28.0, 21.0, 11.0, 16.0, 33.0, 24.0, 21.0, 15.0, 13.0, 12.0, 8.0, 12.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.218730926513672, -25.436527252197266, -24.654325485229492, -23.872121810913086, -23.089920043945312, -22.307716369628906, -21.5255126953125, -20.743309020996094, -19.96110725402832, -19.178903579711914, -18.39670181274414, -17.614498138427734, -16.832294464111328, -16.050092697143555, -15.267889022827148, -14.485686302185059, -13.703483581542969, -12.921280860900879, -12.139078140258789, -11.356874465942383, -10.574671745300293, -9.792469024658203, -9.010265350341797, -8.228062629699707, -7.445859909057617, -6.663657188415527, -5.881453990936279, -5.099250793457031, -4.317048072814941, -3.5348451137542725, -2.7526421546936035, -1.9704389572143555, -1.1882381439208984, -0.4060351848602295, 0.37616777420043945, 1.1583707332611084, 1.9405736923217773, 2.7227766513824463, 3.5049796104431152, 4.287182807922363, 5.069385528564453, 5.851588249206543, 6.633791446685791, 7.415994644165039, 8.198197364807129, 8.980400085449219, 9.762603759765625, 10.544806480407715, 11.327009201049805, 12.109211921691895, 12.891414642333984, 13.67361831665039, 14.45582103729248, 15.23802375793457, 16.020227432250977, 16.80242919921875, 17.584632873535156, 18.366836547851562, 19.149038314819336, 19.931241989135742, 20.713443756103516, 21.495647430419922, 22.277851104736328, 23.060054779052734, 23.842256546020508]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 7.0, 12.0, 12.0, 17.0, 14.0, 14.0, 27.0, 12.0, 25.0, 21.0, 22.0, 29.0, 38.0, 32.0, 42.0, 39.0, 35.0, 34.0, 34.0, 40.0, 43.0, 36.0, 34.0, 45.0, 55.0, 40.0, 25.0, 25.0, 21.0, 20.0, 22.0, 13.0, 19.0, 13.0, 13.0, 17.0, 14.0, 5.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.830825805664062, -26.948915481567383, -26.067005157470703, -25.185094833374023, -24.303184509277344, -23.421274185180664, -22.539363861083984, -21.657451629638672, -20.775543212890625, -19.893632888793945, -19.011722564697266, -18.129812240600586, -17.247901916503906, -16.365991592407227, -15.48408031463623, -14.60216999053955, -13.720258712768555, -12.838348388671875, -11.956438064575195, -11.074527740478516, -10.192617416381836, -9.310707092285156, -8.42879581451416, -7.5468854904174805, -6.664975166320801, -5.783064842224121, -4.901154518127441, -4.0192437171936035, -3.137333393096924, -2.255423069000244, -1.3735122680664062, -0.49160194396972656, 0.3903064727783203, 1.2722169160842896, 2.154127359390259, 3.0360379219055176, 3.9179482460021973, 4.799858570098877, 5.681769371032715, 6.5636796951293945, 7.445590019226074, 8.327500343322754, 9.209410667419434, 10.09132194519043, 10.97323226928711, 11.855142593383789, 12.737052917480469, 13.618963241577148, 14.500873565673828, 15.382783889770508, 16.264694213867188, 17.146604537963867, 18.028514862060547, 18.910425186157227, 19.792335510253906, 20.67424774169922, 21.556156158447266, 22.438066482543945, 23.319976806640625, 24.201887130737305, 25.083797454833984, 25.965707778930664, 26.847618103027344, 27.729530334472656, 28.611440658569336]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 6.0, 5.0, 6.0, 23.0, 26.0, 38.0, 64.0, 82.0, 111.0, 177.0, 263.0, 409.0, 645.0, 935.0, 1381.0, 2055.0, 3235.0, 4850.0, 7498.0, 11061.0, 16878.0, 25113.0, 38372.0, 55552.0, 77076.0, 101115.0, 120944.0, 129356.0, 119707.0, 97734.0, 73870.0, 52699.0, 35933.0, 24160.0, 16247.0, 10574.0, 6891.0, 4632.0, 2969.0, 1991.0, 1197.0, 861.0, 594.0, 391.0, 284.0, 185.0, 125.0, 76.0, 62.0, 37.0, 15.0, 19.0, 10.0, 10.0, 4.0, 9.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.76171875, -3.63812255859375, -3.5145263671875, -3.39093017578125, -3.267333984375, -3.14373779296875, -3.0201416015625, -2.89654541015625, -2.77294921875, -2.64935302734375, -2.5257568359375, -2.40216064453125, -2.278564453125, -2.15496826171875, -2.0313720703125, -1.90777587890625, -1.7841796875, -1.66058349609375, -1.5369873046875, -1.41339111328125, -1.289794921875, -1.16619873046875, -1.0426025390625, -0.91900634765625, -0.79541015625, -0.67181396484375, -0.5482177734375, -0.42462158203125, -0.301025390625, -0.17742919921875, -0.0538330078125, 0.06976318359375, 0.193359375, 0.31695556640625, 0.4405517578125, 0.56414794921875, 0.687744140625, 0.81134033203125, 0.9349365234375, 1.05853271484375, 1.18212890625, 1.30572509765625, 1.4293212890625, 1.55291748046875, 1.676513671875, 1.80010986328125, 1.9237060546875, 2.04730224609375, 2.1708984375, 2.29449462890625, 2.4180908203125, 2.54168701171875, 2.665283203125, 2.78887939453125, 2.9124755859375, 3.03607177734375, 3.15966796875, 3.28326416015625, 3.4068603515625, 3.53045654296875, 3.654052734375, 3.77764892578125, 3.9012451171875, 4.02484130859375, 4.1484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 8.0, 6.0, 11.0, 16.0, 14.0, 15.0, 16.0, 20.0, 30.0, 25.0, 28.0, 20.0, 34.0, 36.0, 42.0, 37.0, 29.0, 39.0, 35.0, 43.0, 57.0, 38.0, 52.0, 40.0, 31.0, 36.0, 23.0, 32.0, 26.0, 22.0, 20.0, 15.0, 14.0, 16.0, 15.0, 10.0, 18.0, 8.0, 5.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.328125, -26.374755859375, -25.42138671875, -24.468017578125, -23.5146484375, -22.561279296875, -21.60791015625, -20.654541015625, -19.701171875, -18.747802734375, -17.79443359375, -16.841064453125, -15.8876953125, -14.934326171875, -13.98095703125, -13.027587890625, -12.07421875, -11.120849609375, -10.16748046875, -9.214111328125, -8.2607421875, -7.307373046875, -6.35400390625, -5.400634765625, -4.447265625, -3.493896484375, -2.54052734375, -1.587158203125, -0.6337890625, 0.319580078125, 1.27294921875, 2.226318359375, 3.1796875, 4.133056640625, 5.08642578125, 6.039794921875, 6.9931640625, 7.946533203125, 8.89990234375, 9.853271484375, 10.806640625, 11.760009765625, 12.71337890625, 13.666748046875, 14.6201171875, 15.573486328125, 16.52685546875, 17.480224609375, 18.43359375, 19.386962890625, 20.34033203125, 21.293701171875, 22.2470703125, 23.200439453125, 24.15380859375, 25.107177734375, 26.060546875, 27.013916015625, 27.96728515625, 28.920654296875, 29.8740234375, 30.827392578125, 31.78076171875, 32.734130859375, 33.6875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 16.0, 16.0, 26.0, 30.0, 43.0, 74.0, 101.0, 185.0, 261.0, 398.0, 645.0, 1050.0, 1621.0, 2822.0, 4594.0, 7709.0, 12947.0, 21951.0, 37213.0, 61693.0, 96930.0, 137971.0, 165875.0, 159423.0, 124050.0, 82998.0, 51810.0, 30671.0, 18246.0, 10852.0, 6386.0, 3838.0, 2342.0, 1391.0, 810.0, 524.0, 366.0, 223.0, 134.0, 115.0, 58.0, 38.0, 40.0, 28.0, 11.0, 8.0, 8.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.953125, -4.79241943359375, -4.6317138671875, -4.47100830078125, -4.310302734375, -4.14959716796875, -3.9888916015625, -3.82818603515625, -3.66748046875, -3.50677490234375, -3.3460693359375, -3.18536376953125, -3.024658203125, -2.86395263671875, -2.7032470703125, -2.54254150390625, -2.3818359375, -2.22113037109375, -2.0604248046875, -1.89971923828125, -1.739013671875, -1.57830810546875, -1.4176025390625, -1.25689697265625, -1.09619140625, -0.93548583984375, -0.7747802734375, -0.61407470703125, -0.453369140625, -0.29266357421875, -0.1319580078125, 0.02874755859375, 0.189453125, 0.35015869140625, 0.5108642578125, 0.67156982421875, 0.832275390625, 0.99298095703125, 1.1536865234375, 1.31439208984375, 1.47509765625, 1.63580322265625, 1.7965087890625, 1.95721435546875, 2.117919921875, 2.27862548828125, 2.4393310546875, 2.60003662109375, 2.7607421875, 2.92144775390625, 3.0821533203125, 3.24285888671875, 3.403564453125, 3.56427001953125, 3.7249755859375, 3.88568115234375, 4.04638671875, 4.20709228515625, 4.3677978515625, 4.52850341796875, 4.689208984375, 4.84991455078125, 5.0106201171875, 5.17132568359375, 5.33203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 8.0, 5.0, 10.0, 7.0, 11.0, 11.0, 14.0, 17.0, 16.0, 27.0, 26.0, 22.0, 24.0, 20.0, 41.0, 40.0, 37.0, 38.0, 25.0, 37.0, 27.0, 29.0, 33.0, 41.0, 39.0, 27.0, 35.0, 32.0, 32.0, 32.0, 31.0, 19.0, 18.0, 18.0, 24.0, 21.0, 20.0, 15.0, 14.0, 11.0, 15.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-17.140625, -16.605224609375, -16.06982421875, -15.534423828125, -14.9990234375, -14.463623046875, -13.92822265625, -13.392822265625, -12.857421875, -12.322021484375, -11.78662109375, -11.251220703125, -10.7158203125, -10.180419921875, -9.64501953125, -9.109619140625, -8.57421875, -8.038818359375, -7.50341796875, -6.968017578125, -6.4326171875, -5.897216796875, -5.36181640625, -4.826416015625, -4.291015625, -3.755615234375, -3.22021484375, -2.684814453125, -2.1494140625, -1.614013671875, -1.07861328125, -0.543212890625, -0.0078125, 0.527587890625, 1.06298828125, 1.598388671875, 2.1337890625, 2.669189453125, 3.20458984375, 3.739990234375, 4.275390625, 4.810791015625, 5.34619140625, 5.881591796875, 6.4169921875, 6.952392578125, 7.48779296875, 8.023193359375, 8.55859375, 9.093994140625, 9.62939453125, 10.164794921875, 10.7001953125, 11.235595703125, 11.77099609375, 12.306396484375, 12.841796875, 13.377197265625, 13.91259765625, 14.447998046875, 14.9833984375, 15.518798828125, 16.05419921875, 16.589599609375, 17.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 11.0, 12.0, 21.0, 29.0, 35.0, 65.0, 84.0, 147.0, 210.0, 387.0, 689.0, 1190.0, 2481.0, 5359.0, 13580.0, 38566.0, 124402.0, 349906.0, 336205.0, 116505.0, 35674.0, 12493.0, 5161.0, 2442.0, 1274.0, 653.0, 376.0, 195.0, 138.0, 82.0, 46.0, 36.0, 25.0, 23.0, 12.0, 11.0, 7.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5883636474609375, -1.537078857421875, -1.4857940673828125, -1.43450927734375, -1.3832244873046875, -1.331939697265625, -1.2806549072265625, -1.2293701171875, -1.1780853271484375, -1.126800537109375, -1.0755157470703125, -1.02423095703125, -0.9729461669921875, -0.921661376953125, -0.8703765869140625, -0.819091796875, -0.7678070068359375, -0.716522216796875, -0.6652374267578125, -0.61395263671875, -0.5626678466796875, -0.511383056640625, -0.4600982666015625, -0.4088134765625, -0.3575286865234375, -0.306243896484375, -0.2549591064453125, -0.20367431640625, -0.1523895263671875, -0.101104736328125, -0.0498199462890625, 0.00146484375, 0.0527496337890625, 0.104034423828125, 0.1553192138671875, 0.20660400390625, 0.2578887939453125, 0.309173583984375, 0.3604583740234375, 0.4117431640625, 0.4630279541015625, 0.514312744140625, 0.5655975341796875, 0.61688232421875, 0.6681671142578125, 0.719451904296875, 0.7707366943359375, 0.822021484375, 0.8733062744140625, 0.924591064453125, 0.9758758544921875, 1.02716064453125, 1.0784454345703125, 1.129730224609375, 1.1810150146484375, 1.2322998046875, 1.2835845947265625, 1.334869384765625, 1.3861541748046875, 1.43743896484375, 1.4887237548828125, 1.540008544921875, 1.5912933349609375, 1.642578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 8.0, 6.0, 7.0, 5.0, 12.0, 7.0, 13.0, 11.0, 32.0, 21.0, 24.0, 25.0, 33.0, 48.0, 52.0, 48.0, 38.0, 57.0, 59.0, 54.0, 63.0, 47.0, 34.0, 42.0, 45.0, 36.0, 30.0, 23.0, 24.0, 19.0, 12.0, 18.0, 9.0, 4.0, 9.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.666515350341797e-05, -8.384697139263153e-05, -8.102878928184509e-05, -7.821060717105865e-05, -7.539242506027222e-05, -7.257424294948578e-05, -6.975606083869934e-05, -6.69378787279129e-05, -6.411969661712646e-05, -6.130151450634003e-05, -5.848333239555359e-05, -5.566515028476715e-05, -5.284696817398071e-05, -5.0028786063194275e-05, -4.721060395240784e-05, -4.43924218416214e-05, -4.157423973083496e-05, -3.875605762004852e-05, -3.5937875509262085e-05, -3.311969339847565e-05, -3.030151128768921e-05, -2.748332917690277e-05, -2.4665147066116333e-05, -2.1846964955329895e-05, -1.9028782844543457e-05, -1.621060073375702e-05, -1.3392418622970581e-05, -1.0574236512184143e-05, -7.756054401397705e-06, -4.937872290611267e-06, -2.119690179824829e-06, 6.984919309616089e-07, 3.516674041748047e-06, 6.334856152534485e-06, 9.153038263320923e-06, 1.197122037410736e-05, 1.4789402484893799e-05, 1.7607584595680237e-05, 2.0425766706466675e-05, 2.3243948817253113e-05, 2.606213092803955e-05, 2.888031303882599e-05, 3.169849514961243e-05, 3.4516677260398865e-05, 3.73348593711853e-05, 4.015304148197174e-05, 4.297122359275818e-05, 4.578940570354462e-05, 4.8607587814331055e-05, 5.142576992511749e-05, 5.424395203590393e-05, 5.706213414669037e-05, 5.988031625747681e-05, 6.269849836826324e-05, 6.551668047904968e-05, 6.833486258983612e-05, 7.115304470062256e-05, 7.3971226811409e-05, 7.678940892219543e-05, 7.960759103298187e-05, 8.242577314376831e-05, 8.524395525455475e-05, 8.806213736534119e-05, 9.088031947612762e-05, 9.369850158691406e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 9.0, 22.0, 23.0, 36.0, 45.0, 59.0, 85.0, 109.0, 182.0, 249.0, 468.0, 687.0, 1167.0, 1996.0, 3723.0, 6929.0, 13571.0, 27314.0, 57751.0, 123364.0, 234646.0, 268297.0, 159230.0, 75871.0, 35658.0, 17408.0, 8777.0, 4629.0, 2499.0, 1443.0, 826.0, 499.0, 343.0, 181.0, 136.0, 93.0, 71.0, 44.0, 29.0, 23.0, 12.0, 14.0, 12.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9375, -1.877288818359375, -1.81707763671875, -1.756866455078125, -1.6966552734375, -1.636444091796875, -1.57623291015625, -1.516021728515625, -1.455810546875, -1.395599365234375, -1.33538818359375, -1.275177001953125, -1.2149658203125, -1.154754638671875, -1.09454345703125, -1.034332275390625, -0.97412109375, -0.913909912109375, -0.85369873046875, -0.793487548828125, -0.7332763671875, -0.673065185546875, -0.61285400390625, -0.552642822265625, -0.492431640625, -0.432220458984375, -0.37200927734375, -0.311798095703125, -0.2515869140625, -0.191375732421875, -0.13116455078125, -0.070953369140625, -0.0107421875, 0.049468994140625, 0.10968017578125, 0.169891357421875, 0.2301025390625, 0.290313720703125, 0.35052490234375, 0.410736083984375, 0.470947265625, 0.531158447265625, 0.59136962890625, 0.651580810546875, 0.7117919921875, 0.772003173828125, 0.83221435546875, 0.892425537109375, 0.95263671875, 1.012847900390625, 1.07305908203125, 1.133270263671875, 1.1934814453125, 1.253692626953125, 1.31390380859375, 1.374114990234375, 1.434326171875, 1.494537353515625, 1.55474853515625, 1.614959716796875, 1.6751708984375, 1.735382080078125, 1.79559326171875, 1.855804443359375, 1.916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 8.0, 13.0, 9.0, 11.0, 19.0, 15.0, 27.0, 20.0, 36.0, 27.0, 49.0, 50.0, 50.0, 58.0, 68.0, 73.0, 49.0, 39.0, 37.0, 46.0, 38.0, 38.0, 36.0, 25.0, 27.0, 9.0, 18.0, 9.0, 11.0, 14.0, 10.0, 6.0, 6.0, 11.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33447265625, -0.32260894775390625, -0.3107452392578125, -0.29888153076171875, -0.287017822265625, -0.27515411376953125, -0.2632904052734375, -0.25142669677734375, -0.23956298828125, -0.22769927978515625, -0.2158355712890625, -0.20397186279296875, -0.192108154296875, -0.18024444580078125, -0.1683807373046875, -0.15651702880859375, -0.1446533203125, -0.13278961181640625, -0.1209259033203125, -0.10906219482421875, -0.097198486328125, -0.08533477783203125, -0.0734710693359375, -0.06160736083984375, -0.04974365234375, -0.03787994384765625, -0.0260162353515625, -0.01415252685546875, -0.002288818359375, 0.00957489013671875, 0.0214385986328125, 0.03330230712890625, 0.045166015625, 0.05702972412109375, 0.0688934326171875, 0.08075714111328125, 0.092620849609375, 0.10448455810546875, 0.1163482666015625, 0.12821197509765625, 0.14007568359375, 0.15193939208984375, 0.1638031005859375, 0.17566680908203125, 0.187530517578125, 0.19939422607421875, 0.2112579345703125, 0.22312164306640625, 0.2349853515625, 0.24684906005859375, 0.2587127685546875, 0.27057647705078125, 0.282440185546875, 0.29430389404296875, 0.3061676025390625, 0.31803131103515625, 0.32989501953125, 0.34175872802734375, 0.3536224365234375, 0.36548614501953125, 0.377349853515625, 0.38921356201171875, 0.4010772705078125, 0.41294097900390625, 0.4248046875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 6.0, 10.0, 10.0, 11.0, 20.0, 22.0, 23.0, 16.0, 18.0, 22.0, 16.0, 31.0, 34.0, 40.0, 43.0, 42.0, 32.0, 37.0, 51.0, 28.0, 46.0, 44.0, 44.0, 45.0, 40.0, 30.0, 23.0, 23.0, 10.0, 25.0, 28.0, 27.0, 18.0, 14.0, 18.0, 10.0, 8.0, 9.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.539588928222656, -26.726106643676758, -25.91262435913086, -25.099140167236328, -24.28565788269043, -23.47217559814453, -22.658693313598633, -21.845211029052734, -21.031726837158203, -20.218244552612305, -19.404762268066406, -18.591278076171875, -17.777795791625977, -16.964313507080078, -16.15083122253418, -15.337347984313965, -14.523865699768066, -13.710383415222168, -12.896900177001953, -12.083417892456055, -11.26993465423584, -10.456452369689941, -9.642969131469727, -8.829486846923828, -8.01600456237793, -7.202521800994873, -6.389039039611816, -5.575556755065918, -4.762073516845703, -3.9485912322998047, -3.135108470916748, -2.3216257095336914, -1.5081424713134766, -0.6946597695350647, 0.11882293224334717, 0.9323055744171143, 1.745788335800171, 2.5592708587646484, 3.372753620147705, 4.186236381530762, 4.999719142913818, 5.813201904296875, 6.626684665679932, 7.440167427062988, 8.253649711608887, 9.067132949829102, 9.880615234375, 10.694097518920898, 11.507580757141113, 12.321063041687012, 13.134546279907227, 13.948028564453125, 14.76151180267334, 15.574994087219238, 16.388477325439453, 17.20195960998535, 18.01544189453125, 18.82892417907715, 19.642406463623047, 20.455890655517578, 21.269372940063477, 22.082855224609375, 22.896337509155273, 23.709819793701172, 24.523303985595703]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 8.0, 4.0, 7.0, 11.0, 14.0, 15.0, 13.0, 16.0, 25.0, 15.0, 24.0, 21.0, 22.0, 31.0, 37.0, 35.0, 41.0, 39.0, 34.0, 33.0, 34.0, 41.0, 45.0, 33.0, 35.0, 48.0, 52.0, 39.0, 24.0, 27.0, 19.0, 18.0, 23.0, 16.0, 17.0, 12.0, 14.0, 15.0, 14.0, 5.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.607845306396484, -26.72903823852539, -25.850229263305664, -24.97142219543457, -24.092613220214844, -23.21380615234375, -22.334997177124023, -21.45619010925293, -20.577381134033203, -19.69857406616211, -18.819765090942383, -17.94095802307129, -17.062149047851562, -16.18334197998047, -15.304533004760742, -14.425725936889648, -13.546917915344238, -12.668109893798828, -11.789301872253418, -10.910493850708008, -10.031685829162598, -9.152877807617188, -8.274070739746094, -7.395262241363525, -6.516454219818115, -5.637646198272705, -4.758838176727295, -3.880030393600464, -3.0012223720550537, -2.1224145889282227, -1.2436065673828125, -0.36479854583740234, 0.5140094757080078, 1.392817497253418, 2.271625518798828, 3.150433301925659, 4.029241561889648, 4.9080491065979, 5.7868571281433105, 6.665665149688721, 7.544473171234131, 8.423280715942383, 9.302088737487793, 10.180896759033203, 11.059704780578613, 11.938512802124023, 12.817320823669434, 13.696128845214844, 14.574936866760254, 15.453744888305664, 16.332551956176758, 17.211360931396484, 18.090167999267578, 18.968976974487305, 19.8477840423584, 20.726593017578125, 21.60540008544922, 22.484207153320312, 23.36301612854004, 24.241823196411133, 25.12063217163086, 25.999439239501953, 26.87824821472168, 27.757055282592773, 28.6358642578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 20.0, 18.0, 40.0, 61.0, 86.0, 122.0, 193.0, 314.0, 526.0, 787.0, 1217.0, 1913.0, 2756.0, 4118.0, 6061.0, 8757.0, 12657.0, 17472.0, 24140.0, 31864.0, 41121.0, 51869.0, 62204.0, 71844.0, 80007.0, 84825.0, 85046.0, 82957.0, 75697.0, 67204.0, 56202.0, 45735.0, 35989.0, 27404.0, 20330.0, 14755.0, 10256.0, 7133.0, 5028.0, 3471.0, 2235.0, 1455.0, 954.0, 638.0, 408.0, 260.0, 163.0, 86.0, 58.0, 35.0, 29.0, 15.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0], "bins": [-13.8984375, -13.4671630859375, -13.035888671875, -12.6046142578125, -12.17333984375, -11.7420654296875, -11.310791015625, -10.8795166015625, -10.4482421875, -10.0169677734375, -9.585693359375, -9.1544189453125, -8.72314453125, -8.2918701171875, -7.860595703125, -7.4293212890625, -6.998046875, -6.5667724609375, -6.135498046875, -5.7042236328125, -5.27294921875, -4.8416748046875, -4.410400390625, -3.9791259765625, -3.5478515625, -3.1165771484375, -2.685302734375, -2.2540283203125, -1.82275390625, -1.3914794921875, -0.960205078125, -0.5289306640625, -0.09765625, 0.3336181640625, 0.764892578125, 1.1961669921875, 1.62744140625, 2.0587158203125, 2.489990234375, 2.9212646484375, 3.3525390625, 3.7838134765625, 4.215087890625, 4.6463623046875, 5.07763671875, 5.5089111328125, 5.940185546875, 6.3714599609375, 6.802734375, 7.2340087890625, 7.665283203125, 8.0965576171875, 8.52783203125, 8.9591064453125, 9.390380859375, 9.8216552734375, 10.2529296875, 10.6842041015625, 11.115478515625, 11.5467529296875, 11.97802734375, 12.4093017578125, 12.840576171875, 13.2718505859375, 13.703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 10.0, 9.0, 14.0, 9.0, 11.0, 20.0, 19.0, 15.0, 24.0, 18.0, 19.0, 21.0, 25.0, 39.0, 23.0, 32.0, 43.0, 40.0, 26.0, 40.0, 30.0, 47.0, 39.0, 41.0, 33.0, 35.0, 47.0, 32.0, 27.0, 27.0, 18.0, 21.0, 24.0, 16.0, 13.0, 18.0, 14.0, 12.0, 10.0, 6.0, 11.0, 5.0, 7.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.84375, -27.9677734375, -27.091796875, -26.2158203125, -25.33984375, -24.4638671875, -23.587890625, -22.7119140625, -21.8359375, -20.9599609375, -20.083984375, -19.2080078125, -18.33203125, -17.4560546875, -16.580078125, -15.7041015625, -14.828125, -13.9521484375, -13.076171875, -12.2001953125, -11.32421875, -10.4482421875, -9.572265625, -8.6962890625, -7.8203125, -6.9443359375, -6.068359375, -5.1923828125, -4.31640625, -3.4404296875, -2.564453125, -1.6884765625, -0.8125, 0.0634765625, 0.939453125, 1.8154296875, 2.69140625, 3.5673828125, 4.443359375, 5.3193359375, 6.1953125, 7.0712890625, 7.947265625, 8.8232421875, 9.69921875, 10.5751953125, 11.451171875, 12.3271484375, 13.203125, 14.0791015625, 14.955078125, 15.8310546875, 16.70703125, 17.5830078125, 18.458984375, 19.3349609375, 20.2109375, 21.0869140625, 21.962890625, 22.8388671875, 23.71484375, 24.5908203125, 25.466796875, 26.3427734375, 27.21875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 8.0, 16.0, 40.0, 46.0, 90.0, 123.0, 193.0, 313.0, 439.0, 735.0, 1220.0, 1840.0, 2923.0, 4373.0, 6548.0, 10053.0, 14514.0, 20990.0, 29454.0, 40023.0, 51606.0, 65049.0, 77755.0, 88018.0, 94312.0, 95784.0, 90278.0, 80684.0, 68736.0, 55069.0, 43041.0, 32276.0, 23153.0, 16188.0, 11074.0, 7467.0, 5066.0, 3279.0, 2075.0, 1343.0, 902.0, 550.0, 349.0, 208.0, 141.0, 86.0, 40.0, 26.0, 17.0, 21.0, 10.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-16.078125, -15.577880859375, -15.07763671875, -14.577392578125, -14.0771484375, -13.576904296875, -13.07666015625, -12.576416015625, -12.076171875, -11.575927734375, -11.07568359375, -10.575439453125, -10.0751953125, -9.574951171875, -9.07470703125, -8.574462890625, -8.07421875, -7.573974609375, -7.07373046875, -6.573486328125, -6.0732421875, -5.572998046875, -5.07275390625, -4.572509765625, -4.072265625, -3.572021484375, -3.07177734375, -2.571533203125, -2.0712890625, -1.571044921875, -1.07080078125, -0.570556640625, -0.0703125, 0.429931640625, 0.93017578125, 1.430419921875, 1.9306640625, 2.430908203125, 2.93115234375, 3.431396484375, 3.931640625, 4.431884765625, 4.93212890625, 5.432373046875, 5.9326171875, 6.432861328125, 6.93310546875, 7.433349609375, 7.93359375, 8.433837890625, 8.93408203125, 9.434326171875, 9.9345703125, 10.434814453125, 10.93505859375, 11.435302734375, 11.935546875, 12.435791015625, 12.93603515625, 13.436279296875, 13.9365234375, 14.436767578125, 14.93701171875, 15.437255859375, 15.9375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 4.0, 5.0, 7.0, 5.0, 17.0, 8.0, 8.0, 15.0, 20.0, 17.0, 29.0, 24.0, 34.0, 30.0, 32.0, 36.0, 30.0, 37.0, 36.0, 45.0, 37.0, 35.0, 42.0, 38.0, 27.0, 46.0, 44.0, 35.0, 42.0, 28.0, 26.0, 24.0, 29.0, 23.0, 10.0, 13.0, 12.0, 11.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.8125, -20.227294921875, -19.64208984375, -19.056884765625, -18.4716796875, -17.886474609375, -17.30126953125, -16.716064453125, -16.130859375, -15.545654296875, -14.96044921875, -14.375244140625, -13.7900390625, -13.204833984375, -12.61962890625, -12.034423828125, -11.44921875, -10.864013671875, -10.27880859375, -9.693603515625, -9.1083984375, -8.523193359375, -7.93798828125, -7.352783203125, -6.767578125, -6.182373046875, -5.59716796875, -5.011962890625, -4.4267578125, -3.841552734375, -3.25634765625, -2.671142578125, -2.0859375, -1.500732421875, -0.91552734375, -0.330322265625, 0.2548828125, 0.840087890625, 1.42529296875, 2.010498046875, 2.595703125, 3.180908203125, 3.76611328125, 4.351318359375, 4.9365234375, 5.521728515625, 6.10693359375, 6.692138671875, 7.27734375, 7.862548828125, 8.44775390625, 9.032958984375, 9.6181640625, 10.203369140625, 10.78857421875, 11.373779296875, 11.958984375, 12.544189453125, 13.12939453125, 13.714599609375, 14.2998046875, 14.885009765625, 15.47021484375, 16.055419921875, 16.640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 9.0, 16.0, 34.0, 50.0, 82.0, 154.0, 226.0, 398.0, 616.0, 1035.0, 1796.0, 3078.0, 5159.0, 8500.0, 13548.0, 21141.0, 31792.0, 46243.0, 62855.0, 80727.0, 96858.0, 107683.0, 110861.0, 106047.0, 93441.0, 76358.0, 58810.0, 42115.0, 28804.0, 19171.0, 12197.0, 7407.0, 4549.0, 2776.0, 1690.0, 910.0, 563.0, 318.0, 203.0, 119.0, 86.0, 50.0, 30.0, 16.0, 15.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-6.16015625, -5.96990966796875, -5.7796630859375, -5.58941650390625, -5.399169921875, -5.20892333984375, -5.0186767578125, -4.82843017578125, -4.63818359375, -4.44793701171875, -4.2576904296875, -4.06744384765625, -3.877197265625, -3.68695068359375, -3.4967041015625, -3.30645751953125, -3.1162109375, -2.92596435546875, -2.7357177734375, -2.54547119140625, -2.355224609375, -2.16497802734375, -1.9747314453125, -1.78448486328125, -1.59423828125, -1.40399169921875, -1.2137451171875, -1.02349853515625, -0.833251953125, -0.64300537109375, -0.4527587890625, -0.26251220703125, -0.072265625, 0.11798095703125, 0.3082275390625, 0.49847412109375, 0.688720703125, 0.87896728515625, 1.0692138671875, 1.25946044921875, 1.44970703125, 1.63995361328125, 1.8302001953125, 2.02044677734375, 2.210693359375, 2.40093994140625, 2.5911865234375, 2.78143310546875, 2.9716796875, 3.16192626953125, 3.3521728515625, 3.54241943359375, 3.732666015625, 3.92291259765625, 4.1131591796875, 4.30340576171875, 4.49365234375, 4.68389892578125, 4.8741455078125, 5.06439208984375, 5.254638671875, 5.44488525390625, 5.6351318359375, 5.82537841796875, 6.015625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 4.0, 7.0, 5.0, 10.0, 18.0, 16.0, 14.0, 23.0, 27.0, 22.0, 27.0, 25.0, 38.0, 43.0, 43.0, 40.0, 48.0, 39.0, 52.0, 29.0, 52.0, 43.0, 48.0, 34.0, 37.0, 35.0, 34.0, 20.0, 25.0, 16.0, 16.0, 21.0, 12.0, 10.0, 15.0, 11.0, 8.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0006465911865234375, -0.0006256401538848877, -0.0006046891212463379, -0.0005837380886077881, -0.0005627870559692383, -0.0005418360233306885, -0.0005208849906921387, -0.0004999339580535889, -0.00047898292541503906, -0.00045803189277648926, -0.00043708086013793945, -0.00041612982749938965, -0.00039517879486083984, -0.00037422776222229004, -0.00035327672958374023, -0.00033232569694519043, -0.0003113746643066406, -0.0002904236316680908, -0.000269472599029541, -0.0002485215663909912, -0.0002275705337524414, -0.0002066195011138916, -0.0001856684684753418, -0.000164717435836792, -0.0001437664031982422, -0.00012281537055969238, -0.00010186433792114258, -8.091330528259277e-05, -5.996227264404297e-05, -3.9011240005493164e-05, -1.806020736694336e-05, 2.8908252716064453e-06, 2.384185791015625e-05, 4.4792890548706055e-05, 6.574392318725586e-05, 8.669495582580566e-05, 0.00010764598846435547, 0.00012859702110290527, 0.00014954805374145508, 0.00017049908638000488, 0.0001914501190185547, 0.0002124011516571045, 0.0002333521842956543, 0.0002543032169342041, 0.0002752542495727539, 0.0002962052822113037, 0.0003171563148498535, 0.0003381073474884033, 0.0003590583801269531, 0.00038000941276550293, 0.00040096044540405273, 0.00042191147804260254, 0.00044286251068115234, 0.00046381354331970215, 0.00048476457595825195, 0.0005057156085968018, 0.0005266666412353516, 0.0005476176738739014, 0.0005685687065124512, 0.000589519739151001, 0.0006104707717895508, 0.0006314218044281006, 0.0006523728370666504, 0.0006733238697052002, 0.00069427490234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 8.0, 22.0, 33.0, 37.0, 63.0, 86.0, 189.0, 293.0, 467.0, 790.0, 1400.0, 2520.0, 4296.0, 7438.0, 12829.0, 21659.0, 35124.0, 54509.0, 78294.0, 102872.0, 123164.0, 132313.0, 125688.0, 107993.0, 82475.0, 58567.0, 38303.0, 23797.0, 14187.0, 8126.0, 4642.0, 2620.0, 1527.0, 886.0, 520.0, 312.0, 196.0, 126.0, 61.0, 51.0, 33.0, 16.0, 9.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.71368408203125, -6.4703369140625, -6.22698974609375, -5.983642578125, -5.74029541015625, -5.4969482421875, -5.25360107421875, -5.01025390625, -4.76690673828125, -4.5235595703125, -4.28021240234375, -4.036865234375, -3.79351806640625, -3.5501708984375, -3.30682373046875, -3.0634765625, -2.82012939453125, -2.5767822265625, -2.33343505859375, -2.090087890625, -1.84674072265625, -1.6033935546875, -1.36004638671875, -1.11669921875, -0.87335205078125, -0.6300048828125, -0.38665771484375, -0.143310546875, 0.10003662109375, 0.3433837890625, 0.58673095703125, 0.830078125, 1.07342529296875, 1.3167724609375, 1.56011962890625, 1.803466796875, 2.04681396484375, 2.2901611328125, 2.53350830078125, 2.77685546875, 3.02020263671875, 3.2635498046875, 3.50689697265625, 3.750244140625, 3.99359130859375, 4.2369384765625, 4.48028564453125, 4.7236328125, 4.96697998046875, 5.2103271484375, 5.45367431640625, 5.697021484375, 5.94036865234375, 6.1837158203125, 6.42706298828125, 6.67041015625, 6.91375732421875, 7.1571044921875, 7.40045166015625, 7.643798828125, 7.88714599609375, 8.1304931640625, 8.37384033203125, 8.6171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 3.0, 5.0, 13.0, 21.0, 13.0, 17.0, 20.0, 34.0, 33.0, 37.0, 49.0, 65.0, 72.0, 64.0, 79.0, 66.0, 61.0, 68.0, 58.0, 48.0, 41.0, 40.0, 25.0, 17.0, 18.0, 12.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.34765625, -5.2008056640625, -5.053955078125, -4.9071044921875, -4.76025390625, -4.6134033203125, -4.466552734375, -4.3197021484375, -4.1728515625, -4.0260009765625, -3.879150390625, -3.7322998046875, -3.58544921875, -3.4385986328125, -3.291748046875, -3.1448974609375, -2.998046875, -2.8511962890625, -2.704345703125, -2.5574951171875, -2.41064453125, -2.2637939453125, -2.116943359375, -1.9700927734375, -1.8232421875, -1.6763916015625, -1.529541015625, -1.3826904296875, -1.23583984375, -1.0889892578125, -0.942138671875, -0.7952880859375, -0.6484375, -0.5015869140625, -0.354736328125, -0.2078857421875, -0.06103515625, 0.0858154296875, 0.232666015625, 0.3795166015625, 0.5263671875, 0.6732177734375, 0.820068359375, 0.9669189453125, 1.11376953125, 1.2606201171875, 1.407470703125, 1.5543212890625, 1.701171875, 1.8480224609375, 1.994873046875, 2.1417236328125, 2.28857421875, 2.4354248046875, 2.582275390625, 2.7291259765625, 2.8759765625, 3.0228271484375, 3.169677734375, 3.3165283203125, 3.46337890625, 3.6102294921875, 3.757080078125, 3.9039306640625, 4.05078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 7.0, 9.0, 12.0, 7.0, 10.0, 15.0, 21.0, 7.0, 27.0, 15.0, 30.0, 31.0, 30.0, 20.0, 27.0, 45.0, 37.0, 42.0, 40.0, 47.0, 34.0, 43.0, 41.0, 29.0, 44.0, 34.0, 34.0, 39.0, 22.0, 23.0, 18.0, 23.0, 11.0, 24.0, 21.0, 19.0, 12.0, 9.0, 14.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.427213668823242, -25.63755989074707, -24.84790802001953, -24.05825424194336, -23.26860237121582, -22.47894859313965, -21.68929672241211, -20.899642944335938, -20.109989166259766, -19.320335388183594, -18.530683517456055, -17.741029739379883, -16.951377868652344, -16.161724090576172, -15.372071266174316, -14.582418441772461, -13.792766571044922, -13.003113746643066, -12.213460922241211, -11.423807144165039, -10.6341552734375, -9.844501495361328, -9.054848670959473, -8.265195846557617, -7.475543022155762, -6.685890197753906, -5.896237373352051, -5.106584072113037, -4.316931247711182, -3.527278423309326, -2.7376251220703125, -1.947972297668457, -1.1583213806152344, -0.36866843700408936, 0.42098450660705566, 1.2106375694274902, 2.0002903938293457, 2.789943218231201, 3.579596519470215, 4.36924934387207, 5.158902168273926, 5.948554992675781, 6.738207817077637, 7.52786111831665, 8.317514419555664, 9.107166290283203, 9.896820068359375, 10.68647289276123, 11.476125717163086, 12.265778541564941, 13.055431365966797, 13.845085144042969, 14.634737014770508, 15.42439079284668, 16.21404266357422, 17.00369644165039, 17.793350219726562, 18.583003997802734, 19.372655868530273, 20.162309646606445, 20.951961517333984, 21.741615295410156, 22.531269073486328, 23.320920944213867, 24.110572814941406]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 15.0, 12.0, 10.0, 17.0, 22.0, 19.0, 17.0, 12.0, 20.0, 30.0, 20.0, 34.0, 30.0, 32.0, 44.0, 35.0, 22.0, 48.0, 29.0, 33.0, 39.0, 39.0, 37.0, 40.0, 25.0, 44.0, 31.0, 22.0, 18.0, 23.0, 17.0, 20.0, 20.0, 14.0, 13.0, 9.0, 14.0, 10.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-27.040788650512695, -26.192590713500977, -25.34439468383789, -24.496196746826172, -23.647998809814453, -22.799802780151367, -21.95160484313965, -21.103408813476562, -20.255210876464844, -19.407012939453125, -18.55881690979004, -17.71061897277832, -16.862422943115234, -16.014225006103516, -15.166027069091797, -14.317830085754395, -13.469633102416992, -12.62143611907959, -11.773239135742188, -10.925041198730469, -10.076844215393066, -9.228647232055664, -8.380449295043945, -7.532252311706543, -6.684055328369141, -5.835858345031738, -4.987660884857178, -4.139463424682617, -3.291266441345215, -2.4430694580078125, -1.594871997833252, -0.7466745376586914, 0.10152053833007812, 0.9497177600860596, 1.797914981842041, 2.6461122035980225, 3.494309425354004, 4.342506408691406, 5.190703868865967, 6.038901329040527, 6.88709831237793, 7.735295295715332, 8.583492279052734, 9.431690216064453, 10.279887199401855, 11.128084182739258, 11.976282119750977, 12.824479103088379, 13.672676086425781, 14.520873069763184, 15.369070053100586, 16.217267990112305, 17.06546401977539, 17.91366195678711, 18.761859893798828, 19.610057830810547, 20.458253860473633, 21.30645179748535, 22.154647827148438, 23.002845764160156, 23.851043701171875, 24.69923973083496, 25.54743766784668, 26.395633697509766, 27.243831634521484]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 11.0, 10.0, 29.0, 35.0, 70.0, 135.0, 219.0, 421.0, 748.0, 1123.0, 1943.0, 3011.0, 5241.0, 8197.0, 13118.0, 20438.0, 31227.0, 46811.0, 68162.0, 96449.0, 134381.0, 177285.0, 226564.0, 276061.0, 322527.0, 355998.0, 372262.0, 369075.0, 344991.0, 308245.0, 260467.0, 209333.0, 161810.0, 119834.0, 86005.0, 59701.0, 40361.0, 26310.0, 17210.0, 10947.0, 6840.0, 4170.0, 2625.0, 1594.0, 969.0, 559.0, 313.0, 191.0, 103.0, 70.0, 45.0, 27.0, 8.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.8544921875, -17.255859375, -16.6572265625, -16.05859375, -15.4599609375, -14.861328125, -14.2626953125, -13.6640625, -13.0654296875, -12.466796875, -11.8681640625, -11.26953125, -10.6708984375, -10.072265625, -9.4736328125, -8.875, -8.2763671875, -7.677734375, -7.0791015625, -6.48046875, -5.8818359375, -5.283203125, -4.6845703125, -4.0859375, -3.4873046875, -2.888671875, -2.2900390625, -1.69140625, -1.0927734375, -0.494140625, 0.1044921875, 0.703125, 1.3017578125, 1.900390625, 2.4990234375, 3.09765625, 3.6962890625, 4.294921875, 4.8935546875, 5.4921875, 6.0908203125, 6.689453125, 7.2880859375, 7.88671875, 8.4853515625, 9.083984375, 9.6826171875, 10.28125, 10.8798828125, 11.478515625, 12.0771484375, 12.67578125, 13.2744140625, 13.873046875, 14.4716796875, 15.0703125, 15.6689453125, 16.267578125, 16.8662109375, 17.46484375, 18.0634765625, 18.662109375, 19.2607421875, 19.859375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 9.0, 1.0, 6.0, 12.0, 11.0, 13.0, 13.0, 12.0, 19.0, 22.0, 20.0, 20.0, 27.0, 25.0, 20.0, 31.0, 33.0, 37.0, 42.0, 29.0, 40.0, 44.0, 35.0, 38.0, 41.0, 36.0, 42.0, 39.0, 27.0, 28.0, 26.0, 29.0, 20.0, 8.0, 18.0, 26.0, 22.0, 14.0, 13.0, 9.0, 7.0, 3.0, 9.0, 5.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-24.046875, -23.3056640625, -22.564453125, -21.8232421875, -21.08203125, -20.3408203125, -19.599609375, -18.8583984375, -18.1171875, -17.3759765625, -16.634765625, -15.8935546875, -15.15234375, -14.4111328125, -13.669921875, -12.9287109375, -12.1875, -11.4462890625, -10.705078125, -9.9638671875, -9.22265625, -8.4814453125, -7.740234375, -6.9990234375, -6.2578125, -5.5166015625, -4.775390625, -4.0341796875, -3.29296875, -2.5517578125, -1.810546875, -1.0693359375, -0.328125, 0.4130859375, 1.154296875, 1.8955078125, 2.63671875, 3.3779296875, 4.119140625, 4.8603515625, 5.6015625, 6.3427734375, 7.083984375, 7.8251953125, 8.56640625, 9.3076171875, 10.048828125, 10.7900390625, 11.53125, 12.2724609375, 13.013671875, 13.7548828125, 14.49609375, 15.2373046875, 15.978515625, 16.7197265625, 17.4609375, 18.2021484375, 18.943359375, 19.6845703125, 20.42578125, 21.1669921875, 21.908203125, 22.6494140625, 23.390625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 12.0, 20.0, 27.0, 65.0, 99.0, 172.0, 316.0, 551.0, 1016.0, 1772.0, 2883.0, 4847.0, 8182.0, 13100.0, 20800.0, 32164.0, 48395.0, 71408.0, 100836.0, 136966.0, 181598.0, 226880.0, 274677.0, 314341.0, 346614.0, 362459.0, 358773.0, 339575.0, 304291.0, 259835.0, 213387.0, 168000.0, 125982.0, 91825.0, 63586.0, 43012.0, 28474.0, 18454.0, 11455.0, 7197.0, 4321.0, 2505.0, 1428.0, 884.0, 491.0, 258.0, 157.0, 97.0, 52.0, 23.0, 19.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.03125, -18.393798828125, -17.75634765625, -17.118896484375, -16.4814453125, -15.843994140625, -15.20654296875, -14.569091796875, -13.931640625, -13.294189453125, -12.65673828125, -12.019287109375, -11.3818359375, -10.744384765625, -10.10693359375, -9.469482421875, -8.83203125, -8.194580078125, -7.55712890625, -6.919677734375, -6.2822265625, -5.644775390625, -5.00732421875, -4.369873046875, -3.732421875, -3.094970703125, -2.45751953125, -1.820068359375, -1.1826171875, -0.545166015625, 0.09228515625, 0.729736328125, 1.3671875, 2.004638671875, 2.64208984375, 3.279541015625, 3.9169921875, 4.554443359375, 5.19189453125, 5.829345703125, 6.466796875, 7.104248046875, 7.74169921875, 8.379150390625, 9.0166015625, 9.654052734375, 10.29150390625, 10.928955078125, 11.56640625, 12.203857421875, 12.84130859375, 13.478759765625, 14.1162109375, 14.753662109375, 15.39111328125, 16.028564453125, 16.666015625, 17.303466796875, 17.94091796875, 18.578369140625, 19.2158203125, 19.853271484375, 20.49072265625, 21.128173828125, 21.765625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 11.0, 16.0, 13.0, 10.0, 25.0, 36.0, 39.0, 46.0, 55.0, 61.0, 85.0, 102.0, 102.0, 139.0, 146.0, 167.0, 160.0, 178.0, 183.0, 177.0, 186.0, 205.0, 195.0, 205.0, 171.0, 184.0, 184.0, 137.0, 128.0, 121.0, 102.0, 101.0, 75.0, 69.0, 71.0, 46.0, 39.0, 18.0, 20.0, 17.0, 5.0, 22.0, 1.0, 7.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.3984375, -12.0150146484375, -11.631591796875, -11.2481689453125, -10.86474609375, -10.4813232421875, -10.097900390625, -9.7144775390625, -9.3310546875, -8.9476318359375, -8.564208984375, -8.1807861328125, -7.79736328125, -7.4139404296875, -7.030517578125, -6.6470947265625, -6.263671875, -5.8802490234375, -5.496826171875, -5.1134033203125, -4.72998046875, -4.3465576171875, -3.963134765625, -3.5797119140625, -3.1962890625, -2.8128662109375, -2.429443359375, -2.0460205078125, -1.66259765625, -1.2791748046875, -0.895751953125, -0.5123291015625, -0.12890625, 0.2545166015625, 0.637939453125, 1.0213623046875, 1.40478515625, 1.7882080078125, 2.171630859375, 2.5550537109375, 2.9384765625, 3.3218994140625, 3.705322265625, 4.0887451171875, 4.47216796875, 4.8555908203125, 5.239013671875, 5.6224365234375, 6.005859375, 6.3892822265625, 6.772705078125, 7.1561279296875, 7.53955078125, 7.9229736328125, 8.306396484375, 8.6898193359375, 9.0732421875, 9.4566650390625, 9.840087890625, 10.2235107421875, 10.60693359375, 10.9903564453125, 11.373779296875, 11.7572021484375, 12.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 11.0, 9.0, 7.0, 8.0, 12.0, 19.0, 13.0, 20.0, 18.0, 20.0, 21.0, 30.0, 33.0, 33.0, 30.0, 42.0, 41.0, 39.0, 34.0, 35.0, 50.0, 34.0, 33.0, 30.0, 49.0, 29.0, 35.0, 32.0, 26.0, 16.0, 27.0, 14.0, 14.0, 16.0, 20.0, 15.0, 16.0, 11.0, 8.0, 12.0, 4.0, 9.0, 4.0, 10.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.096071243286133, -25.275848388671875, -24.45562744140625, -23.635404586791992, -22.815183639526367, -21.99496078491211, -21.174739837646484, -20.354516983032227, -19.5342960357666, -18.714073181152344, -17.89385223388672, -17.07362937927246, -16.253408432006836, -15.433185577392578, -14.612964630126953, -13.792741775512695, -12.972519874572754, -12.152297973632812, -11.332076072692871, -10.51185417175293, -9.691632270812988, -8.871410369873047, -8.051187515258789, -7.230966091156006, -6.4107441902160645, -5.590522289276123, -4.770300388336182, -3.950078248977661, -3.1298563480377197, -2.309634208679199, -1.4894123077392578, -0.6691904067993164, 0.151031494140625, 0.9712534546852112, 1.7914754152297974, 2.6116974353790283, 3.4319193363189697, 4.25214147567749, 5.072363376617432, 5.892585277557373, 6.7128071784973145, 7.533029079437256, 8.353251457214355, 9.173473358154297, 9.993695259094238, 10.81391716003418, 11.634139060974121, 12.454360961914062, 13.274582862854004, 14.094804763793945, 14.915026664733887, 15.735248565673828, 16.555471420288086, 17.37569236755371, 18.19591522216797, 19.016136169433594, 19.83635902404785, 20.65658187866211, 21.476802825927734, 22.297025680541992, 23.117246627807617, 23.937469482421875, 24.7576904296875, 25.577913284301758, 26.398134231567383]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 11.0, 8.0, 6.0, 4.0, 12.0, 17.0, 22.0, 17.0, 26.0, 26.0, 14.0, 36.0, 31.0, 32.0, 37.0, 32.0, 41.0, 38.0, 40.0, 42.0, 36.0, 39.0, 33.0, 40.0, 29.0, 31.0, 37.0, 27.0, 31.0, 34.0, 24.0, 18.0, 19.0, 22.0, 14.0, 14.0, 12.0, 7.0, 9.0, 3.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-28.561195373535156, -27.63642692565918, -26.711658477783203, -25.78689193725586, -24.862123489379883, -23.937355041503906, -23.012588500976562, -22.087820053100586, -21.16305160522461, -20.238283157348633, -19.313514709472656, -18.388748168945312, -17.463979721069336, -16.53921127319336, -15.6144437789917, -14.689676284790039, -13.764907836914062, -12.840139389038086, -11.915371894836426, -10.990604400634766, -10.065835952758789, -9.141067504882812, -8.216300010681152, -7.291532039642334, -6.366764068603516, -5.441996097564697, -4.517228126525879, -3.5924601554870605, -2.667692184448242, -1.7429242134094238, -0.8181562423706055, 0.10661172866821289, 1.0313777923583984, 1.9561457633972168, 2.880913734436035, 3.8056817054748535, 4.730449676513672, 5.65521764755249, 6.579985618591309, 7.504753589630127, 8.429521560668945, 9.354290008544922, 10.279057502746582, 11.203824996948242, 12.128593444824219, 13.053361892700195, 13.978129386901855, 14.902896881103516, 15.827665328979492, 16.75243377685547, 17.677200317382812, 18.60196876525879, 19.526737213134766, 20.451505661010742, 21.37627410888672, 22.301040649414062, 23.22580909729004, 24.150577545166016, 25.07534408569336, 26.000112533569336, 26.924880981445312, 27.84964942932129, 28.774417877197266, 29.69918441772461, 30.623952865600586]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 9.0, 19.0, 22.0, 42.0, 71.0, 83.0, 166.0, 232.0, 413.0, 692.0, 1142.0, 1913.0, 3290.0, 5610.0, 9548.0, 16294.0, 26958.0, 44308.0, 70363.0, 105411.0, 140851.0, 160258.0, 147657.0, 113157.0, 76799.0, 48719.0, 30132.0, 18206.0, 10775.0, 6330.0, 3758.0, 2111.0, 1266.0, 731.0, 470.0, 274.0, 183.0, 115.0, 57.0, 43.0, 18.0, 23.0, 6.0, 9.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7109375, -4.5570068359375, -4.403076171875, -4.2491455078125, -4.09521484375, -3.9412841796875, -3.787353515625, -3.6334228515625, -3.4794921875, -3.3255615234375, -3.171630859375, -3.0177001953125, -2.86376953125, -2.7098388671875, -2.555908203125, -2.4019775390625, -2.248046875, -2.0941162109375, -1.940185546875, -1.7862548828125, -1.63232421875, -1.4783935546875, -1.324462890625, -1.1705322265625, -1.0166015625, -0.8626708984375, -0.708740234375, -0.5548095703125, -0.40087890625, -0.2469482421875, -0.093017578125, 0.0609130859375, 0.21484375, 0.3687744140625, 0.522705078125, 0.6766357421875, 0.83056640625, 0.9844970703125, 1.138427734375, 1.2923583984375, 1.4462890625, 1.6002197265625, 1.754150390625, 1.9080810546875, 2.06201171875, 2.2159423828125, 2.369873046875, 2.5238037109375, 2.677734375, 2.8316650390625, 2.985595703125, 3.1395263671875, 3.29345703125, 3.4473876953125, 3.601318359375, 3.7552490234375, 3.9091796875, 4.0631103515625, 4.217041015625, 4.3709716796875, 4.52490234375, 4.6788330078125, 4.832763671875, 4.9866943359375, 5.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 7.0, 12.0, 9.0, 13.0, 18.0, 13.0, 18.0, 23.0, 20.0, 27.0, 30.0, 35.0, 34.0, 40.0, 47.0, 46.0, 46.0, 38.0, 38.0, 42.0, 44.0, 32.0, 48.0, 33.0, 26.0, 41.0, 30.0, 26.0, 27.0, 18.0, 22.0, 10.0, 22.0, 14.0, 10.0, 8.0, 4.0, 5.0, 10.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.25, -28.1884765625, -27.126953125, -26.0654296875, -25.00390625, -23.9423828125, -22.880859375, -21.8193359375, -20.7578125, -19.6962890625, -18.634765625, -17.5732421875, -16.51171875, -15.4501953125, -14.388671875, -13.3271484375, -12.265625, -11.2041015625, -10.142578125, -9.0810546875, -8.01953125, -6.9580078125, -5.896484375, -4.8349609375, -3.7734375, -2.7119140625, -1.650390625, -0.5888671875, 0.47265625, 1.5341796875, 2.595703125, 3.6572265625, 4.71875, 5.7802734375, 6.841796875, 7.9033203125, 8.96484375, 10.0263671875, 11.087890625, 12.1494140625, 13.2109375, 14.2724609375, 15.333984375, 16.3955078125, 17.45703125, 18.5185546875, 19.580078125, 20.6416015625, 21.703125, 22.7646484375, 23.826171875, 24.8876953125, 25.94921875, 27.0107421875, 28.072265625, 29.1337890625, 30.1953125, 31.2568359375, 32.318359375, 33.3798828125, 34.44140625, 35.5029296875, 36.564453125, 37.6259765625, 38.6875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 0.0, 12.0, 13.0, 13.0, 19.0, 21.0, 47.0, 74.0, 99.0, 148.0, 221.0, 362.0, 544.0, 881.0, 1403.0, 2200.0, 3383.0, 5527.0, 9097.0, 14946.0, 24913.0, 40711.0, 64082.0, 96898.0, 131393.0, 155018.0, 149274.0, 120313.0, 83862.0, 54994.0, 34160.0, 20986.0, 12571.0, 7644.0, 4746.0, 2884.0, 1832.0, 1130.0, 718.0, 506.0, 304.0, 189.0, 145.0, 102.0, 56.0, 41.0, 25.0, 20.0, 14.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.1484375, -4.9915771484375, -4.834716796875, -4.6778564453125, -4.52099609375, -4.3641357421875, -4.207275390625, -4.0504150390625, -3.8935546875, -3.7366943359375, -3.579833984375, -3.4229736328125, -3.26611328125, -3.1092529296875, -2.952392578125, -2.7955322265625, -2.638671875, -2.4818115234375, -2.324951171875, -2.1680908203125, -2.01123046875, -1.8543701171875, -1.697509765625, -1.5406494140625, -1.3837890625, -1.2269287109375, -1.070068359375, -0.9132080078125, -0.75634765625, -0.5994873046875, -0.442626953125, -0.2857666015625, -0.12890625, 0.0279541015625, 0.184814453125, 0.3416748046875, 0.49853515625, 0.6553955078125, 0.812255859375, 0.9691162109375, 1.1259765625, 1.2828369140625, 1.439697265625, 1.5965576171875, 1.75341796875, 1.9102783203125, 2.067138671875, 2.2239990234375, 2.380859375, 2.5377197265625, 2.694580078125, 2.8514404296875, 3.00830078125, 3.1651611328125, 3.322021484375, 3.4788818359375, 3.6357421875, 3.7926025390625, 3.949462890625, 4.1063232421875, 4.26318359375, 4.4200439453125, 4.576904296875, 4.7337646484375, 4.890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 10.0, 2.0, 11.0, 8.0, 19.0, 18.0, 19.0, 24.0, 20.0, 41.0, 38.0, 32.0, 33.0, 37.0, 40.0, 43.0, 42.0, 31.0, 34.0, 50.0, 48.0, 42.0, 38.0, 50.0, 37.0, 41.0, 26.0, 26.0, 21.0, 20.0, 15.0, 13.0, 8.0, 11.0, 12.0, 12.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.875, -24.16748046875, -23.4599609375, -22.75244140625, -22.044921875, -21.33740234375, -20.6298828125, -19.92236328125, -19.21484375, -18.50732421875, -17.7998046875, -17.09228515625, -16.384765625, -15.67724609375, -14.9697265625, -14.26220703125, -13.5546875, -12.84716796875, -12.1396484375, -11.43212890625, -10.724609375, -10.01708984375, -9.3095703125, -8.60205078125, -7.89453125, -7.18701171875, -6.4794921875, -5.77197265625, -5.064453125, -4.35693359375, -3.6494140625, -2.94189453125, -2.234375, -1.52685546875, -0.8193359375, -0.11181640625, 0.595703125, 1.30322265625, 2.0107421875, 2.71826171875, 3.42578125, 4.13330078125, 4.8408203125, 5.54833984375, 6.255859375, 6.96337890625, 7.6708984375, 8.37841796875, 9.0859375, 9.79345703125, 10.5009765625, 11.20849609375, 11.916015625, 12.62353515625, 13.3310546875, 14.03857421875, 14.74609375, 15.45361328125, 16.1611328125, 16.86865234375, 17.576171875, 18.28369140625, 18.9912109375, 19.69873046875, 20.40625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 8.0, 12.0, 19.0, 32.0, 29.0, 51.0, 78.0, 109.0, 138.0, 237.0, 316.0, 519.0, 747.0, 1185.0, 2030.0, 3481.0, 6163.0, 11574.0, 23092.0, 47805.0, 97774.0, 183397.0, 252908.0, 198495.0, 109199.0, 53632.0, 26149.0, 12849.0, 6923.0, 3737.0, 2150.0, 1284.0, 747.0, 544.0, 351.0, 215.0, 159.0, 119.0, 85.0, 52.0, 49.0, 30.0, 19.0, 19.0, 9.0, 9.0, 5.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0244140625, -0.991973876953125, -0.95953369140625, -0.927093505859375, -0.8946533203125, -0.862213134765625, -0.82977294921875, -0.797332763671875, -0.764892578125, -0.732452392578125, -0.70001220703125, -0.667572021484375, -0.6351318359375, -0.602691650390625, -0.57025146484375, -0.537811279296875, -0.50537109375, -0.472930908203125, -0.44049072265625, -0.408050537109375, -0.3756103515625, -0.343170166015625, -0.31072998046875, -0.278289794921875, -0.245849609375, -0.213409423828125, -0.18096923828125, -0.148529052734375, -0.1160888671875, -0.083648681640625, -0.05120849609375, -0.018768310546875, 0.013671875, 0.046112060546875, 0.07855224609375, 0.110992431640625, 0.1434326171875, 0.175872802734375, 0.20831298828125, 0.240753173828125, 0.273193359375, 0.305633544921875, 0.33807373046875, 0.370513916015625, 0.4029541015625, 0.435394287109375, 0.46783447265625, 0.500274658203125, 0.53271484375, 0.565155029296875, 0.59759521484375, 0.630035400390625, 0.6624755859375, 0.694915771484375, 0.72735595703125, 0.759796142578125, 0.792236328125, 0.824676513671875, 0.85711669921875, 0.889556884765625, 0.9219970703125, 0.954437255859375, 0.98687744140625, 1.019317626953125, 1.0517578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 4.0, 10.0, 16.0, 17.0, 21.0, 43.0, 46.0, 44.0, 53.0, 46.0, 57.0, 63.0, 56.0, 80.0, 69.0, 51.0, 50.0, 51.0, 38.0, 37.0, 34.0, 26.0, 12.0, 23.0, 10.0, 12.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010210275650024414, -9.870342910289764e-05, -9.530410170555115e-05, -9.190477430820465e-05, -8.850544691085815e-05, -8.510611951351166e-05, -8.170679211616516e-05, -7.830746471881866e-05, -7.490813732147217e-05, -7.150880992412567e-05, -6.810948252677917e-05, -6.471015512943268e-05, -6.131082773208618e-05, -5.7911500334739685e-05, -5.451217293739319e-05, -5.111284554004669e-05, -4.7713518142700195e-05, -4.43141907453537e-05, -4.09148633480072e-05, -3.7515535950660706e-05, -3.411620855331421e-05, -3.071688115596771e-05, -2.7317553758621216e-05, -2.391822636127472e-05, -2.0518898963928223e-05, -1.7119571566581726e-05, -1.372024416923523e-05, -1.0320916771888733e-05, -6.921589374542236e-06, -3.5222619771957397e-06, -1.2293457984924316e-07, 3.2763928174972534e-06, 6.67572021484375e-06, 1.0075047612190247e-05, 1.3474375009536743e-05, 1.687370240688324e-05, 2.0273029804229736e-05, 2.3672357201576233e-05, 2.707168459892273e-05, 3.0471011996269226e-05, 3.387033939361572e-05, 3.726966679096222e-05, 4.0668994188308716e-05, 4.406832158565521e-05, 4.746764898300171e-05, 5.0866976380348206e-05, 5.42663037776947e-05, 5.76656311750412e-05, 6.10649585723877e-05, 6.446428596973419e-05, 6.786361336708069e-05, 7.126294076442719e-05, 7.466226816177368e-05, 7.806159555912018e-05, 8.146092295646667e-05, 8.486025035381317e-05, 8.825957775115967e-05, 9.165890514850616e-05, 9.505823254585266e-05, 9.845755994319916e-05, 0.00010185688734054565, 0.00010525621473789215, 0.00010865554213523865, 0.00011205486953258514, 0.00011545419692993164]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 10.0, 14.0, 18.0, 19.0, 28.0, 44.0, 67.0, 89.0, 120.0, 165.0, 256.0, 302.0, 498.0, 672.0, 1054.0, 1417.0, 2201.0, 3311.0, 4975.0, 7910.0, 12469.0, 19676.0, 31990.0, 50423.0, 78788.0, 118470.0, 159318.0, 167276.0, 133652.0, 92164.0, 58687.0, 37603.0, 23354.0, 14515.0, 9306.0, 5921.0, 3831.0, 2498.0, 1633.0, 1132.0, 778.0, 588.0, 401.0, 254.0, 191.0, 154.0, 110.0, 51.0, 44.0, 29.0, 28.0, 17.0, 9.0, 6.0, 7.0, 4.0, 3.0, 4.0], "bins": [-1.21484375, -1.17822265625, -1.1416015625, -1.10498046875, -1.068359375, -1.03173828125, -0.9951171875, -0.95849609375, -0.921875, -0.88525390625, -0.8486328125, -0.81201171875, -0.775390625, -0.73876953125, -0.7021484375, -0.66552734375, -0.62890625, -0.59228515625, -0.5556640625, -0.51904296875, -0.482421875, -0.44580078125, -0.4091796875, -0.37255859375, -0.3359375, -0.29931640625, -0.2626953125, -0.22607421875, -0.189453125, -0.15283203125, -0.1162109375, -0.07958984375, -0.04296875, -0.00634765625, 0.0302734375, 0.06689453125, 0.103515625, 0.14013671875, 0.1767578125, 0.21337890625, 0.25, 0.28662109375, 0.3232421875, 0.35986328125, 0.396484375, 0.43310546875, 0.4697265625, 0.50634765625, 0.54296875, 0.57958984375, 0.6162109375, 0.65283203125, 0.689453125, 0.72607421875, 0.7626953125, 0.79931640625, 0.8359375, 0.87255859375, 0.9091796875, 0.94580078125, 0.982421875, 1.01904296875, 1.0556640625, 1.09228515625, 1.12890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 5.0, 21.0, 16.0, 21.0, 26.0, 22.0, 28.0, 40.0, 42.0, 41.0, 52.0, 45.0, 53.0, 53.0, 66.0, 51.0, 42.0, 61.0, 50.0, 43.0, 31.0, 31.0, 21.0, 21.0, 13.0, 13.0, 14.0, 10.0, 5.0, 6.0, 7.0, 3.0, 7.0, 4.0, 3.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.5445823669433594, -0.5286178588867188, -0.5126533508300781, -0.4966888427734375, -0.4807243347167969, -0.46475982666015625, -0.4487953186035156, -0.432830810546875, -0.4168663024902344, -0.40090179443359375, -0.3849372863769531, -0.3689727783203125, -0.3530082702636719, -0.33704376220703125, -0.3210792541503906, -0.30511474609375, -0.2891502380371094, -0.27318572998046875, -0.2572212219238281, -0.2412567138671875, -0.22529220581054688, -0.20932769775390625, -0.19336318969726562, -0.177398681640625, -0.16143417358398438, -0.14546966552734375, -0.12950515747070312, -0.1135406494140625, -0.09757614135742188, -0.08161163330078125, -0.06564712524414062, -0.0496826171875, -0.033718109130859375, -0.01775360107421875, -0.001789093017578125, 0.0141754150390625, 0.030139923095703125, 0.04610443115234375, 0.062068939208984375, 0.078033447265625, 0.09399795532226562, 0.10996246337890625, 0.12592697143554688, 0.1418914794921875, 0.15785598754882812, 0.17382049560546875, 0.18978500366210938, 0.20574951171875, 0.22171401977539062, 0.23767852783203125, 0.2536430358886719, 0.2696075439453125, 0.2855720520019531, 0.30153656005859375, 0.3175010681152344, 0.333465576171875, 0.3494300842285156, 0.36539459228515625, 0.3813591003417969, 0.3973236083984375, 0.4132881164550781, 0.42925262451171875, 0.4452171325683594, 0.461181640625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 10.0, 7.0, 8.0, 19.0, 15.0, 14.0, 18.0, 20.0, 21.0, 24.0, 32.0, 35.0, 34.0, 37.0, 40.0, 31.0, 41.0, 39.0, 42.0, 41.0, 36.0, 36.0, 34.0, 39.0, 38.0, 26.0, 33.0, 24.0, 17.0, 21.0, 14.0, 16.0, 20.0, 14.0, 19.0, 10.0, 11.0, 8.0, 10.0, 6.0, 8.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.874074935913086, -25.047775268554688, -24.221477508544922, -23.395177841186523, -22.568880081176758, -21.74258041381836, -20.916282653808594, -20.089982986450195, -19.26368522644043, -18.43738555908203, -17.611087799072266, -16.784788131713867, -15.958490371704102, -15.132190704345703, -14.305892944335938, -13.479593276977539, -12.653294563293457, -11.826995849609375, -11.000697135925293, -10.174398422241211, -9.348099708557129, -8.521800994873047, -7.695501804351807, -6.869203090667725, -6.042904376983643, -5.2166056632995605, -4.3903069496154785, -3.5640079975128174, -2.7377092838287354, -1.9114103317260742, -1.0851116180419922, -0.25881290435791016, 0.5674858093261719, 1.393784523010254, 2.220083236694336, 3.046382188796997, 3.872680902481079, 4.69897985458374, 5.525278568267822, 6.351577281951904, 7.177875995635986, 8.004175186157227, 8.830473899841309, 9.65677261352539, 10.483071327209473, 11.309370040893555, 12.135668754577637, 12.961967468261719, 13.7882661819458, 14.614564895629883, 15.440863609313965, 16.267162322998047, 17.093461990356445, 17.91975975036621, 18.74605941772461, 19.572357177734375, 20.398656845092773, 21.224956512451172, 22.051254272460938, 22.877553939819336, 23.7038516998291, 24.5301513671875, 25.356449127197266, 26.182748794555664, 27.00904655456543]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 13.0, 6.0, 6.0, 4.0, 11.0, 17.0, 23.0, 17.0, 23.0, 29.0, 15.0, 36.0, 32.0, 32.0, 40.0, 26.0, 43.0, 38.0, 46.0, 36.0, 37.0, 34.0, 37.0, 40.0, 29.0, 33.0, 35.0, 28.0, 32.0, 31.0, 24.0, 21.0, 20.0, 19.0, 14.0, 15.0, 10.0, 8.0, 8.0, 3.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-28.726627349853516, -27.802722930908203, -26.878816604614258, -25.954912185668945, -25.031005859375, -24.107101440429688, -23.183197021484375, -22.25929069519043, -21.335384368896484, -20.411479949951172, -19.487573623657227, -18.563669204711914, -17.63976287841797, -16.715858459472656, -15.791953086853027, -14.868047714233398, -13.944143295288086, -13.020237922668457, -12.096332550048828, -11.172428131103516, -10.24852180480957, -9.324617385864258, -8.400712013244629, -7.476806640625, -6.552901268005371, -5.628995895385742, -4.705090522766113, -3.7811856269836426, -2.8572802543640137, -1.9333748817443848, -1.009469985961914, -0.08556461334228516, 0.8383426666259766, 1.762247920036316, 2.6861531734466553, 3.610058307647705, 4.533963680267334, 5.457869052886963, 6.381773948669434, 7.3056793212890625, 8.229584693908691, 9.15349006652832, 10.07739543914795, 11.001300811767578, 11.92520523071289, 12.849111557006836, 13.773015975952148, 14.696921348571777, 15.620826721191406, 16.54473114013672, 17.468637466430664, 18.392541885375977, 19.316448211669922, 20.240352630615234, 21.164257049560547, 22.088163375854492, 23.012069702148438, 23.93597412109375, 24.859880447387695, 25.783784866333008, 26.707691192626953, 27.631595611572266, 28.555500030517578, 29.479406356811523, 30.403310775756836]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 14.0, 17.0, 34.0, 51.0, 89.0, 136.0, 250.0, 331.0, 574.0, 892.0, 1369.0, 2025.0, 3053.0, 4586.0, 6659.0, 9603.0, 13780.0, 19007.0, 25736.0, 33629.0, 43077.0, 53346.0, 63328.0, 73103.0, 80407.0, 83923.0, 83709.0, 80621.0, 74100.0, 65040.0, 54865.0, 44640.0, 35045.0, 26474.0, 19793.0, 14229.0, 10027.0, 7014.0, 4835.0, 3135.0, 2111.0, 1367.0, 960.0, 564.0, 367.0, 251.0, 156.0, 99.0, 61.0, 35.0, 21.0, 13.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.8125, -13.3677978515625, -12.923095703125, -12.4783935546875, -12.03369140625, -11.5889892578125, -11.144287109375, -10.6995849609375, -10.2548828125, -9.8101806640625, -9.365478515625, -8.9207763671875, -8.47607421875, -8.0313720703125, -7.586669921875, -7.1419677734375, -6.697265625, -6.2525634765625, -5.807861328125, -5.3631591796875, -4.91845703125, -4.4737548828125, -4.029052734375, -3.5843505859375, -3.1396484375, -2.6949462890625, -2.250244140625, -1.8055419921875, -1.36083984375, -0.9161376953125, -0.471435546875, -0.0267333984375, 0.41796875, 0.8626708984375, 1.307373046875, 1.7520751953125, 2.19677734375, 2.6414794921875, 3.086181640625, 3.5308837890625, 3.9755859375, 4.4202880859375, 4.864990234375, 5.3096923828125, 5.75439453125, 6.1990966796875, 6.643798828125, 7.0885009765625, 7.533203125, 7.9779052734375, 8.422607421875, 8.8673095703125, 9.31201171875, 9.7567138671875, 10.201416015625, 10.6461181640625, 11.0908203125, 11.5355224609375, 11.980224609375, 12.4249267578125, 12.86962890625, 13.3143310546875, 13.759033203125, 14.2037353515625, 14.6484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 6.0, 5.0, 12.0, 5.0, 7.0, 12.0, 13.0, 16.0, 19.0, 9.0, 22.0, 25.0, 29.0, 37.0, 35.0, 31.0, 27.0, 35.0, 43.0, 47.0, 34.0, 34.0, 33.0, 34.0, 29.0, 44.0, 40.0, 35.0, 41.0, 18.0, 27.0, 31.0, 31.0, 22.0, 14.0, 15.0, 15.0, 13.0, 13.0, 8.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.71875, -25.783203125, -24.84765625, -23.912109375, -22.9765625, -22.041015625, -21.10546875, -20.169921875, -19.234375, -18.298828125, -17.36328125, -16.427734375, -15.4921875, -14.556640625, -13.62109375, -12.685546875, -11.75, -10.814453125, -9.87890625, -8.943359375, -8.0078125, -7.072265625, -6.13671875, -5.201171875, -4.265625, -3.330078125, -2.39453125, -1.458984375, -0.5234375, 0.412109375, 1.34765625, 2.283203125, 3.21875, 4.154296875, 5.08984375, 6.025390625, 6.9609375, 7.896484375, 8.83203125, 9.767578125, 10.703125, 11.638671875, 12.57421875, 13.509765625, 14.4453125, 15.380859375, 16.31640625, 17.251953125, 18.1875, 19.123046875, 20.05859375, 20.994140625, 21.9296875, 22.865234375, 23.80078125, 24.736328125, 25.671875, 26.607421875, 27.54296875, 28.478515625, 29.4140625, 30.349609375, 31.28515625, 32.220703125, 33.15625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 6.0, 5.0, 20.0, 31.0, 42.0, 82.0, 130.0, 196.0, 331.0, 485.0, 851.0, 1299.0, 2156.0, 3262.0, 5113.0, 7788.0, 11715.0, 17291.0, 24647.0, 34423.0, 45852.0, 59222.0, 71842.0, 85043.0, 93231.0, 97698.0, 94089.0, 87430.0, 75287.0, 61809.0, 48943.0, 36751.0, 26471.0, 18707.0, 12513.0, 8367.0, 5468.0, 3692.0, 2353.0, 1501.0, 910.0, 554.0, 364.0, 237.0, 129.0, 80.0, 69.0, 28.0, 18.0, 12.0, 14.0, 4.0, 4.0, 1.0, 1.0], "bins": [-18.15625, -17.631591796875, -17.10693359375, -16.582275390625, -16.0576171875, -15.532958984375, -15.00830078125, -14.483642578125, -13.958984375, -13.434326171875, -12.90966796875, -12.385009765625, -11.8603515625, -11.335693359375, -10.81103515625, -10.286376953125, -9.76171875, -9.237060546875, -8.71240234375, -8.187744140625, -7.6630859375, -7.138427734375, -6.61376953125, -6.089111328125, -5.564453125, -5.039794921875, -4.51513671875, -3.990478515625, -3.4658203125, -2.941162109375, -2.41650390625, -1.891845703125, -1.3671875, -0.842529296875, -0.31787109375, 0.206787109375, 0.7314453125, 1.256103515625, 1.78076171875, 2.305419921875, 2.830078125, 3.354736328125, 3.87939453125, 4.404052734375, 4.9287109375, 5.453369140625, 5.97802734375, 6.502685546875, 7.02734375, 7.552001953125, 8.07666015625, 8.601318359375, 9.1259765625, 9.650634765625, 10.17529296875, 10.699951171875, 11.224609375, 11.749267578125, 12.27392578125, 12.798583984375, 13.3232421875, 13.847900390625, 14.37255859375, 14.897216796875, 15.421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 6.0, 7.0, 13.0, 11.0, 25.0, 31.0, 22.0, 25.0, 21.0, 30.0, 25.0, 32.0, 32.0, 34.0, 34.0, 38.0, 53.0, 44.0, 37.0, 39.0, 41.0, 33.0, 27.0, 30.0, 33.0, 27.0, 29.0, 24.0, 23.0, 22.0, 25.0, 22.0, 20.0, 8.0, 13.0, 9.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.703125, -18.066650390625, -17.43017578125, -16.793701171875, -16.1572265625, -15.520751953125, -14.88427734375, -14.247802734375, -13.611328125, -12.974853515625, -12.33837890625, -11.701904296875, -11.0654296875, -10.428955078125, -9.79248046875, -9.156005859375, -8.51953125, -7.883056640625, -7.24658203125, -6.610107421875, -5.9736328125, -5.337158203125, -4.70068359375, -4.064208984375, -3.427734375, -2.791259765625, -2.15478515625, -1.518310546875, -0.8818359375, -0.245361328125, 0.39111328125, 1.027587890625, 1.6640625, 2.300537109375, 2.93701171875, 3.573486328125, 4.2099609375, 4.846435546875, 5.48291015625, 6.119384765625, 6.755859375, 7.392333984375, 8.02880859375, 8.665283203125, 9.3017578125, 9.938232421875, 10.57470703125, 11.211181640625, 11.84765625, 12.484130859375, 13.12060546875, 13.757080078125, 14.3935546875, 15.030029296875, 15.66650390625, 16.302978515625, 16.939453125, 17.575927734375, 18.21240234375, 18.848876953125, 19.4853515625, 20.121826171875, 20.75830078125, 21.394775390625, 22.03125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 7.0, 5.0, 13.0, 13.0, 23.0, 30.0, 61.0, 89.0, 155.0, 291.0, 449.0, 775.0, 1344.0, 2216.0, 3765.0, 5955.0, 9781.0, 14989.0, 22818.0, 33121.0, 45601.0, 60484.0, 75419.0, 89967.0, 98891.0, 102447.0, 99983.0, 91041.0, 77892.0, 62582.0, 47429.0, 34379.0, 24126.0, 15945.0, 10175.0, 6403.0, 4015.0, 2428.0, 1422.0, 797.0, 488.0, 296.0, 185.0, 105.0, 69.0, 38.0, 21.0, 7.0, 12.0, 5.0, 9.0, 3.0, 2.0, 1.0, 2.0], "bins": [-6.39453125, -6.20953369140625, -6.0245361328125, -5.83953857421875, -5.654541015625, -5.46954345703125, -5.2845458984375, -5.09954833984375, -4.91455078125, -4.72955322265625, -4.5445556640625, -4.35955810546875, -4.174560546875, -3.98956298828125, -3.8045654296875, -3.61956787109375, -3.4345703125, -3.24957275390625, -3.0645751953125, -2.87957763671875, -2.694580078125, -2.50958251953125, -2.3245849609375, -2.13958740234375, -1.95458984375, -1.76959228515625, -1.5845947265625, -1.39959716796875, -1.214599609375, -1.02960205078125, -0.8446044921875, -0.65960693359375, -0.474609375, -0.28961181640625, -0.1046142578125, 0.08038330078125, 0.265380859375, 0.45037841796875, 0.6353759765625, 0.82037353515625, 1.00537109375, 1.19036865234375, 1.3753662109375, 1.56036376953125, 1.745361328125, 1.93035888671875, 2.1153564453125, 2.30035400390625, 2.4853515625, 2.67034912109375, 2.8553466796875, 3.04034423828125, 3.225341796875, 3.41033935546875, 3.5953369140625, 3.78033447265625, 3.96533203125, 4.15032958984375, 4.3353271484375, 4.52032470703125, 4.705322265625, 4.89031982421875, 5.0753173828125, 5.26031494140625, 5.4453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 11.0, 8.0, 6.0, 8.0, 12.0, 15.0, 22.0, 21.0, 16.0, 19.0, 27.0, 38.0, 29.0, 32.0, 37.0, 43.0, 29.0, 31.0, 38.0, 41.0, 44.0, 44.0, 40.0, 36.0, 45.0, 39.0, 34.0, 31.0, 32.0, 27.0, 24.0, 22.0, 15.0, 23.0, 14.0, 8.0, 4.0, 4.0, 7.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0006084442138671875, -0.0005877465009689331, -0.0005670487880706787, -0.0005463510751724243, -0.0005256533622741699, -0.0005049556493759155, -0.00048425793647766113, -0.00046356022357940674, -0.00044286251068115234, -0.00042216479778289795, -0.00040146708488464355, -0.00038076937198638916, -0.00036007165908813477, -0.00033937394618988037, -0.000318676233291626, -0.0002979785203933716, -0.0002772808074951172, -0.0002565830945968628, -0.0002358853816986084, -0.000215187668800354, -0.0001944899559020996, -0.00017379224300384521, -0.00015309453010559082, -0.00013239681720733643, -0.00011169910430908203, -9.100139141082764e-05, -7.030367851257324e-05, -4.960596561431885e-05, -2.8908252716064453e-05, -8.210539817810059e-06, 1.2487173080444336e-05, 3.318488597869873e-05, 5.3882598876953125e-05, 7.458031177520752e-05, 9.527802467346191e-05, 0.00011597573757171631, 0.0001366734504699707, 0.0001573711633682251, 0.0001780688762664795, 0.0001987665891647339, 0.00021946430206298828, 0.00024016201496124268, 0.00026085972785949707, 0.00028155744075775146, 0.00030225515365600586, 0.00032295286655426025, 0.00034365057945251465, 0.00036434829235076904, 0.00038504600524902344, 0.00040574371814727783, 0.0004264414310455322, 0.0004471391439437866, 0.000467836856842041, 0.0004885345697402954, 0.0005092322826385498, 0.0005299299955368042, 0.0005506277084350586, 0.000571325421333313, 0.0005920231342315674, 0.0006127208471298218, 0.0006334185600280762, 0.0006541162729263306, 0.000674813985824585, 0.0006955116987228394, 0.0007162094116210938]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 10.0, 15.0, 26.0, 30.0, 68.0, 93.0, 149.0, 247.0, 370.0, 571.0, 885.0, 1438.0, 2126.0, 3405.0, 5243.0, 7977.0, 12052.0, 17651.0, 24826.0, 34757.0, 46595.0, 58556.0, 71905.0, 83055.0, 91261.0, 95113.0, 92480.0, 85898.0, 75408.0, 62319.0, 49924.0, 37862.0, 27660.0, 19707.0, 13443.0, 8826.0, 5952.0, 3743.0, 2553.0, 1571.0, 1029.0, 600.0, 416.0, 277.0, 181.0, 112.0, 61.0, 44.0, 29.0, 15.0, 8.0, 10.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-5.85546875, -5.67608642578125, -5.4967041015625, -5.31732177734375, -5.137939453125, -4.95855712890625, -4.7791748046875, -4.59979248046875, -4.42041015625, -4.24102783203125, -4.0616455078125, -3.88226318359375, -3.702880859375, -3.52349853515625, -3.3441162109375, -3.16473388671875, -2.9853515625, -2.80596923828125, -2.6265869140625, -2.44720458984375, -2.267822265625, -2.08843994140625, -1.9090576171875, -1.72967529296875, -1.55029296875, -1.37091064453125, -1.1915283203125, -1.01214599609375, -0.832763671875, -0.65338134765625, -0.4739990234375, -0.29461669921875, -0.115234375, 0.06414794921875, 0.2435302734375, 0.42291259765625, 0.602294921875, 0.78167724609375, 0.9610595703125, 1.14044189453125, 1.31982421875, 1.49920654296875, 1.6785888671875, 1.85797119140625, 2.037353515625, 2.21673583984375, 2.3961181640625, 2.57550048828125, 2.7548828125, 2.93426513671875, 3.1136474609375, 3.29302978515625, 3.472412109375, 3.65179443359375, 3.8311767578125, 4.01055908203125, 4.18994140625, 4.36932373046875, 4.5487060546875, 4.72808837890625, 4.907470703125, 5.08685302734375, 5.2662353515625, 5.44561767578125, 5.625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 18.0, 15.0, 15.0, 18.0, 23.0, 30.0, 24.0, 36.0, 33.0, 36.0, 46.0, 33.0, 38.0, 45.0, 40.0, 44.0, 39.0, 43.0, 45.0, 38.0, 32.0, 40.0, 40.0, 33.0, 24.0, 18.0, 22.0, 17.0, 25.0, 14.0, 7.0, 10.0, 6.0, 8.0, 4.0, 9.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.794921875, -2.708770751953125, -2.62261962890625, -2.536468505859375, -2.4503173828125, -2.364166259765625, -2.27801513671875, -2.191864013671875, -2.105712890625, -2.019561767578125, -1.93341064453125, -1.847259521484375, -1.7611083984375, -1.674957275390625, -1.58880615234375, -1.502655029296875, -1.41650390625, -1.330352783203125, -1.24420166015625, -1.158050537109375, -1.0718994140625, -0.985748291015625, -0.89959716796875, -0.813446044921875, -0.727294921875, -0.641143798828125, -0.55499267578125, -0.468841552734375, -0.3826904296875, -0.296539306640625, -0.21038818359375, -0.124237060546875, -0.0380859375, 0.048065185546875, 0.13421630859375, 0.220367431640625, 0.3065185546875, 0.392669677734375, 0.47882080078125, 0.564971923828125, 0.651123046875, 0.737274169921875, 0.82342529296875, 0.909576416015625, 0.9957275390625, 1.081878662109375, 1.16802978515625, 1.254180908203125, 1.34033203125, 1.426483154296875, 1.51263427734375, 1.598785400390625, 1.6849365234375, 1.771087646484375, 1.85723876953125, 1.943389892578125, 2.029541015625, 2.115692138671875, 2.20184326171875, 2.287994384765625, 2.3741455078125, 2.460296630859375, 2.54644775390625, 2.632598876953125, 2.71875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 14.0, 9.0, 15.0, 19.0, 24.0, 19.0, 20.0, 18.0, 32.0, 34.0, 34.0, 46.0, 46.0, 52.0, 40.0, 38.0, 47.0, 34.0, 42.0, 32.0, 38.0, 50.0, 35.0, 32.0, 17.0, 23.0, 19.0, 22.0, 19.0, 16.0, 20.0, 11.0, 14.0, 9.0, 12.0, 10.0, 3.0, 6.0, 1.0, 1.0, 10.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.839197158813477, -26.94318199157715, -26.047168731689453, -25.151153564453125, -24.255138397216797, -23.3591251373291, -22.463109970092773, -21.567096710205078, -20.67108154296875, -19.775066375732422, -18.879053115844727, -17.9830379486084, -17.087024688720703, -16.191009521484375, -15.294994354248047, -14.398980140686035, -13.502965927124023, -12.606951713562012, -11.7109375, -10.814922332763672, -9.91890811920166, -9.022893905639648, -8.12687873840332, -7.230864524841309, -6.334850311279297, -5.438836097717285, -4.542821407318115, -3.6468069553375244, -2.7507925033569336, -1.8547782897949219, -0.958763599395752, -0.06274890899658203, 0.8332653045654297, 1.7292797565460205, 2.6252942085266113, 3.521308660507202, 4.417323112487793, 5.313337326049805, 6.209352016448975, 7.1053667068481445, 8.001380920410156, 8.897395133972168, 9.79340934753418, 10.689424514770508, 11.58543872833252, 12.481452941894531, 13.37746810913086, 14.273482322692871, 15.169496536254883, 16.06551170349121, 16.961524963378906, 17.857540130615234, 18.753555297851562, 19.649568557739258, 20.545583724975586, 21.44159698486328, 22.33761215209961, 23.233627319335938, 24.129640579223633, 25.02565574645996, 25.921669006347656, 26.817684173583984, 27.713699340820312, 28.60971450805664, 29.505727767944336]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 12.0, 6.0, 13.0, 7.0, 16.0, 14.0, 17.0, 21.0, 18.0, 24.0, 29.0, 31.0, 30.0, 26.0, 37.0, 39.0, 38.0, 36.0, 33.0, 23.0, 45.0, 39.0, 37.0, 31.0, 30.0, 41.0, 33.0, 40.0, 24.0, 35.0, 28.0, 19.0, 17.0, 14.0, 15.0, 15.0, 10.0, 6.0, 6.0, 9.0, 7.0, 2.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-32.157630920410156, -31.153738021850586, -30.149845123291016, -29.145950317382812, -28.142057418823242, -27.138164520263672, -26.1342716217041, -25.13037872314453, -24.126483917236328, -23.122591018676758, -22.118698120117188, -21.114803314208984, -20.110910415649414, -19.107017517089844, -18.103124618530273, -17.099231719970703, -16.095338821411133, -15.091445922851562, -14.087552070617676, -13.083659172058105, -12.079765319824219, -11.075872421264648, -10.071979522705078, -9.068086624145508, -8.064192771911621, -7.060299396514893, -6.056406021118164, -5.052513122558594, -4.048619747161865, -3.0447263717651367, -2.0408334732055664, -1.036940097808838, -0.033046722412109375, 0.9708465337753296, 1.9747397899627686, 2.978632926940918, 3.9825263023376465, 4.986419677734375, 5.990312576293945, 6.994205951690674, 7.998099327087402, 9.001992225646973, 10.00588607788086, 11.00977897644043, 12.013671875, 13.017565727233887, 14.021458625793457, 15.025352478027344, 16.029245376586914, 17.033138275146484, 18.037031173706055, 19.040924072265625, 20.044818878173828, 21.0487117767334, 22.05260467529297, 23.05649757385254, 24.06039047241211, 25.06428337097168, 26.06817626953125, 27.072071075439453, 28.075963973999023, 29.079856872558594, 30.083749771118164, 31.087642669677734, 32.09153747558594]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 8.0, 8.0, 14.0, 47.0, 63.0, 111.0, 181.0, 329.0, 547.0, 920.0, 1536.0, 2393.0, 3974.0, 6179.0, 9805.0, 15433.0, 23073.0, 34938.0, 50284.0, 71667.0, 98933.0, 132272.0, 172187.0, 215002.0, 258732.0, 298868.0, 329597.0, 346264.0, 347508.0, 332179.0, 303680.0, 264815.0, 220957.0, 179074.0, 137422.0, 103347.0, 74315.0, 52486.0, 36188.0, 24613.0, 16111.0, 10451.0, 6690.0, 4194.0, 2635.0, 1686.0, 1027.0, 616.0, 365.0, 232.0, 141.0, 78.0, 42.0, 38.0, 19.0, 10.0, 6.0, 5.0, 2.0, 2.0], "bins": [-20.671875, -20.027587890625, -19.38330078125, -18.739013671875, -18.0947265625, -17.450439453125, -16.80615234375, -16.161865234375, -15.517578125, -14.873291015625, -14.22900390625, -13.584716796875, -12.9404296875, -12.296142578125, -11.65185546875, -11.007568359375, -10.36328125, -9.718994140625, -9.07470703125, -8.430419921875, -7.7861328125, -7.141845703125, -6.49755859375, -5.853271484375, -5.208984375, -4.564697265625, -3.92041015625, -3.276123046875, -2.6318359375, -1.987548828125, -1.34326171875, -0.698974609375, -0.0546875, 0.589599609375, 1.23388671875, 1.878173828125, 2.5224609375, 3.166748046875, 3.81103515625, 4.455322265625, 5.099609375, 5.743896484375, 6.38818359375, 7.032470703125, 7.6767578125, 8.321044921875, 8.96533203125, 9.609619140625, 10.25390625, 10.898193359375, 11.54248046875, 12.186767578125, 12.8310546875, 13.475341796875, 14.11962890625, 14.763916015625, 15.408203125, 16.052490234375, 16.69677734375, 17.341064453125, 17.9853515625, 18.629638671875, 19.27392578125, 19.918212890625, 20.5625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 2.0, 8.0, 5.0, 7.0, 16.0, 11.0, 11.0, 16.0, 22.0, 21.0, 23.0, 27.0, 33.0, 22.0, 34.0, 32.0, 41.0, 36.0, 35.0, 29.0, 22.0, 44.0, 39.0, 22.0, 47.0, 41.0, 30.0, 37.0, 39.0, 28.0, 32.0, 25.0, 15.0, 23.0, 16.0, 12.0, 14.0, 11.0, 7.0, 11.0, 10.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0], "bins": [-27.96875, -27.11083984375, -26.2529296875, -25.39501953125, -24.537109375, -23.67919921875, -22.8212890625, -21.96337890625, -21.10546875, -20.24755859375, -19.3896484375, -18.53173828125, -17.673828125, -16.81591796875, -15.9580078125, -15.10009765625, -14.2421875, -13.38427734375, -12.5263671875, -11.66845703125, -10.810546875, -9.95263671875, -9.0947265625, -8.23681640625, -7.37890625, -6.52099609375, -5.6630859375, -4.80517578125, -3.947265625, -3.08935546875, -2.2314453125, -1.37353515625, -0.515625, 0.34228515625, 1.2001953125, 2.05810546875, 2.916015625, 3.77392578125, 4.6318359375, 5.48974609375, 6.34765625, 7.20556640625, 8.0634765625, 8.92138671875, 9.779296875, 10.63720703125, 11.4951171875, 12.35302734375, 13.2109375, 14.06884765625, 14.9267578125, 15.78466796875, 16.642578125, 17.50048828125, 18.3583984375, 19.21630859375, 20.07421875, 20.93212890625, 21.7900390625, 22.64794921875, 23.505859375, 24.36376953125, 25.2216796875, 26.07958984375, 26.9375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 12.0, 32.0, 43.0, 75.0, 147.0, 248.0, 491.0, 927.0, 1662.0, 3022.0, 5181.0, 9158.0, 15639.0, 26344.0, 41817.0, 65980.0, 98571.0, 141613.0, 195492.0, 255479.0, 314962.0, 364596.0, 399752.0, 408325.0, 392928.0, 354043.0, 301228.0, 240798.0, 181857.0, 131700.0, 89898.0, 59527.0, 37406.0, 23146.0, 13864.0, 8171.0, 4621.0, 2472.0, 1391.0, 753.0, 449.0, 221.0, 104.0, 74.0, 32.0, 14.0, 14.0, 2.0, 4.0, 4.0], "bins": [-31.3125, -30.474853515625, -29.63720703125, -28.799560546875, -27.9619140625, -27.124267578125, -26.28662109375, -25.448974609375, -24.611328125, -23.773681640625, -22.93603515625, -22.098388671875, -21.2607421875, -20.423095703125, -19.58544921875, -18.747802734375, -17.91015625, -17.072509765625, -16.23486328125, -15.397216796875, -14.5595703125, -13.721923828125, -12.88427734375, -12.046630859375, -11.208984375, -10.371337890625, -9.53369140625, -8.696044921875, -7.8583984375, -7.020751953125, -6.18310546875, -5.345458984375, -4.5078125, -3.670166015625, -2.83251953125, -1.994873046875, -1.1572265625, -0.319580078125, 0.51806640625, 1.355712890625, 2.193359375, 3.031005859375, 3.86865234375, 4.706298828125, 5.5439453125, 6.381591796875, 7.21923828125, 8.056884765625, 8.89453125, 9.732177734375, 10.56982421875, 11.407470703125, 12.2451171875, 13.082763671875, 13.92041015625, 14.758056640625, 15.595703125, 16.433349609375, 17.27099609375, 18.108642578125, 18.9462890625, 19.783935546875, 20.62158203125, 21.459228515625, 22.296875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 9.0, 10.0, 13.0, 18.0, 20.0, 28.0, 25.0, 29.0, 41.0, 41.0, 49.0, 56.0, 64.0, 83.0, 88.0, 97.0, 110.0, 136.0, 142.0, 153.0, 158.0, 164.0, 175.0, 183.0, 176.0, 162.0, 160.0, 170.0, 148.0, 138.0, 151.0, 143.0, 132.0, 111.0, 88.0, 89.0, 72.0, 69.0, 67.0, 58.0, 41.0, 44.0, 36.0, 20.0, 18.0, 20.0, 15.0, 15.0, 12.0, 5.0, 6.0, 5.0, 4.0, 6.0, 0.0, 4.0, 0.0, 1.0], "bins": [-11.7578125, -11.374267578125, -10.99072265625, -10.607177734375, -10.2236328125, -9.840087890625, -9.45654296875, -9.072998046875, -8.689453125, -8.305908203125, -7.92236328125, -7.538818359375, -7.1552734375, -6.771728515625, -6.38818359375, -6.004638671875, -5.62109375, -5.237548828125, -4.85400390625, -4.470458984375, -4.0869140625, -3.703369140625, -3.31982421875, -2.936279296875, -2.552734375, -2.169189453125, -1.78564453125, -1.402099609375, -1.0185546875, -0.635009765625, -0.25146484375, 0.132080078125, 0.515625, 0.899169921875, 1.28271484375, 1.666259765625, 2.0498046875, 2.433349609375, 2.81689453125, 3.200439453125, 3.583984375, 3.967529296875, 4.35107421875, 4.734619140625, 5.1181640625, 5.501708984375, 5.88525390625, 6.268798828125, 6.65234375, 7.035888671875, 7.41943359375, 7.802978515625, 8.1865234375, 8.570068359375, 8.95361328125, 9.337158203125, 9.720703125, 10.104248046875, 10.48779296875, 10.871337890625, 11.2548828125, 11.638427734375, 12.02197265625, 12.405517578125, 12.7890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 5.0, 8.0, 8.0, 17.0, 15.0, 10.0, 17.0, 30.0, 30.0, 15.0, 37.0, 24.0, 32.0, 29.0, 33.0, 39.0, 43.0, 41.0, 38.0, 37.0, 54.0, 44.0, 31.0, 33.0, 33.0, 34.0, 35.0, 34.0, 26.0, 24.0, 17.0, 16.0, 10.0, 19.0, 17.0, 7.0, 8.0, 5.0, 11.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.37582015991211, -29.334218978881836, -28.292619705200195, -27.251018524169922, -26.20941925048828, -25.167818069458008, -24.126216888427734, -23.084617614746094, -22.04301643371582, -21.001415252685547, -19.959815979003906, -18.918214797973633, -17.87661361694336, -16.83501434326172, -15.793413162231445, -14.751812934875488, -13.710212707519531, -12.668612480163574, -11.627012252807617, -10.585411071777344, -9.543810844421387, -8.50221061706543, -7.4606099128723145, -6.419009208679199, -5.377408981323242, -4.335808753967285, -3.29420804977417, -2.252607583999634, -1.2110071182250977, -0.16940689086914062, 0.8721938133239746, 1.9137945175170898, 2.9553985595703125, 3.9969990253448486, 5.038599491119385, 6.0802001953125, 7.121800422668457, 8.163400650024414, 9.205001831054688, 10.246602058410645, 11.288202285766602, 12.329802513122559, 13.371402740478516, 14.413003921508789, 15.454604148864746, 16.496204376220703, 17.537805557250977, 18.57940673828125, 19.62100601196289, 20.662607192993164, 21.704206466674805, 22.745807647705078, 23.78740692138672, 24.829008102416992, 25.870609283447266, 26.912208557128906, 27.95380973815918, 28.995410919189453, 30.037010192871094, 31.078611373901367, 32.12021255493164, 33.16181182861328, 34.20341110229492, 35.24501419067383, 36.28661346435547]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 7.0, 13.0, 10.0, 26.0, 15.0, 17.0, 23.0, 24.0, 34.0, 41.0, 37.0, 28.0, 41.0, 41.0, 39.0, 44.0, 43.0, 47.0, 47.0, 49.0, 34.0, 41.0, 47.0, 29.0, 22.0, 27.0, 27.0, 27.0, 23.0, 18.0, 15.0, 8.0, 13.0, 6.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.401611328125, -34.16838836669922, -32.93516159057617, -31.70193862915039, -30.46871566772461, -29.235490798950195, -28.00226593017578, -26.76904296875, -25.535818099975586, -24.302593231201172, -23.06937026977539, -21.836145401000977, -20.602920532226562, -19.36969757080078, -18.136472702026367, -16.903247833251953, -15.670024871826172, -14.436800956726074, -13.203577041625977, -11.970352172851562, -10.737128257751465, -9.503904342651367, -8.270679473876953, -7.0374555587768555, -5.804231643676758, -4.57100772857666, -3.3377833366394043, -2.1045591831207275, -0.8713350296020508, 0.3618888854980469, 1.5951132774353027, 2.8283376693725586, 4.061561584472656, 5.294785499572754, 6.52800989151001, 7.761234283447266, 8.994458198547363, 10.227682113647461, 11.460906982421875, 12.694130897521973, 13.92735481262207, 15.160578727722168, 16.393802642822266, 17.62702751159668, 18.860252380371094, 20.093475341796875, 21.32670021057129, 22.559925079345703, 23.793148040771484, 25.0263729095459, 26.25959587097168, 27.492820739746094, 28.726043701171875, 29.95926856994629, 31.192493438720703, 32.425716400146484, 33.65894317626953, 34.89216613769531, 36.12539291381836, 37.35861587524414, 38.59183883666992, 39.82506561279297, 41.05828857421875, 42.29151153564453, 43.52473449707031]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 12.0, 20.0, 31.0, 41.0, 69.0, 127.0, 142.0, 218.0, 338.0, 505.0, 843.0, 1326.0, 2101.0, 3236.0, 5248.0, 8367.0, 13515.0, 21893.0, 35227.0, 54864.0, 82203.0, 113623.0, 140268.0, 148513.0, 129380.0, 99063.0, 67912.0, 44540.0, 28186.0, 17693.0, 10953.0, 6703.0, 4235.0, 2555.0, 1646.0, 1041.0, 652.0, 470.0, 281.0, 167.0, 122.0, 73.0, 50.0, 29.0, 20.0, 15.0, 10.0, 4.0, 2.0, 7.0, 4.0, 1.0, 2.0], "bins": [-5.5859375, -5.42291259765625, -5.2598876953125, -5.09686279296875, -4.933837890625, -4.77081298828125, -4.6077880859375, -4.44476318359375, -4.28173828125, -4.11871337890625, -3.9556884765625, -3.79266357421875, -3.629638671875, -3.46661376953125, -3.3035888671875, -3.14056396484375, -2.9775390625, -2.81451416015625, -2.6514892578125, -2.48846435546875, -2.325439453125, -2.16241455078125, -1.9993896484375, -1.83636474609375, -1.67333984375, -1.51031494140625, -1.3472900390625, -1.18426513671875, -1.021240234375, -0.85821533203125, -0.6951904296875, -0.53216552734375, -0.369140625, -0.20611572265625, -0.0430908203125, 0.11993408203125, 0.282958984375, 0.44598388671875, 0.6090087890625, 0.77203369140625, 0.93505859375, 1.09808349609375, 1.2611083984375, 1.42413330078125, 1.587158203125, 1.75018310546875, 1.9132080078125, 2.07623291015625, 2.2392578125, 2.40228271484375, 2.5653076171875, 2.72833251953125, 2.891357421875, 3.05438232421875, 3.2174072265625, 3.38043212890625, 3.54345703125, 3.70648193359375, 3.8695068359375, 4.03253173828125, 4.195556640625, 4.35858154296875, 4.5216064453125, 4.68463134765625, 4.84765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 1.0, 5.0, 7.0, 12.0, 7.0, 7.0, 14.0, 19.0, 30.0, 14.0, 26.0, 27.0, 28.0, 34.0, 31.0, 40.0, 37.0, 36.0, 39.0, 45.0, 61.0, 56.0, 33.0, 37.0, 52.0, 38.0, 35.0, 33.0, 28.0, 23.0, 25.0, 29.0, 13.0, 12.0, 10.0, 11.0, 11.0, 12.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.53125, -32.2587890625, -30.986328125, -29.7138671875, -28.44140625, -27.1689453125, -25.896484375, -24.6240234375, -23.3515625, -22.0791015625, -20.806640625, -19.5341796875, -18.26171875, -16.9892578125, -15.716796875, -14.4443359375, -13.171875, -11.8994140625, -10.626953125, -9.3544921875, -8.08203125, -6.8095703125, -5.537109375, -4.2646484375, -2.9921875, -1.7197265625, -0.447265625, 0.8251953125, 2.09765625, 3.3701171875, 4.642578125, 5.9150390625, 7.1875, 8.4599609375, 9.732421875, 11.0048828125, 12.27734375, 13.5498046875, 14.822265625, 16.0947265625, 17.3671875, 18.6396484375, 19.912109375, 21.1845703125, 22.45703125, 23.7294921875, 25.001953125, 26.2744140625, 27.546875, 28.8193359375, 30.091796875, 31.3642578125, 32.63671875, 33.9091796875, 35.181640625, 36.4541015625, 37.7265625, 38.9990234375, 40.271484375, 41.5439453125, 42.81640625, 44.0888671875, 45.361328125, 46.6337890625, 47.90625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 7.0, 15.0, 18.0, 28.0, 42.0, 79.0, 84.0, 184.0, 292.0, 456.0, 815.0, 1394.0, 2274.0, 3952.0, 7367.0, 13227.0, 23916.0, 42727.0, 73601.0, 120781.0, 171806.0, 189673.0, 154606.0, 101995.0, 60739.0, 34740.0, 19197.0, 10675.0, 5808.0, 3329.0, 1911.0, 1115.0, 659.0, 393.0, 244.0, 156.0, 90.0, 59.0, 40.0, 24.0, 20.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.72265625, -7.49761962890625, -7.2725830078125, -7.04754638671875, -6.822509765625, -6.59747314453125, -6.3724365234375, -6.14739990234375, -5.92236328125, -5.69732666015625, -5.4722900390625, -5.24725341796875, -5.022216796875, -4.79718017578125, -4.5721435546875, -4.34710693359375, -4.1220703125, -3.89703369140625, -3.6719970703125, -3.44696044921875, -3.221923828125, -2.99688720703125, -2.7718505859375, -2.54681396484375, -2.32177734375, -2.09674072265625, -1.8717041015625, -1.64666748046875, -1.421630859375, -1.19659423828125, -0.9715576171875, -0.74652099609375, -0.521484375, -0.29644775390625, -0.0714111328125, 0.15362548828125, 0.378662109375, 0.60369873046875, 0.8287353515625, 1.05377197265625, 1.27880859375, 1.50384521484375, 1.7288818359375, 1.95391845703125, 2.178955078125, 2.40399169921875, 2.6290283203125, 2.85406494140625, 3.0791015625, 3.30413818359375, 3.5291748046875, 3.75421142578125, 3.979248046875, 4.20428466796875, 4.4293212890625, 4.65435791015625, 4.87939453125, 5.10443115234375, 5.3294677734375, 5.55450439453125, 5.779541015625, 6.00457763671875, 6.2296142578125, 6.45465087890625, 6.6796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 4.0, 9.0, 13.0, 15.0, 19.0, 22.0, 24.0, 20.0, 27.0, 15.0, 24.0, 35.0, 29.0, 29.0, 31.0, 39.0, 33.0, 52.0, 46.0, 39.0, 44.0, 41.0, 22.0, 34.0, 43.0, 22.0, 37.0, 26.0, 26.0, 23.0, 21.0, 18.0, 17.0, 16.0, 8.0, 10.0, 10.0, 7.0, 10.0, 4.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.637939453125, -17.93212890625, -17.226318359375, -16.5205078125, -15.814697265625, -15.10888671875, -14.403076171875, -13.697265625, -12.991455078125, -12.28564453125, -11.579833984375, -10.8740234375, -10.168212890625, -9.46240234375, -8.756591796875, -8.05078125, -7.344970703125, -6.63916015625, -5.933349609375, -5.2275390625, -4.521728515625, -3.81591796875, -3.110107421875, -2.404296875, -1.698486328125, -0.99267578125, -0.286865234375, 0.4189453125, 1.124755859375, 1.83056640625, 2.536376953125, 3.2421875, 3.947998046875, 4.65380859375, 5.359619140625, 6.0654296875, 6.771240234375, 7.47705078125, 8.182861328125, 8.888671875, 9.594482421875, 10.30029296875, 11.006103515625, 11.7119140625, 12.417724609375, 13.12353515625, 13.829345703125, 14.53515625, 15.240966796875, 15.94677734375, 16.652587890625, 17.3583984375, 18.064208984375, 18.77001953125, 19.475830078125, 20.181640625, 20.887451171875, 21.59326171875, 22.299072265625, 23.0048828125, 23.710693359375, 24.41650390625, 25.122314453125, 25.828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 20.0, 20.0, 23.0, 29.0, 61.0, 68.0, 112.0, 175.0, 263.0, 401.0, 686.0, 1177.0, 2120.0, 4001.0, 8348.0, 18638.0, 43074.0, 101222.0, 211693.0, 290066.0, 199938.0, 93504.0, 39512.0, 16967.0, 7738.0, 3797.0, 1936.0, 1121.0, 624.0, 421.0, 287.0, 156.0, 91.0, 78.0, 55.0, 31.0, 27.0, 22.0, 15.0, 7.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0166778564453125, -0.979644775390625, -0.9426116943359375, -0.90557861328125, -0.8685455322265625, -0.831512451171875, -0.7944793701171875, -0.7574462890625, -0.7204132080078125, -0.683380126953125, -0.6463470458984375, -0.60931396484375, -0.5722808837890625, -0.535247802734375, -0.4982147216796875, -0.461181640625, -0.4241485595703125, -0.387115478515625, -0.3500823974609375, -0.31304931640625, -0.2760162353515625, -0.238983154296875, -0.2019500732421875, -0.1649169921875, -0.1278839111328125, -0.090850830078125, -0.0538177490234375, -0.01678466796875, 0.0202484130859375, 0.057281494140625, 0.0943145751953125, 0.13134765625, 0.1683807373046875, 0.205413818359375, 0.2424468994140625, 0.27947998046875, 0.3165130615234375, 0.353546142578125, 0.3905792236328125, 0.4276123046875, 0.4646453857421875, 0.501678466796875, 0.5387115478515625, 0.57574462890625, 0.6127777099609375, 0.649810791015625, 0.6868438720703125, 0.723876953125, 0.7609100341796875, 0.797943115234375, 0.8349761962890625, 0.87200927734375, 0.9090423583984375, 0.946075439453125, 0.9831085205078125, 1.0201416015625, 1.0571746826171875, 1.094207763671875, 1.1312408447265625, 1.16827392578125, 1.2053070068359375, 1.242340087890625, 1.2793731689453125, 1.31640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 6.0, 3.0, 11.0, 14.0, 29.0, 25.0, 26.0, 46.0, 38.0, 48.0, 46.0, 58.0, 59.0, 64.0, 60.0, 62.0, 56.0, 49.0, 46.0, 51.0, 31.0, 37.0, 29.0, 24.0, 20.0, 16.0, 10.0, 16.0, 4.0, 4.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001023411750793457, -9.90256667137146e-05, -9.57101583480835e-05, -9.239464998245239e-05, -8.907914161682129e-05, -8.576363325119019e-05, -8.244812488555908e-05, -7.913261651992798e-05, -7.581710815429688e-05, -7.250159978866577e-05, -6.918609142303467e-05, -6.587058305740356e-05, -6.255507469177246e-05, -5.923956632614136e-05, -5.5924057960510254e-05, -5.260854959487915e-05, -4.929304122924805e-05, -4.597753286361694e-05, -4.266202449798584e-05, -3.9346516132354736e-05, -3.603100776672363e-05, -3.271549940109253e-05, -2.9399991035461426e-05, -2.6084482669830322e-05, -2.276897430419922e-05, -1.9453465938568115e-05, -1.6137957572937012e-05, -1.2822449207305908e-05, -9.506940841674805e-06, -6.191432476043701e-06, -2.8759241104125977e-06, 4.3958425521850586e-07, 3.7550926208496094e-06, 7.070600986480713e-06, 1.0386109352111816e-05, 1.370161771774292e-05, 1.7017126083374023e-05, 2.0332634449005127e-05, 2.364814281463623e-05, 2.6963651180267334e-05, 3.0279159545898438e-05, 3.359466791152954e-05, 3.6910176277160645e-05, 4.022568464279175e-05, 4.354119300842285e-05, 4.6856701374053955e-05, 5.017220973968506e-05, 5.348771810531616e-05, 5.6803226470947266e-05, 6.011873483657837e-05, 6.343424320220947e-05, 6.674975156784058e-05, 7.006525993347168e-05, 7.338076829910278e-05, 7.669627666473389e-05, 8.001178503036499e-05, 8.33272933959961e-05, 8.66428017616272e-05, 8.99583101272583e-05, 9.32738184928894e-05, 9.658932685852051e-05, 9.990483522415161e-05, 0.00010322034358978271, 0.00010653585195541382, 0.00010985136032104492]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 13.0, 18.0, 31.0, 38.0, 63.0, 84.0, 119.0, 160.0, 227.0, 314.0, 415.0, 688.0, 874.0, 1301.0, 1953.0, 3005.0, 4692.0, 7300.0, 11657.0, 19819.0, 33247.0, 56441.0, 94377.0, 148807.0, 193370.0, 173366.0, 117360.0, 71045.0, 42295.0, 24872.0, 14945.0, 8991.0, 5556.0, 3604.0, 2265.0, 1613.0, 1063.0, 766.0, 547.0, 364.0, 279.0, 203.0, 122.0, 101.0, 63.0, 42.0, 26.0, 18.0, 10.0, 11.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.3046875, -1.2622222900390625, -1.219757080078125, -1.1772918701171875, -1.13482666015625, -1.0923614501953125, -1.049896240234375, -1.0074310302734375, -0.9649658203125, -0.9225006103515625, -0.880035400390625, -0.8375701904296875, -0.79510498046875, -0.7526397705078125, -0.710174560546875, -0.6677093505859375, -0.625244140625, -0.5827789306640625, -0.540313720703125, -0.4978485107421875, -0.45538330078125, -0.4129180908203125, -0.370452880859375, -0.3279876708984375, -0.2855224609375, -0.2430572509765625, -0.200592041015625, -0.1581268310546875, -0.11566162109375, -0.0731964111328125, -0.030731201171875, 0.0117340087890625, 0.05419921875, 0.0966644287109375, 0.139129638671875, 0.1815948486328125, 0.22406005859375, 0.2665252685546875, 0.308990478515625, 0.3514556884765625, 0.3939208984375, 0.4363861083984375, 0.478851318359375, 0.5213165283203125, 0.56378173828125, 0.6062469482421875, 0.648712158203125, 0.6911773681640625, 0.733642578125, 0.7761077880859375, 0.818572998046875, 0.8610382080078125, 0.90350341796875, 0.9459686279296875, 0.988433837890625, 1.0308990478515625, 1.0733642578125, 1.1158294677734375, 1.158294677734375, 1.2007598876953125, 1.24322509765625, 1.2856903076171875, 1.328155517578125, 1.3706207275390625, 1.4130859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 6.0, 5.0, 7.0, 4.0, 5.0, 9.0, 8.0, 9.0, 6.0, 17.0, 20.0, 22.0, 15.0, 25.0, 43.0, 37.0, 36.0, 41.0, 52.0, 45.0, 54.0, 57.0, 70.0, 45.0, 46.0, 44.0, 37.0, 35.0, 38.0, 26.0, 19.0, 20.0, 17.0, 18.0, 11.0, 9.0, 12.0, 9.0, 6.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.4677734375, -0.4536399841308594, -0.43950653076171875, -0.4253730773925781, -0.4112396240234375, -0.3971061706542969, -0.38297271728515625, -0.3688392639160156, -0.354705810546875, -0.3405723571777344, -0.32643890380859375, -0.3123054504394531, -0.2981719970703125, -0.2840385437011719, -0.26990509033203125, -0.2557716369628906, -0.24163818359375, -0.22750473022460938, -0.21337127685546875, -0.19923782348632812, -0.1851043701171875, -0.17097091674804688, -0.15683746337890625, -0.14270401000976562, -0.128570556640625, -0.11443710327148438, -0.10030364990234375, -0.08617019653320312, -0.0720367431640625, -0.057903289794921875, -0.04376983642578125, -0.029636383056640625, -0.0155029296875, -0.001369476318359375, 0.01276397705078125, 0.026897430419921875, 0.0410308837890625, 0.055164337158203125, 0.06929779052734375, 0.08343124389648438, 0.097564697265625, 0.11169815063476562, 0.12583160400390625, 0.13996505737304688, 0.1540985107421875, 0.16823196411132812, 0.18236541748046875, 0.19649887084960938, 0.21063232421875, 0.22476577758789062, 0.23889923095703125, 0.2530326843261719, 0.2671661376953125, 0.2812995910644531, 0.29543304443359375, 0.3095664978027344, 0.323699951171875, 0.3378334045410156, 0.35196685791015625, 0.3661003112792969, 0.3802337646484375, 0.3943672180175781, 0.40850067138671875, 0.4226341247558594, 0.436767578125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 6.0, 10.0, 16.0, 12.0, 10.0, 19.0, 33.0, 27.0, 21.0, 33.0, 22.0, 34.0, 23.0, 40.0, 42.0, 45.0, 38.0, 31.0, 49.0, 40.0, 42.0, 33.0, 37.0, 33.0, 30.0, 37.0, 30.0, 26.0, 26.0, 18.0, 15.0, 13.0, 16.0, 16.0, 6.0, 12.0, 5.0, 11.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.883255004882812, -28.85761070251465, -27.831966400146484, -26.80632209777832, -25.780677795410156, -24.755033493041992, -23.729389190673828, -22.703746795654297, -21.6781005859375, -20.652456283569336, -19.626811981201172, -18.601167678833008, -17.575523376464844, -16.54987907409668, -15.524235725402832, -14.498591423034668, -13.47294807434082, -12.447303771972656, -11.421659469604492, -10.396015167236328, -9.370370864868164, -8.3447265625, -7.319083213806152, -6.293438911437988, -5.267794609069824, -4.24215030670166, -3.216506242752075, -2.1908621788024902, -1.1652178764343262, -0.1395735740661621, 0.8860702514648438, 1.9117145538330078, 2.937358856201172, 3.963003158569336, 4.9886474609375, 6.014291286468506, 7.03993558883667, 8.065580368041992, 9.09122371673584, 10.116868019104004, 11.142512321472168, 12.168156623840332, 13.193800926208496, 14.219444274902344, 15.245088577270508, 16.270732879638672, 17.296377182006836, 18.322021484375, 19.347665786743164, 20.373310089111328, 21.398954391479492, 22.424598693847656, 23.45024299621582, 24.475887298583984, 25.501529693603516, 26.527175903320312, 27.552818298339844, 28.578462600708008, 29.604106903076172, 30.629751205444336, 31.6553955078125, 32.68103790283203, 33.70668411254883, 34.73232650756836, 35.757972717285156]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 9.0, 11.0, 9.0, 26.0, 17.0, 16.0, 24.0, 27.0, 35.0, 36.0, 41.0, 24.0, 47.0, 38.0, 43.0, 45.0, 36.0, 47.0, 50.0, 50.0, 33.0, 44.0, 46.0, 26.0, 23.0, 26.0, 28.0, 25.0, 24.0, 19.0, 13.0, 8.0, 11.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.287620544433594, -34.051116943359375, -32.814613342285156, -31.578107833862305, -30.341602325439453, -29.105098724365234, -27.868595123291016, -26.632091522216797, -25.395586013793945, -24.159082412719727, -22.922576904296875, -21.686073303222656, -20.449569702148438, -19.213064193725586, -17.976560592651367, -16.740055084228516, -15.503551483154297, -14.267046928405762, -13.030542373657227, -11.794038772583008, -10.557534217834473, -9.321029663085938, -8.084526062011719, -6.848021507263184, -5.611516952514648, -4.375012397766113, -3.1385083198547363, -1.9020040035247803, -0.6654996871948242, 0.5710048675537109, 1.807508945465088, 3.044013023376465, 4.280513763427734, 5.5170183181762695, 6.7535223960876465, 7.990026473999023, 9.226531028747559, 10.463035583496094, 11.699539184570312, 12.936043739318848, 14.172548294067383, 15.409052848815918, 16.645557403564453, 17.882061004638672, 19.11856460571289, 20.355070114135742, 21.59157371520996, 22.828079223632812, 24.06458282470703, 25.30108642578125, 26.5375919342041, 27.77409553527832, 29.010601043701172, 30.24710464477539, 31.48360824584961, 32.72011184692383, 33.95661926269531, 35.19312286376953, 36.42962646484375, 37.666133880615234, 38.90263748168945, 40.13914108276367, 41.37564468383789, 42.61214828491211, 43.84865188598633]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 15.0, 22.0, 45.0, 74.0, 113.0, 203.0, 315.0, 504.0, 784.0, 1284.0, 1958.0, 3073.0, 4587.0, 6883.0, 9971.0, 14144.0, 20162.0, 27051.0, 35815.0, 46010.0, 56099.0, 66439.0, 75504.0, 82655.0, 85804.0, 85363.0, 80498.0, 72788.0, 62901.0, 52907.0, 41923.0, 32267.0, 24521.0, 17519.0, 12627.0, 8919.0, 5819.0, 3808.0, 2616.0, 1702.0, 1024.0, 714.0, 430.0, 280.0, 146.0, 98.0, 77.0, 42.0, 25.0, 11.0, 11.0, 4.0, 0.0, 1.0, 3.0], "bins": [-17.0625, -16.5579833984375, -16.053466796875, -15.5489501953125, -15.04443359375, -14.5399169921875, -14.035400390625, -13.5308837890625, -13.0263671875, -12.5218505859375, -12.017333984375, -11.5128173828125, -11.00830078125, -10.5037841796875, -9.999267578125, -9.4947509765625, -8.990234375, -8.4857177734375, -7.981201171875, -7.4766845703125, -6.97216796875, -6.4676513671875, -5.963134765625, -5.4586181640625, -4.9541015625, -4.4495849609375, -3.945068359375, -3.4405517578125, -2.93603515625, -2.4315185546875, -1.927001953125, -1.4224853515625, -0.91796875, -0.4134521484375, 0.091064453125, 0.5955810546875, 1.10009765625, 1.6046142578125, 2.109130859375, 2.6136474609375, 3.1181640625, 3.6226806640625, 4.127197265625, 4.6317138671875, 5.13623046875, 5.6407470703125, 6.145263671875, 6.6497802734375, 7.154296875, 7.6588134765625, 8.163330078125, 8.6678466796875, 9.17236328125, 9.6768798828125, 10.181396484375, 10.6859130859375, 11.1904296875, 11.6949462890625, 12.199462890625, 12.7039794921875, 13.20849609375, 13.7130126953125, 14.217529296875, 14.7220458984375, 15.2265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 7.0, 10.0, 19.0, 15.0, 20.0, 23.0, 24.0, 24.0, 35.0, 36.0, 35.0, 37.0, 35.0, 36.0, 40.0, 42.0, 44.0, 47.0, 36.0, 38.0, 42.0, 34.0, 37.0, 42.0, 28.0, 22.0, 26.0, 32.0, 24.0, 23.0, 23.0, 8.0, 11.0, 4.0, 7.0, 0.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -34.02685546875, -32.8037109375, -31.58056640625, -30.357421875, -29.13427734375, -27.9111328125, -26.68798828125, -25.46484375, -24.24169921875, -23.0185546875, -21.79541015625, -20.572265625, -19.34912109375, -18.1259765625, -16.90283203125, -15.6796875, -14.45654296875, -13.2333984375, -12.01025390625, -10.787109375, -9.56396484375, -8.3408203125, -7.11767578125, -5.89453125, -4.67138671875, -3.4482421875, -2.22509765625, -1.001953125, 0.22119140625, 1.4443359375, 2.66748046875, 3.890625, 5.11376953125, 6.3369140625, 7.56005859375, 8.783203125, 10.00634765625, 11.2294921875, 12.45263671875, 13.67578125, 14.89892578125, 16.1220703125, 17.34521484375, 18.568359375, 19.79150390625, 21.0146484375, 22.23779296875, 23.4609375, 24.68408203125, 25.9072265625, 27.13037109375, 28.353515625, 29.57666015625, 30.7998046875, 32.02294921875, 33.24609375, 34.46923828125, 35.6923828125, 36.91552734375, 38.138671875, 39.36181640625, 40.5849609375, 41.80810546875, 43.03125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 7.0, 8.0, 16.0, 11.0, 22.0, 32.0, 69.0, 76.0, 135.0, 212.0, 369.0, 534.0, 844.0, 1295.0, 1869.0, 2870.0, 4304.0, 6263.0, 9374.0, 13320.0, 18927.0, 25823.0, 34755.0, 44481.0, 55747.0, 66369.0, 76799.0, 83823.0, 87047.0, 86446.0, 82317.0, 73883.0, 64474.0, 52546.0, 41952.0, 32340.0, 23973.0, 17293.0, 12059.0, 8498.0, 5864.0, 4006.0, 2582.0, 1712.0, 1103.0, 736.0, 467.0, 308.0, 224.0, 124.0, 84.0, 69.0, 46.0, 12.0, 14.0, 12.0, 12.0, 5.0, 4.0, 2.0], "bins": [-17.609375, -17.07373046875, -16.5380859375, -16.00244140625, -15.466796875, -14.93115234375, -14.3955078125, -13.85986328125, -13.32421875, -12.78857421875, -12.2529296875, -11.71728515625, -11.181640625, -10.64599609375, -10.1103515625, -9.57470703125, -9.0390625, -8.50341796875, -7.9677734375, -7.43212890625, -6.896484375, -6.36083984375, -5.8251953125, -5.28955078125, -4.75390625, -4.21826171875, -3.6826171875, -3.14697265625, -2.611328125, -2.07568359375, -1.5400390625, -1.00439453125, -0.46875, 0.06689453125, 0.6025390625, 1.13818359375, 1.673828125, 2.20947265625, 2.7451171875, 3.28076171875, 3.81640625, 4.35205078125, 4.8876953125, 5.42333984375, 5.958984375, 6.49462890625, 7.0302734375, 7.56591796875, 8.1015625, 8.63720703125, 9.1728515625, 9.70849609375, 10.244140625, 10.77978515625, 11.3154296875, 11.85107421875, 12.38671875, 12.92236328125, 13.4580078125, 13.99365234375, 14.529296875, 15.06494140625, 15.6005859375, 16.13623046875, 16.671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 7.0, 7.0, 11.0, 10.0, 9.0, 11.0, 16.0, 19.0, 19.0, 18.0, 27.0, 24.0, 15.0, 40.0, 28.0, 46.0, 30.0, 38.0, 35.0, 36.0, 45.0, 50.0, 38.0, 39.0, 42.0, 42.0, 45.0, 33.0, 33.0, 25.0, 26.0, 20.0, 21.0, 22.0, 11.0, 10.0, 14.0, 8.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.4375, -23.658447265625, -22.87939453125, -22.100341796875, -21.3212890625, -20.542236328125, -19.76318359375, -18.984130859375, -18.205078125, -17.426025390625, -16.64697265625, -15.867919921875, -15.0888671875, -14.309814453125, -13.53076171875, -12.751708984375, -11.97265625, -11.193603515625, -10.41455078125, -9.635498046875, -8.8564453125, -8.077392578125, -7.29833984375, -6.519287109375, -5.740234375, -4.961181640625, -4.18212890625, -3.403076171875, -2.6240234375, -1.844970703125, -1.06591796875, -0.286865234375, 0.4921875, 1.271240234375, 2.05029296875, 2.829345703125, 3.6083984375, 4.387451171875, 5.16650390625, 5.945556640625, 6.724609375, 7.503662109375, 8.28271484375, 9.061767578125, 9.8408203125, 10.619873046875, 11.39892578125, 12.177978515625, 12.95703125, 13.736083984375, 14.51513671875, 15.294189453125, 16.0732421875, 16.852294921875, 17.63134765625, 18.410400390625, 19.189453125, 19.968505859375, 20.74755859375, 21.526611328125, 22.3056640625, 23.084716796875, 23.86376953125, 24.642822265625, 25.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 7.0, 3.0, 7.0, 8.0, 15.0, 38.0, 44.0, 85.0, 109.0, 205.0, 295.0, 453.0, 647.0, 1001.0, 1675.0, 2361.0, 3453.0, 5270.0, 7475.0, 10788.0, 15100.0, 21362.0, 28402.0, 36810.0, 46685.0, 56833.0, 66858.0, 75087.0, 81151.0, 83486.0, 83117.0, 78028.0, 70702.0, 61922.0, 51497.0, 41561.0, 32314.0, 24619.0, 18272.0, 12863.0, 9139.0, 6226.0, 4269.0, 2903.0, 1868.0, 1245.0, 779.0, 558.0, 339.0, 205.0, 147.0, 98.0, 64.0, 35.0, 25.0, 32.0, 11.0, 9.0, 4.0, 3.0, 4.0], "bins": [-6.26171875, -6.07049560546875, -5.8792724609375, -5.68804931640625, -5.496826171875, -5.30560302734375, -5.1143798828125, -4.92315673828125, -4.73193359375, -4.54071044921875, -4.3494873046875, -4.15826416015625, -3.967041015625, -3.77581787109375, -3.5845947265625, -3.39337158203125, -3.2021484375, -3.01092529296875, -2.8197021484375, -2.62847900390625, -2.437255859375, -2.24603271484375, -2.0548095703125, -1.86358642578125, -1.67236328125, -1.48114013671875, -1.2899169921875, -1.09869384765625, -0.907470703125, -0.71624755859375, -0.5250244140625, -0.33380126953125, -0.142578125, 0.04864501953125, 0.2398681640625, 0.43109130859375, 0.622314453125, 0.81353759765625, 1.0047607421875, 1.19598388671875, 1.38720703125, 1.57843017578125, 1.7696533203125, 1.96087646484375, 2.152099609375, 2.34332275390625, 2.5345458984375, 2.72576904296875, 2.9169921875, 3.10821533203125, 3.2994384765625, 3.49066162109375, 3.681884765625, 3.87310791015625, 4.0643310546875, 4.25555419921875, 4.44677734375, 4.63800048828125, 4.8292236328125, 5.02044677734375, 5.211669921875, 5.40289306640625, 5.5941162109375, 5.78533935546875, 5.9765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 4.0, 10.0, 8.0, 18.0, 15.0, 13.0, 16.0, 17.0, 30.0, 22.0, 31.0, 28.0, 37.0, 40.0, 46.0, 45.0, 40.0, 55.0, 45.0, 40.0, 45.0, 42.0, 37.0, 36.0, 33.0, 41.0, 34.0, 28.0, 22.0, 21.0, 24.0, 18.0, 10.0, 5.0, 11.0, 6.0, 7.0, 8.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009441375732421875, -0.0009143650531768799, -0.0008845925331115723, -0.0008548200130462646, -0.000825047492980957, -0.0007952749729156494, -0.0007655024528503418, -0.0007357299327850342, -0.0007059574127197266, -0.0006761848926544189, -0.0006464123725891113, -0.0006166398525238037, -0.0005868673324584961, -0.0005570948123931885, -0.0005273222923278809, -0.0004975497722625732, -0.0004677772521972656, -0.000438004732131958, -0.0004082322120666504, -0.0003784596920013428, -0.00034868717193603516, -0.00031891465187072754, -0.0002891421318054199, -0.0002593696117401123, -0.0002295970916748047, -0.00019982457160949707, -0.00017005205154418945, -0.00014027953147888184, -0.00011050701141357422, -8.07344913482666e-05, -5.0961971282958984e-05, -2.1189451217651367e-05, 8.58306884765625e-06, 3.835558891296387e-05, 6.812810897827148e-05, 9.79006290435791e-05, 0.00012767314910888672, 0.00015744566917419434, 0.00018721818923950195, 0.00021699070930480957, 0.0002467632293701172, 0.0002765357494354248, 0.0003063082695007324, 0.00033608078956604004, 0.00036585330963134766, 0.0003956258296966553, 0.0004253983497619629, 0.0004551708698272705, 0.0004849433898925781, 0.0005147159099578857, 0.0005444884300231934, 0.000574260950088501, 0.0006040334701538086, 0.0006338059902191162, 0.0006635785102844238, 0.0006933510303497314, 0.0007231235504150391, 0.0007528960704803467, 0.0007826685905456543, 0.0008124411106109619, 0.0008422136306762695, 0.0008719861507415771, 0.0009017586708068848, 0.0009315311908721924, 0.0009613037109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 12.0, 16.0, 29.0, 39.0, 63.0, 111.0, 150.0, 232.0, 363.0, 635.0, 963.0, 1535.0, 2448.0, 3877.0, 5923.0, 9022.0, 13848.0, 20084.0, 28824.0, 39891.0, 53558.0, 67445.0, 81671.0, 92332.0, 98720.0, 98803.0, 93045.0, 81615.0, 68516.0, 54119.0, 40884.0, 29510.0, 20568.0, 13893.0, 9219.0, 6072.0, 3845.0, 2412.0, 1547.0, 997.0, 637.0, 417.0, 261.0, 147.0, 108.0, 61.0, 41.0, 19.0, 18.0, 11.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.7109375, -7.47015380859375, -7.2293701171875, -6.98858642578125, -6.747802734375, -6.50701904296875, -6.2662353515625, -6.02545166015625, -5.78466796875, -5.54388427734375, -5.3031005859375, -5.06231689453125, -4.821533203125, -4.58074951171875, -4.3399658203125, -4.09918212890625, -3.8583984375, -3.61761474609375, -3.3768310546875, -3.13604736328125, -2.895263671875, -2.65447998046875, -2.4136962890625, -2.17291259765625, -1.93212890625, -1.69134521484375, -1.4505615234375, -1.20977783203125, -0.968994140625, -0.72821044921875, -0.4874267578125, -0.24664306640625, -0.005859375, 0.23492431640625, 0.4757080078125, 0.71649169921875, 0.957275390625, 1.19805908203125, 1.4388427734375, 1.67962646484375, 1.92041015625, 2.16119384765625, 2.4019775390625, 2.64276123046875, 2.883544921875, 3.12432861328125, 3.3651123046875, 3.60589599609375, 3.8466796875, 4.08746337890625, 4.3282470703125, 4.56903076171875, 4.809814453125, 5.05059814453125, 5.2913818359375, 5.53216552734375, 5.77294921875, 6.01373291015625, 6.2545166015625, 6.49530029296875, 6.736083984375, 6.97686767578125, 7.2176513671875, 7.45843505859375, 7.69921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 5.0, 10.0, 9.0, 7.0, 8.0, 9.0, 12.0, 14.0, 20.0, 28.0, 20.0, 27.0, 34.0, 27.0, 30.0, 45.0, 46.0, 38.0, 43.0, 36.0, 41.0, 37.0, 50.0, 46.0, 36.0, 36.0, 33.0, 31.0, 28.0, 29.0, 37.0, 22.0, 11.0, 15.0, 14.0, 12.0, 5.0, 12.0, 8.0, 4.0, 3.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0], "bins": [-3.625, -3.5166015625, -3.408203125, -3.2998046875, -3.19140625, -3.0830078125, -2.974609375, -2.8662109375, -2.7578125, -2.6494140625, -2.541015625, -2.4326171875, -2.32421875, -2.2158203125, -2.107421875, -1.9990234375, -1.890625, -1.7822265625, -1.673828125, -1.5654296875, -1.45703125, -1.3486328125, -1.240234375, -1.1318359375, -1.0234375, -0.9150390625, -0.806640625, -0.6982421875, -0.58984375, -0.4814453125, -0.373046875, -0.2646484375, -0.15625, -0.0478515625, 0.060546875, 0.1689453125, 0.27734375, 0.3857421875, 0.494140625, 0.6025390625, 0.7109375, 0.8193359375, 0.927734375, 1.0361328125, 1.14453125, 1.2529296875, 1.361328125, 1.4697265625, 1.578125, 1.6865234375, 1.794921875, 1.9033203125, 2.01171875, 2.1201171875, 2.228515625, 2.3369140625, 2.4453125, 2.5537109375, 2.662109375, 2.7705078125, 2.87890625, 2.9873046875, 3.095703125, 3.2041015625, 3.3125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 3.0, 13.0, 7.0, 19.0, 13.0, 16.0, 19.0, 21.0, 28.0, 26.0, 31.0, 28.0, 33.0, 39.0, 45.0, 37.0, 56.0, 59.0, 46.0, 47.0, 35.0, 47.0, 52.0, 28.0, 35.0, 36.0, 32.0, 27.0, 13.0, 11.0, 18.0, 17.0, 13.0, 6.0, 9.0, 6.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.935272216796875, -35.74992752075195, -34.56458282470703, -33.37923812866211, -32.19389343261719, -31.008546829223633, -29.823200225830078, -28.637855529785156, -27.452510833740234, -26.267166137695312, -25.08182144165039, -23.896474838256836, -22.711130142211914, -21.525785446166992, -20.340438842773438, -19.155094146728516, -17.969749450683594, -16.784404754638672, -15.599059104919434, -14.413713455200195, -13.228368759155273, -12.043024063110352, -10.857678413391113, -9.672332763671875, -8.486988067626953, -7.301642894744873, -6.116297721862793, -4.930952548980713, -3.745607376098633, -2.5602622032165527, -1.3749170303344727, -0.18957138061523438, 0.9957771301269531, 2.181122303009033, 3.3664674758911133, 4.551812648773193, 5.737157821655273, 6.9225029945373535, 8.107848167419434, 9.293193817138672, 10.478538513183594, 11.663883209228516, 12.849228858947754, 14.034574508666992, 15.219919204711914, 16.405263900756836, 17.59061050415039, 18.775955200195312, 19.961299896240234, 21.146644592285156, 22.331989288330078, 23.517335891723633, 24.702680587768555, 25.888025283813477, 27.07337188720703, 28.258716583251953, 29.444061279296875, 30.629405975341797, 31.81475067138672, 33.00009536743164, 34.18544006347656, 35.37078857421875, 36.55613327026367, 37.741477966308594, 38.926822662353516]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 12.0, 8.0, 16.0, 16.0, 23.0, 23.0, 31.0, 30.0, 46.0, 38.0, 36.0, 33.0, 34.0, 49.0, 46.0, 48.0, 28.0, 45.0, 43.0, 39.0, 59.0, 41.0, 36.0, 34.0, 35.0, 17.0, 26.0, 22.0, 9.0, 17.0, 12.0, 11.0, 3.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.25132751464844, -40.81850814819336, -39.38568878173828, -37.9528694152832, -36.520050048828125, -35.08723068237305, -33.65441131591797, -32.221595764160156, -30.788774490356445, -29.355955123901367, -27.92313575744629, -26.490318298339844, -25.057498931884766, -23.624679565429688, -22.19186019897461, -20.75904083251953, -19.326221466064453, -17.893402099609375, -16.460582733154297, -15.027764320373535, -13.594944953918457, -12.162125587463379, -10.729307174682617, -9.296487808227539, -7.863668441772461, -6.430849075317383, -4.998030185699463, -3.565211296081543, -2.132391929626465, -0.6995725631713867, 0.733245849609375, 2.166065216064453, 3.5988845825195312, 5.031703948974609, 6.464522838592529, 7.897341728210449, 9.330161094665527, 10.762980461120605, 12.195798873901367, 13.628618240356445, 15.061437606811523, 16.4942569732666, 17.92707633972168, 19.359893798828125, 20.792713165283203, 22.22553253173828, 23.65835189819336, 25.091171264648438, 26.523990631103516, 27.956809997558594, 29.389629364013672, 30.82244873046875, 32.25526809692383, 33.688087463378906, 35.12090301513672, 36.55372619628906, 37.986541748046875, 39.41936111450195, 40.85218048095703, 42.28499984741211, 43.71781921386719, 45.150638580322266, 46.583457946777344, 48.016273498535156, 49.4490966796875]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [3.0, 14.0, 11.0, 19.0, 25.0, 54.0, 84.0, 142.0, 221.0, 370.0, 557.0, 916.0, 1530.0, 2302.0, 3497.0, 5439.0, 8434.0, 12306.0, 18511.0, 26811.0, 38447.0, 54175.0, 75005.0, 99963.0, 132461.0, 167132.0, 206725.0, 244937.0, 280860.0, 308619.0, 325407.0, 330308.0, 318000.0, 296064.0, 263961.0, 225580.0, 187133.0, 147743.0, 114878.0, 86603.0, 63796.0, 45592.0, 32333.0, 22043.0, 15227.0, 10215.0, 7048.0, 4489.0, 2884.0, 1952.0, 1241.0, 808.0, 530.0, 336.0, 232.0, 123.0, 75.0, 52.0, 33.0, 16.0, 18.0, 7.0, 5.0, 2.0], "bins": [-23.625, -22.869140625, -22.11328125, -21.357421875, -20.6015625, -19.845703125, -19.08984375, -18.333984375, -17.578125, -16.822265625, -16.06640625, -15.310546875, -14.5546875, -13.798828125, -13.04296875, -12.287109375, -11.53125, -10.775390625, -10.01953125, -9.263671875, -8.5078125, -7.751953125, -6.99609375, -6.240234375, -5.484375, -4.728515625, -3.97265625, -3.216796875, -2.4609375, -1.705078125, -0.94921875, -0.193359375, 0.5625, 1.318359375, 2.07421875, 2.830078125, 3.5859375, 4.341796875, 5.09765625, 5.853515625, 6.609375, 7.365234375, 8.12109375, 8.876953125, 9.6328125, 10.388671875, 11.14453125, 11.900390625, 12.65625, 13.412109375, 14.16796875, 14.923828125, 15.6796875, 16.435546875, 17.19140625, 17.947265625, 18.703125, 19.458984375, 20.21484375, 20.970703125, 21.7265625, 22.482421875, 23.23828125, 23.994140625, 24.75]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 3.0, 4.0, 12.0, 10.0, 11.0, 15.0, 30.0, 25.0, 24.0, 29.0, 34.0, 47.0, 41.0, 50.0, 38.0, 42.0, 38.0, 46.0, 39.0, 55.0, 42.0, 33.0, 43.0, 48.0, 32.0, 29.0, 39.0, 26.0, 27.0, 18.0, 21.0, 6.0, 11.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -38.82568359375, -37.4326171875, -36.03955078125, -34.646484375, -33.25341796875, -31.8603515625, -30.46728515625, -29.07421875, -27.68115234375, -26.2880859375, -24.89501953125, -23.501953125, -22.10888671875, -20.7158203125, -19.32275390625, -17.9296875, -16.53662109375, -15.1435546875, -13.75048828125, -12.357421875, -10.96435546875, -9.5712890625, -8.17822265625, -6.78515625, -5.39208984375, -3.9990234375, -2.60595703125, -1.212890625, 0.18017578125, 1.5732421875, 2.96630859375, 4.359375, 5.75244140625, 7.1455078125, 8.53857421875, 9.931640625, 11.32470703125, 12.7177734375, 14.11083984375, 15.50390625, 16.89697265625, 18.2900390625, 19.68310546875, 21.076171875, 22.46923828125, 23.8623046875, 25.25537109375, 26.6484375, 28.04150390625, 29.4345703125, 30.82763671875, 32.220703125, 33.61376953125, 35.0068359375, 36.39990234375, 37.79296875, 39.18603515625, 40.5791015625, 41.97216796875, 43.365234375, 44.75830078125, 46.1513671875, 47.54443359375, 48.9375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 7.0, 22.0, 33.0, 52.0, 101.0, 195.0, 335.0, 613.0, 1176.0, 2123.0, 3734.0, 6502.0, 11439.0, 19120.0, 32274.0, 52148.0, 81254.0, 122102.0, 174636.0, 236404.0, 304919.0, 364503.0, 409665.0, 427608.0, 417532.0, 378398.0, 321869.0, 255505.0, 192704.0, 136198.0, 91395.0, 58871.0, 37299.0, 22367.0, 13303.0, 7797.0, 4468.0, 2489.0, 1397.0, 779.0, 409.0, 243.0, 127.0, 75.0, 31.0, 27.0, 25.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.0, -34.8623046875, -33.724609375, -32.5869140625, -31.44921875, -30.3115234375, -29.173828125, -28.0361328125, -26.8984375, -25.7607421875, -24.623046875, -23.4853515625, -22.34765625, -21.2099609375, -20.072265625, -18.9345703125, -17.796875, -16.6591796875, -15.521484375, -14.3837890625, -13.24609375, -12.1083984375, -10.970703125, -9.8330078125, -8.6953125, -7.5576171875, -6.419921875, -5.2822265625, -4.14453125, -3.0068359375, -1.869140625, -0.7314453125, 0.40625, 1.5439453125, 2.681640625, 3.8193359375, 4.95703125, 6.0947265625, 7.232421875, 8.3701171875, 9.5078125, 10.6455078125, 11.783203125, 12.9208984375, 14.05859375, 15.1962890625, 16.333984375, 17.4716796875, 18.609375, 19.7470703125, 20.884765625, 22.0224609375, 23.16015625, 24.2978515625, 25.435546875, 26.5732421875, 27.7109375, 28.8486328125, 29.986328125, 31.1240234375, 32.26171875, 33.3994140625, 34.537109375, 35.6748046875, 36.8125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 6.0, 10.0, 7.0, 15.0, 17.0, 27.0, 25.0, 35.0, 30.0, 41.0, 73.0, 93.0, 109.0, 109.0, 140.0, 140.0, 164.0, 176.0, 188.0, 201.0, 203.0, 202.0, 230.0, 203.0, 182.0, 187.0, 189.0, 155.0, 129.0, 115.0, 135.0, 93.0, 98.0, 66.0, 65.0, 55.0, 38.0, 35.0, 23.0, 18.0, 20.0, 8.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0], "bins": [-23.359375, -22.739501953125, -22.11962890625, -21.499755859375, -20.8798828125, -20.260009765625, -19.64013671875, -19.020263671875, -18.400390625, -17.780517578125, -17.16064453125, -16.540771484375, -15.9208984375, -15.301025390625, -14.68115234375, -14.061279296875, -13.44140625, -12.821533203125, -12.20166015625, -11.581787109375, -10.9619140625, -10.342041015625, -9.72216796875, -9.102294921875, -8.482421875, -7.862548828125, -7.24267578125, -6.622802734375, -6.0029296875, -5.383056640625, -4.76318359375, -4.143310546875, -3.5234375, -2.903564453125, -2.28369140625, -1.663818359375, -1.0439453125, -0.424072265625, 0.19580078125, 0.815673828125, 1.435546875, 2.055419921875, 2.67529296875, 3.295166015625, 3.9150390625, 4.534912109375, 5.15478515625, 5.774658203125, 6.39453125, 7.014404296875, 7.63427734375, 8.254150390625, 8.8740234375, 9.493896484375, 10.11376953125, 10.733642578125, 11.353515625, 11.973388671875, 12.59326171875, 13.213134765625, 13.8330078125, 14.452880859375, 15.07275390625, 15.692626953125, 16.3125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 4.0, 5.0, 6.0, 12.0, 13.0, 15.0, 28.0, 19.0, 21.0, 16.0, 36.0, 33.0, 38.0, 43.0, 43.0, 62.0, 57.0, 47.0, 48.0, 59.0, 40.0, 37.0, 34.0, 34.0, 41.0, 24.0, 26.0, 31.0, 18.0, 20.0, 18.0, 11.0, 10.0, 11.0, 6.0, 7.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-57.164886474609375, -55.528656005859375, -53.892425537109375, -52.25619125366211, -50.61996078491211, -48.98373031616211, -47.347496032714844, -45.711265563964844, -44.075035095214844, -42.438804626464844, -40.802574157714844, -39.16633987426758, -37.53010940551758, -35.89387893676758, -34.25764465332031, -32.62141418457031, -30.985183715820312, -29.348953247070312, -27.71272087097168, -26.076488494873047, -24.440258026123047, -22.804027557373047, -21.167795181274414, -19.53156280517578, -17.89533233642578, -16.25910186767578, -14.622869491577148, -12.986638069152832, -11.350406646728516, -9.7141752243042, -8.077943801879883, -6.441712379455566, -4.80548095703125, -3.1692495346069336, -1.5330181121826172, 0.10321331024169922, 1.7394447326660156, 3.375676155090332, 5.011907577514648, 6.648138999938965, 8.284370422363281, 9.920601844787598, 11.556833267211914, 13.19306468963623, 14.829296112060547, 16.465526580810547, 18.10175895690918, 19.737991333007812, 21.374221801757812, 23.010452270507812, 24.646684646606445, 26.282917022705078, 27.919147491455078, 29.555377960205078, 31.19161033630371, 32.827842712402344, 34.464073181152344, 36.100303649902344, 37.736534118652344, 39.37276840209961, 41.00899887084961, 42.64522933959961, 44.281463623046875, 45.917694091796875, 47.553924560546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 12.0, 10.0, 12.0, 20.0, 17.0, 13.0, 21.0, 24.0, 26.0, 30.0, 49.0, 37.0, 43.0, 38.0, 50.0, 36.0, 50.0, 40.0, 46.0, 54.0, 38.0, 50.0, 45.0, 37.0, 35.0, 30.0, 22.0, 27.0, 18.0, 10.0, 12.0, 11.0, 10.0, 5.0, 4.0, 5.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.53180694580078, -53.77714920043945, -52.022491455078125, -50.26783752441406, -48.513179779052734, -46.758522033691406, -45.00386428833008, -43.24920654296875, -41.49454879760742, -39.739891052246094, -37.985233306884766, -36.23057556152344, -34.475921630859375, -32.72126388549805, -30.96660614013672, -29.21194839477539, -27.457292556762695, -25.702634811401367, -23.947978973388672, -22.193321228027344, -20.438663482666016, -18.684005737304688, -16.929349899291992, -15.174692153930664, -13.420035362243652, -11.66537857055664, -9.910720825195312, -8.1560640335083, -6.401406764984131, -4.646749496459961, -2.892092704772949, -1.137434959411621, 0.6172218322753906, 2.3718791007995605, 4.1265363693237305, 5.881193161010742, 7.635850429534912, 9.390507698059082, 11.145164489746094, 12.899822235107422, 14.654479026794434, 16.409135818481445, 18.163793563842773, 19.91844940185547, 21.673107147216797, 23.427764892578125, 25.182422637939453, 26.93708038330078, 28.691736221313477, 30.446393966674805, 32.2010498046875, 33.95570755004883, 35.710365295410156, 37.465023040771484, 39.21968078613281, 40.974334716796875, 42.7289924621582, 44.48365020751953, 46.23830795288086, 47.99296569824219, 49.74761962890625, 51.50227737426758, 53.256935119628906, 55.011592864990234, 56.76625061035156]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 13.0, 16.0, 49.0, 42.0, 53.0, 94.0, 135.0, 201.0, 289.0, 452.0, 706.0, 1112.0, 1557.0, 2543.0, 3829.0, 5839.0, 9310.0, 14902.0, 23269.0, 36531.0, 56100.0, 82515.0, 114099.0, 138189.0, 143347.0, 126019.0, 96425.0, 67221.0, 44701.0, 28626.0, 18124.0, 11495.0, 7311.0, 4640.0, 3039.0, 2035.0, 1232.0, 839.0, 515.0, 365.0, 250.0, 194.0, 107.0, 75.0, 57.0, 40.0, 13.0, 11.0, 11.0, 3.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.78125, -6.5640869140625, -6.346923828125, -6.1297607421875, -5.91259765625, -5.6954345703125, -5.478271484375, -5.2611083984375, -5.0439453125, -4.8267822265625, -4.609619140625, -4.3924560546875, -4.17529296875, -3.9581298828125, -3.740966796875, -3.5238037109375, -3.306640625, -3.0894775390625, -2.872314453125, -2.6551513671875, -2.43798828125, -2.2208251953125, -2.003662109375, -1.7864990234375, -1.5693359375, -1.3521728515625, -1.135009765625, -0.9178466796875, -0.70068359375, -0.4835205078125, -0.266357421875, -0.0491943359375, 0.16796875, 0.3851318359375, 0.602294921875, 0.8194580078125, 1.03662109375, 1.2537841796875, 1.470947265625, 1.6881103515625, 1.9052734375, 2.1224365234375, 2.339599609375, 2.5567626953125, 2.77392578125, 2.9910888671875, 3.208251953125, 3.4254150390625, 3.642578125, 3.8597412109375, 4.076904296875, 4.2940673828125, 4.51123046875, 4.7283935546875, 4.945556640625, 5.1627197265625, 5.3798828125, 5.5970458984375, 5.814208984375, 6.0313720703125, 6.24853515625, 6.4656982421875, 6.682861328125, 6.9000244140625, 7.1171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 8.0, 6.0, 13.0, 9.0, 13.0, 13.0, 9.0, 16.0, 22.0, 18.0, 15.0, 27.0, 28.0, 37.0, 36.0, 34.0, 37.0, 25.0, 45.0, 33.0, 45.0, 37.0, 41.0, 47.0, 36.0, 40.0, 42.0, 31.0, 22.0, 22.0, 25.0, 23.0, 25.0, 19.0, 23.0, 15.0, 11.0, 6.0, 14.0, 6.0, 0.0, 9.0, 0.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.21875, -44.666015625, -43.11328125, -41.560546875, -40.0078125, -38.455078125, -36.90234375, -35.349609375, -33.796875, -32.244140625, -30.69140625, -29.138671875, -27.5859375, -26.033203125, -24.48046875, -22.927734375, -21.375, -19.822265625, -18.26953125, -16.716796875, -15.1640625, -13.611328125, -12.05859375, -10.505859375, -8.953125, -7.400390625, -5.84765625, -4.294921875, -2.7421875, -1.189453125, 0.36328125, 1.916015625, 3.46875, 5.021484375, 6.57421875, 8.126953125, 9.6796875, 11.232421875, 12.78515625, 14.337890625, 15.890625, 17.443359375, 18.99609375, 20.548828125, 22.1015625, 23.654296875, 25.20703125, 26.759765625, 28.3125, 29.865234375, 31.41796875, 32.970703125, 34.5234375, 36.076171875, 37.62890625, 39.181640625, 40.734375, 42.287109375, 43.83984375, 45.392578125, 46.9453125, 48.498046875, 50.05078125, 51.603515625, 53.15625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 16.0, 17.0, 30.0, 45.0, 74.0, 111.0, 179.0, 302.0, 515.0, 802.0, 1309.0, 2351.0, 3983.0, 7066.0, 12593.0, 22085.0, 39185.0, 68192.0, 110313.0, 159828.0, 185231.0, 161237.0, 112624.0, 68505.0, 39576.0, 22451.0, 12793.0, 7182.0, 4072.0, 2415.0, 1316.0, 830.0, 532.0, 279.0, 197.0, 109.0, 78.0, 42.0, 33.0, 17.0, 15.0, 11.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796875, -8.5177001953125, -8.238525390625, -7.9593505859375, -7.68017578125, -7.4010009765625, -7.121826171875, -6.8426513671875, -6.5634765625, -6.2843017578125, -6.005126953125, -5.7259521484375, -5.44677734375, -5.1676025390625, -4.888427734375, -4.6092529296875, -4.330078125, -4.0509033203125, -3.771728515625, -3.4925537109375, -3.21337890625, -2.9342041015625, -2.655029296875, -2.3758544921875, -2.0966796875, -1.8175048828125, -1.538330078125, -1.2591552734375, -0.97998046875, -0.7008056640625, -0.421630859375, -0.1424560546875, 0.13671875, 0.4158935546875, 0.695068359375, 0.9742431640625, 1.25341796875, 1.5325927734375, 1.811767578125, 2.0909423828125, 2.3701171875, 2.6492919921875, 2.928466796875, 3.2076416015625, 3.48681640625, 3.7659912109375, 4.045166015625, 4.3243408203125, 4.603515625, 4.8826904296875, 5.161865234375, 5.4410400390625, 5.72021484375, 5.9993896484375, 6.278564453125, 6.5577392578125, 6.8369140625, 7.1160888671875, 7.395263671875, 7.6744384765625, 7.95361328125, 8.2327880859375, 8.511962890625, 8.7911376953125, 9.0703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 8.0, 1.0, 5.0, 6.0, 16.0, 11.0, 10.0, 16.0, 15.0, 15.0, 29.0, 26.0, 22.0, 23.0, 39.0, 54.0, 50.0, 24.0, 38.0, 31.0, 44.0, 46.0, 44.0, 38.0, 35.0, 34.0, 35.0, 31.0, 25.0, 23.0, 34.0, 31.0, 20.0, 14.0, 15.0, 13.0, 14.0, 14.0, 8.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-31.328125, -30.367919921875, -29.40771484375, -28.447509765625, -27.4873046875, -26.527099609375, -25.56689453125, -24.606689453125, -23.646484375, -22.686279296875, -21.72607421875, -20.765869140625, -19.8056640625, -18.845458984375, -17.88525390625, -16.925048828125, -15.96484375, -15.004638671875, -14.04443359375, -13.084228515625, -12.1240234375, -11.163818359375, -10.20361328125, -9.243408203125, -8.283203125, -7.322998046875, -6.36279296875, -5.402587890625, -4.4423828125, -3.482177734375, -2.52197265625, -1.561767578125, -0.6015625, 0.358642578125, 1.31884765625, 2.279052734375, 3.2392578125, 4.199462890625, 5.15966796875, 6.119873046875, 7.080078125, 8.040283203125, 9.00048828125, 9.960693359375, 10.9208984375, 11.881103515625, 12.84130859375, 13.801513671875, 14.76171875, 15.721923828125, 16.68212890625, 17.642333984375, 18.6025390625, 19.562744140625, 20.52294921875, 21.483154296875, 22.443359375, 23.403564453125, 24.36376953125, 25.323974609375, 26.2841796875, 27.244384765625, 28.20458984375, 29.164794921875, 30.125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 8.0, 14.0, 12.0, 22.0, 35.0, 42.0, 72.0, 100.0, 143.0, 200.0, 307.0, 464.0, 673.0, 1096.0, 1886.0, 3221.0, 5569.0, 10178.0, 19075.0, 36435.0, 68869.0, 124002.0, 193172.0, 216490.0, 160888.0, 94473.0, 51086.0, 27193.0, 14327.0, 7676.0, 4362.0, 2449.0, 1479.0, 891.0, 537.0, 324.0, 255.0, 149.0, 103.0, 80.0, 56.0, 31.0, 38.0, 19.0, 15.0, 12.0, 10.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.179931640625, -1.13818359375, -1.096435546875, -1.0546875, -1.012939453125, -0.97119140625, -0.929443359375, -0.8876953125, -0.845947265625, -0.80419921875, -0.762451171875, -0.720703125, -0.678955078125, -0.63720703125, -0.595458984375, -0.5537109375, -0.511962890625, -0.47021484375, -0.428466796875, -0.38671875, -0.344970703125, -0.30322265625, -0.261474609375, -0.2197265625, -0.177978515625, -0.13623046875, -0.094482421875, -0.052734375, -0.010986328125, 0.03076171875, 0.072509765625, 0.1142578125, 0.156005859375, 0.19775390625, 0.239501953125, 0.28125, 0.322998046875, 0.36474609375, 0.406494140625, 0.4482421875, 0.489990234375, 0.53173828125, 0.573486328125, 0.615234375, 0.656982421875, 0.69873046875, 0.740478515625, 0.7822265625, 0.823974609375, 0.86572265625, 0.907470703125, 0.94921875, 0.990966796875, 1.03271484375, 1.074462890625, 1.1162109375, 1.157958984375, 1.19970703125, 1.241455078125, 1.283203125, 1.324951171875, 1.36669921875, 1.408447265625, 1.4501953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 5.0, 6.0, 12.0, 7.0, 12.0, 18.0, 6.0, 15.0, 19.0, 17.0, 21.0, 20.0, 29.0, 29.0, 30.0, 47.0, 35.0, 34.0, 33.0, 53.0, 38.0, 36.0, 54.0, 44.0, 36.0, 39.0, 37.0, 23.0, 31.0, 32.0, 30.0, 23.0, 19.0, 15.0, 19.0, 10.0, 6.0, 9.0, 7.0, 2.0, 8.0, 9.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.00010484457015991211, -0.00010163150727748871, -9.841844439506531e-05, -9.52053815126419e-05, -9.19923186302185e-05, -8.87792557477951e-05, -8.55661928653717e-05, -8.23531299829483e-05, -7.91400671005249e-05, -7.59270042181015e-05, -7.27139413356781e-05, -6.95008784532547e-05, -6.62878155708313e-05, -6.30747526884079e-05, -5.98616898059845e-05, -5.6648626923561096e-05, -5.3435564041137695e-05, -5.0222501158714294e-05, -4.7009438276290894e-05, -4.379637539386749e-05, -4.058331251144409e-05, -3.737024962902069e-05, -3.415718674659729e-05, -3.094412386417389e-05, -2.7731060981750488e-05, -2.4517998099327087e-05, -2.1304935216903687e-05, -1.8091872334480286e-05, -1.4878809452056885e-05, -1.1665746569633484e-05, -8.452683687210083e-06, -5.239620804786682e-06, -2.0265579223632812e-06, 1.1865049600601196e-06, 4.3995678424835205e-06, 7.612630724906921e-06, 1.0825693607330322e-05, 1.4038756489753723e-05, 1.7251819372177124e-05, 2.0464882254600525e-05, 2.3677945137023926e-05, 2.6891008019447327e-05, 3.0104070901870728e-05, 3.331713378429413e-05, 3.653019666671753e-05, 3.974325954914093e-05, 4.295632243156433e-05, 4.616938531398773e-05, 4.938244819641113e-05, 5.2595511078834534e-05, 5.5808573961257935e-05, 5.9021636843681335e-05, 6.223469972610474e-05, 6.544776260852814e-05, 6.866082549095154e-05, 7.187388837337494e-05, 7.508695125579834e-05, 7.830001413822174e-05, 8.151307702064514e-05, 8.472613990306854e-05, 8.793920278549194e-05, 9.115226566791534e-05, 9.436532855033875e-05, 9.757839143276215e-05, 0.00010079145431518555]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 9.0, 16.0, 17.0, 35.0, 53.0, 53.0, 88.0, 110.0, 180.0, 278.0, 364.0, 621.0, 840.0, 1328.0, 1968.0, 3073.0, 4799.0, 7393.0, 12016.0, 19239.0, 32285.0, 52732.0, 85821.0, 135501.0, 183883.0, 177617.0, 124874.0, 78745.0, 47734.0, 28872.0, 17517.0, 10952.0, 6790.0, 4453.0, 2711.0, 1860.0, 1251.0, 770.0, 566.0, 357.0, 237.0, 173.0, 108.0, 83.0, 54.0, 38.0, 28.0, 19.0, 15.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0], "bins": [-2.193359375, -2.128662109375, -2.06396484375, -1.999267578125, -1.9345703125, -1.869873046875, -1.80517578125, -1.740478515625, -1.67578125, -1.611083984375, -1.54638671875, -1.481689453125, -1.4169921875, -1.352294921875, -1.28759765625, -1.222900390625, -1.158203125, -1.093505859375, -1.02880859375, -0.964111328125, -0.8994140625, -0.834716796875, -0.77001953125, -0.705322265625, -0.640625, -0.575927734375, -0.51123046875, -0.446533203125, -0.3818359375, -0.317138671875, -0.25244140625, -0.187744140625, -0.123046875, -0.058349609375, 0.00634765625, 0.071044921875, 0.1357421875, 0.200439453125, 0.26513671875, 0.329833984375, 0.39453125, 0.459228515625, 0.52392578125, 0.588623046875, 0.6533203125, 0.718017578125, 0.78271484375, 0.847412109375, 0.912109375, 0.976806640625, 1.04150390625, 1.106201171875, 1.1708984375, 1.235595703125, 1.30029296875, 1.364990234375, 1.4296875, 1.494384765625, 1.55908203125, 1.623779296875, 1.6884765625, 1.753173828125, 1.81787109375, 1.882568359375, 1.947265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 7.0, 9.0, 10.0, 9.0, 20.0, 22.0, 17.0, 30.0, 27.0, 41.0, 40.0, 61.0, 61.0, 72.0, 80.0, 83.0, 68.0, 63.0, 48.0, 49.0, 38.0, 32.0, 25.0, 18.0, 21.0, 11.0, 14.0, 6.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71337890625, -0.6857070922851562, -0.6580352783203125, -0.6303634643554688, -0.602691650390625, -0.5750198364257812, -0.5473480224609375, -0.5196762084960938, -0.49200439453125, -0.46433258056640625, -0.4366607666015625, -0.40898895263671875, -0.381317138671875, -0.35364532470703125, -0.3259735107421875, -0.29830169677734375, -0.2706298828125, -0.24295806884765625, -0.2152862548828125, -0.18761444091796875, -0.159942626953125, -0.13227081298828125, -0.1045989990234375, -0.07692718505859375, -0.04925537109375, -0.02158355712890625, 0.0060882568359375, 0.03376007080078125, 0.061431884765625, 0.08910369873046875, 0.1167755126953125, 0.14444732666015625, 0.172119140625, 0.19979095458984375, 0.2274627685546875, 0.25513458251953125, 0.282806396484375, 0.31047821044921875, 0.3381500244140625, 0.36582183837890625, 0.39349365234375, 0.42116546630859375, 0.4488372802734375, 0.47650909423828125, 0.504180908203125, 0.5318527221679688, 0.5595245361328125, 0.5871963500976562, 0.6148681640625, 0.6425399780273438, 0.6702117919921875, 0.6978836059570312, 0.725555419921875, 0.7532272338867188, 0.7808990478515625, 0.8085708618164062, 0.83624267578125, 0.8639144897460938, 0.8915863037109375, 0.9192581176757812, 0.946929931640625, 0.9746017456054688, 1.0022735595703125, 1.0299453735351562, 1.0576171875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 2.0, 4.0, 4.0, 8.0, 9.0, 13.0, 16.0, 21.0, 24.0, 19.0, 17.0, 34.0, 32.0, 35.0, 48.0, 39.0, 63.0, 60.0, 45.0, 42.0, 55.0, 52.0, 34.0, 32.0, 41.0, 40.0, 27.0, 23.0, 33.0, 19.0, 17.0, 19.0, 17.0, 8.0, 7.0, 11.0, 6.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.571441650390625, -55.9372673034668, -54.30309295654297, -52.66891860961914, -51.03474426269531, -49.400569915771484, -47.766395568847656, -46.132225036621094, -44.498046875, -42.86387252807617, -41.229698181152344, -39.595523834228516, -37.96134948730469, -36.32717514038086, -34.69300079345703, -33.05883026123047, -31.42465591430664, -29.790481567382812, -28.156307220458984, -26.522132873535156, -24.887958526611328, -23.2537841796875, -21.619611740112305, -19.985437393188477, -18.35126304626465, -16.71708869934082, -15.082914352416992, -13.44874095916748, -11.814566612243652, -10.180392265319824, -8.546218872070312, -6.912044525146484, -5.277873992919922, -3.643699884414673, -2.009525775909424, -0.3753519058227539, 1.2588224411010742, 2.8929967880249023, 4.527170181274414, 6.161344528198242, 7.79551887512207, 9.429693222045898, 11.063867568969727, 12.698040962219238, 14.332215309143066, 15.966389656066895, 17.600563049316406, 19.234737396240234, 20.868911743164062, 22.50308609008789, 24.13726043701172, 25.771434783935547, 27.405609130859375, 29.039783477783203, 30.6739559173584, 32.308128356933594, 33.94230651855469, 35.576480865478516, 37.210655212402344, 38.84482955932617, 40.47900390625, 42.11317825317383, 43.747352600097656, 45.38152313232422, 47.01569747924805]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 8.0, 13.0, 20.0, 17.0, 14.0, 18.0, 29.0, 24.0, 31.0, 49.0, 35.0, 45.0, 38.0, 50.0, 36.0, 52.0, 39.0, 47.0, 51.0, 39.0, 49.0, 46.0, 38.0, 34.0, 32.0, 19.0, 30.0, 16.0, 10.0, 10.0, 12.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.09373092651367, -54.33269500732422, -52.571659088134766, -50.81062316894531, -49.049591064453125, -47.28855514526367, -45.52751922607422, -43.766483306884766, -42.00544738769531, -40.24441146850586, -38.483375549316406, -36.72234344482422, -34.961307525634766, -33.20027160644531, -31.43923568725586, -29.678199768066406, -27.91716766357422, -26.156131744384766, -24.395097732543945, -22.634061813354492, -20.873027801513672, -19.11199188232422, -17.350955963134766, -15.589920997619629, -13.828886032104492, -12.067851066589355, -10.306816101074219, -8.545780181884766, -6.784745216369629, -5.023710250854492, -3.262674331665039, -1.5016393661499023, 0.2593955993652344, 2.02043080329895, 3.781466007232666, 5.542501449584961, 7.303536415100098, 9.064571380615234, 10.825607299804688, 12.586642265319824, 14.347677230834961, 16.108713150024414, 17.869747161865234, 19.630783081054688, 21.39181900024414, 23.15285301208496, 24.913888931274414, 26.674922943115234, 28.435958862304688, 30.19699478149414, 31.95802879333496, 33.71906280517578, 35.480098724365234, 37.24113464355469, 39.00217056274414, 40.763206481933594, 42.52423858642578, 44.285274505615234, 46.04631042480469, 47.807342529296875, 49.56837844848633, 51.32941436767578, 53.090450286865234, 54.85148620605469, 56.61252212524414]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 12.0, 22.0, 51.0, 87.0, 127.0, 196.0, 333.0, 566.0, 919.0, 1516.0, 2474.0, 3760.0, 6025.0, 9551.0, 14535.0, 21571.0, 30723.0, 42543.0, 56514.0, 71576.0, 85019.0, 96656.0, 101366.0, 100010.0, 92359.0, 79701.0, 65271.0, 50505.0, 36997.0, 26568.0, 18029.0, 12052.0, 7652.0, 4997.0, 3245.0, 1974.0, 1216.0, 738.0, 417.0, 268.0, 154.0, 110.0, 64.0, 30.0, 22.0, 11.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.34375, -23.5263671875, -22.708984375, -21.8916015625, -21.07421875, -20.2568359375, -19.439453125, -18.6220703125, -17.8046875, -16.9873046875, -16.169921875, -15.3525390625, -14.53515625, -13.7177734375, -12.900390625, -12.0830078125, -11.265625, -10.4482421875, -9.630859375, -8.8134765625, -7.99609375, -7.1787109375, -6.361328125, -5.5439453125, -4.7265625, -3.9091796875, -3.091796875, -2.2744140625, -1.45703125, -0.6396484375, 0.177734375, 0.9951171875, 1.8125, 2.6298828125, 3.447265625, 4.2646484375, 5.08203125, 5.8994140625, 6.716796875, 7.5341796875, 8.3515625, 9.1689453125, 9.986328125, 10.8037109375, 11.62109375, 12.4384765625, 13.255859375, 14.0732421875, 14.890625, 15.7080078125, 16.525390625, 17.3427734375, 18.16015625, 18.9775390625, 19.794921875, 20.6123046875, 21.4296875, 22.2470703125, 23.064453125, 23.8818359375, 24.69921875, 25.5166015625, 26.333984375, 27.1513671875, 27.96875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 10.0, 5.0, 10.0, 6.0, 10.0, 18.0, 14.0, 17.0, 23.0, 28.0, 34.0, 37.0, 30.0, 39.0, 41.0, 42.0, 41.0, 54.0, 45.0, 41.0, 46.0, 41.0, 42.0, 50.0, 47.0, 37.0, 26.0, 26.0, 21.0, 24.0, 10.0, 14.0, 11.0, 16.0, 14.0, 2.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.03125, -52.3818359375, -50.732421875, -49.0830078125, -47.43359375, -45.7841796875, -44.134765625, -42.4853515625, -40.8359375, -39.1865234375, -37.537109375, -35.8876953125, -34.23828125, -32.5888671875, -30.939453125, -29.2900390625, -27.640625, -25.9912109375, -24.341796875, -22.6923828125, -21.04296875, -19.3935546875, -17.744140625, -16.0947265625, -14.4453125, -12.7958984375, -11.146484375, -9.4970703125, -7.84765625, -6.1982421875, -4.548828125, -2.8994140625, -1.25, 0.3994140625, 2.048828125, 3.6982421875, 5.34765625, 6.9970703125, 8.646484375, 10.2958984375, 11.9453125, 13.5947265625, 15.244140625, 16.8935546875, 18.54296875, 20.1923828125, 21.841796875, 23.4912109375, 25.140625, 26.7900390625, 28.439453125, 30.0888671875, 31.73828125, 33.3876953125, 35.037109375, 36.6865234375, 38.3359375, 39.9853515625, 41.634765625, 43.2841796875, 44.93359375, 46.5830078125, 48.232421875, 49.8818359375, 51.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 14.0, 16.0, 23.0, 29.0, 67.0, 99.0, 137.0, 243.0, 342.0, 545.0, 822.0, 1270.0, 1928.0, 2865.0, 4457.0, 6630.0, 9839.0, 14633.0, 21082.0, 30221.0, 41777.0, 55117.0, 69928.0, 83714.0, 94793.0, 101026.0, 99316.0, 91615.0, 79307.0, 64797.0, 50538.0, 37021.0, 26753.0, 18866.0, 12893.0, 8877.0, 5857.0, 3774.0, 2587.0, 1728.0, 1023.0, 667.0, 451.0, 301.0, 193.0, 124.0, 81.0, 59.0, 38.0, 34.0, 16.0, 12.0, 9.0, 1.0, 3.0, 2.0, 1.0], "bins": [-30.484375, -29.555908203125, -28.62744140625, -27.698974609375, -26.7705078125, -25.842041015625, -24.91357421875, -23.985107421875, -23.056640625, -22.128173828125, -21.19970703125, -20.271240234375, -19.3427734375, -18.414306640625, -17.48583984375, -16.557373046875, -15.62890625, -14.700439453125, -13.77197265625, -12.843505859375, -11.9150390625, -10.986572265625, -10.05810546875, -9.129638671875, -8.201171875, -7.272705078125, -6.34423828125, -5.415771484375, -4.4873046875, -3.558837890625, -2.63037109375, -1.701904296875, -0.7734375, 0.155029296875, 1.08349609375, 2.011962890625, 2.9404296875, 3.868896484375, 4.79736328125, 5.725830078125, 6.654296875, 7.582763671875, 8.51123046875, 9.439697265625, 10.3681640625, 11.296630859375, 12.22509765625, 13.153564453125, 14.08203125, 15.010498046875, 15.93896484375, 16.867431640625, 17.7958984375, 18.724365234375, 19.65283203125, 20.581298828125, 21.509765625, 22.438232421875, 23.36669921875, 24.295166015625, 25.2236328125, 26.152099609375, 27.08056640625, 28.009033203125, 28.9375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 11.0, 9.0, 21.0, 24.0, 19.0, 25.0, 22.0, 37.0, 29.0, 39.0, 34.0, 34.0, 39.0, 43.0, 42.0, 46.0, 46.0, 44.0, 41.0, 40.0, 32.0, 35.0, 31.0, 29.0, 44.0, 21.0, 27.0, 23.0, 14.0, 12.0, 10.0, 11.0, 9.0, 6.0, 4.0, 5.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.375, -30.36181640625, -29.3486328125, -28.33544921875, -27.322265625, -26.30908203125, -25.2958984375, -24.28271484375, -23.26953125, -22.25634765625, -21.2431640625, -20.22998046875, -19.216796875, -18.20361328125, -17.1904296875, -16.17724609375, -15.1640625, -14.15087890625, -13.1376953125, -12.12451171875, -11.111328125, -10.09814453125, -9.0849609375, -8.07177734375, -7.05859375, -6.04541015625, -5.0322265625, -4.01904296875, -3.005859375, -1.99267578125, -0.9794921875, 0.03369140625, 1.046875, 2.06005859375, 3.0732421875, 4.08642578125, 5.099609375, 6.11279296875, 7.1259765625, 8.13916015625, 9.15234375, 10.16552734375, 11.1787109375, 12.19189453125, 13.205078125, 14.21826171875, 15.2314453125, 16.24462890625, 17.2578125, 18.27099609375, 19.2841796875, 20.29736328125, 21.310546875, 22.32373046875, 23.3369140625, 24.35009765625, 25.36328125, 26.37646484375, 27.3896484375, 28.40283203125, 29.416015625, 30.42919921875, 31.4423828125, 32.45556640625, 33.46875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 7.0, 22.0, 18.0, 24.0, 34.0, 71.0, 116.0, 202.0, 286.0, 432.0, 674.0, 1113.0, 1688.0, 2869.0, 4303.0, 6724.0, 10529.0, 15685.0, 22967.0, 33097.0, 45950.0, 61141.0, 76392.0, 89980.0, 99748.0, 103050.0, 99843.0, 89890.0, 75691.0, 60655.0, 45790.0, 32844.0, 22704.0, 15604.0, 10102.0, 6568.0, 4313.0, 2706.0, 1800.0, 1040.0, 686.0, 394.0, 293.0, 186.0, 127.0, 68.0, 57.0, 24.0, 19.0, 15.0, 10.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.46875, -11.1044921875, -10.740234375, -10.3759765625, -10.01171875, -9.6474609375, -9.283203125, -8.9189453125, -8.5546875, -8.1904296875, -7.826171875, -7.4619140625, -7.09765625, -6.7333984375, -6.369140625, -6.0048828125, -5.640625, -5.2763671875, -4.912109375, -4.5478515625, -4.18359375, -3.8193359375, -3.455078125, -3.0908203125, -2.7265625, -2.3623046875, -1.998046875, -1.6337890625, -1.26953125, -0.9052734375, -0.541015625, -0.1767578125, 0.1875, 0.5517578125, 0.916015625, 1.2802734375, 1.64453125, 2.0087890625, 2.373046875, 2.7373046875, 3.1015625, 3.4658203125, 3.830078125, 4.1943359375, 4.55859375, 4.9228515625, 5.287109375, 5.6513671875, 6.015625, 6.3798828125, 6.744140625, 7.1083984375, 7.47265625, 7.8369140625, 8.201171875, 8.5654296875, 8.9296875, 9.2939453125, 9.658203125, 10.0224609375, 10.38671875, 10.7509765625, 11.115234375, 11.4794921875, 11.84375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 4.0, 4.0, 6.0, 6.0, 11.0, 9.0, 18.0, 24.0, 24.0, 27.0, 34.0, 35.0, 28.0, 52.0, 52.0, 64.0, 47.0, 65.0, 53.0, 50.0, 56.0, 56.0, 44.0, 40.0, 44.0, 31.0, 22.0, 24.0, 7.0, 10.0, 10.0, 12.0, 9.0, 7.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016155242919921875, -0.0015586018562316895, -0.0015016794204711914, -0.0014447569847106934, -0.0013878345489501953, -0.0013309121131896973, -0.0012739896774291992, -0.0012170672416687012, -0.0011601448059082031, -0.001103222370147705, -0.001046299934387207, -0.000989377498626709, -0.0009324550628662109, -0.0008755326271057129, -0.0008186101913452148, -0.0007616877555847168, -0.0007047653198242188, -0.0006478428840637207, -0.0005909204483032227, -0.0005339980125427246, -0.00047707557678222656, -0.0004201531410217285, -0.00036323070526123047, -0.0003063082695007324, -0.0002493858337402344, -0.00019246339797973633, -0.00013554096221923828, -7.861852645874023e-05, -2.1696090698242188e-05, 3.522634506225586e-05, 9.21487808227539e-05, 0.00014907121658325195, 0.00020599365234375, 0.00026291608810424805, 0.0003198385238647461, 0.00037676095962524414, 0.0004336833953857422, 0.0004906058311462402, 0.0005475282669067383, 0.0006044507026672363, 0.0006613731384277344, 0.0007182955741882324, 0.0007752180099487305, 0.0008321404457092285, 0.0008890628814697266, 0.0009459853172302246, 0.0010029077529907227, 0.0010598301887512207, 0.0011167526245117188, 0.0011736750602722168, 0.0012305974960327148, 0.0012875199317932129, 0.001344442367553711, 0.001401364803314209, 0.001458287239074707, 0.001515209674835205, 0.0015721321105957031, 0.0016290545463562012, 0.0016859769821166992, 0.0017428994178771973, 0.0017998218536376953, 0.0018567442893981934, 0.0019136667251586914, 0.0019705891609191895, 0.0020275115966796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 16.0, 6.0, 21.0, 61.0, 74.0, 119.0, 186.0, 277.0, 461.0, 762.0, 1197.0, 1860.0, 2985.0, 4678.0, 7410.0, 11167.0, 17272.0, 25328.0, 36564.0, 50568.0, 66479.0, 82600.0, 95939.0, 104702.0, 105123.0, 98783.0, 86175.0, 70799.0, 54149.0, 39997.0, 28222.0, 19148.0, 12677.0, 8277.0, 5364.0, 3290.0, 2211.0, 1380.0, 834.0, 505.0, 332.0, 199.0, 129.0, 81.0, 55.0, 42.0, 21.0, 12.0, 12.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -12.0352783203125, -11.648681640625, -11.2620849609375, -10.87548828125, -10.4888916015625, -10.102294921875, -9.7156982421875, -9.3291015625, -8.9425048828125, -8.555908203125, -8.1693115234375, -7.78271484375, -7.3961181640625, -7.009521484375, -6.6229248046875, -6.236328125, -5.8497314453125, -5.463134765625, -5.0765380859375, -4.68994140625, -4.3033447265625, -3.916748046875, -3.5301513671875, -3.1435546875, -2.7569580078125, -2.370361328125, -1.9837646484375, -1.59716796875, -1.2105712890625, -0.823974609375, -0.4373779296875, -0.05078125, 0.3358154296875, 0.722412109375, 1.1090087890625, 1.49560546875, 1.8822021484375, 2.268798828125, 2.6553955078125, 3.0419921875, 3.4285888671875, 3.815185546875, 4.2017822265625, 4.58837890625, 4.9749755859375, 5.361572265625, 5.7481689453125, 6.134765625, 6.5213623046875, 6.907958984375, 7.2945556640625, 7.68115234375, 8.0677490234375, 8.454345703125, 8.8409423828125, 9.2275390625, 9.6141357421875, 10.000732421875, 10.3873291015625, 10.77392578125, 11.1605224609375, 11.547119140625, 11.9337158203125, 12.3203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 4.0, 10.0, 8.0, 10.0, 17.0, 14.0, 16.0, 14.0, 18.0, 24.0, 34.0, 29.0, 23.0, 25.0, 40.0, 30.0, 39.0, 38.0, 37.0, 37.0, 38.0, 45.0, 29.0, 43.0, 35.0, 33.0, 33.0, 29.0, 27.0, 29.0, 22.0, 21.0, 17.0, 13.0, 11.0, 12.0, 8.0, 10.0, 14.0, 10.0, 12.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.32421875, -5.1627197265625, -5.001220703125, -4.8397216796875, -4.67822265625, -4.5167236328125, -4.355224609375, -4.1937255859375, -4.0322265625, -3.8707275390625, -3.709228515625, -3.5477294921875, -3.38623046875, -3.2247314453125, -3.063232421875, -2.9017333984375, -2.740234375, -2.5787353515625, -2.417236328125, -2.2557373046875, -2.09423828125, -1.9327392578125, -1.771240234375, -1.6097412109375, -1.4482421875, -1.2867431640625, -1.125244140625, -0.9637451171875, -0.80224609375, -0.6407470703125, -0.479248046875, -0.3177490234375, -0.15625, 0.0052490234375, 0.166748046875, 0.3282470703125, 0.48974609375, 0.6512451171875, 0.812744140625, 0.9742431640625, 1.1357421875, 1.2972412109375, 1.458740234375, 1.6202392578125, 1.78173828125, 1.9432373046875, 2.104736328125, 2.2662353515625, 2.427734375, 2.5892333984375, 2.750732421875, 2.9122314453125, 3.07373046875, 3.2352294921875, 3.396728515625, 3.5582275390625, 3.7197265625, 3.8812255859375, 4.042724609375, 4.2042236328125, 4.36572265625, 4.5272216796875, 4.688720703125, 4.8502197265625, 5.01171875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 8.0, 7.0, 6.0, 6.0, 12.0, 7.0, 19.0, 18.0, 28.0, 31.0, 20.0, 27.0, 43.0, 43.0, 56.0, 41.0, 49.0, 43.0, 51.0, 62.0, 50.0, 47.0, 39.0, 33.0, 43.0, 29.0, 22.0, 40.0, 21.0, 17.0, 12.0, 13.0, 12.0, 10.0, 10.0, 8.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.628501892089844, -58.87873840332031, -57.12897872924805, -55.379215240478516, -53.62945556640625, -51.87969207763672, -50.12992858886719, -48.380165100097656, -46.63040542602539, -44.88064193725586, -43.130882263183594, -41.38111877441406, -39.63135528564453, -37.881595611572266, -36.131832122802734, -34.38207244873047, -32.63230895996094, -30.88254737854004, -29.13278579711914, -27.38302230834961, -25.63326072692871, -23.883499145507812, -22.13373565673828, -20.383974075317383, -18.634212493896484, -16.884450912475586, -15.134688377380371, -13.384925842285156, -11.635164260864258, -9.88540267944336, -8.135640144348145, -6.38587760925293, -4.636112213134766, -2.886350154876709, -1.1365880966186523, 0.6131739616394043, 2.362936019897461, 4.112697601318359, 5.862460136413574, 7.612222671508789, 9.361984252929688, 11.111745834350586, 12.8615083694458, 14.611270904541016, 16.361032485961914, 18.110794067382812, 19.860557556152344, 21.610319137573242, 23.36008071899414, 25.10984230041504, 26.859603881835938, 28.60936737060547, 30.359128952026367, 32.108890533447266, 33.8586540222168, 35.60841369628906, 37.358177185058594, 39.107940673828125, 40.85770034790039, 42.60746383666992, 44.35722351074219, 46.10698699951172, 47.85675048828125, 49.60651397705078, 51.35627365112305]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 4.0, 6.0, 10.0, 12.0, 17.0, 9.0, 14.0, 18.0, 21.0, 22.0, 17.0, 24.0, 27.0, 42.0, 40.0, 40.0, 33.0, 55.0, 45.0, 34.0, 41.0, 43.0, 51.0, 37.0, 31.0, 41.0, 32.0, 22.0, 26.0, 18.0, 29.0, 21.0, 16.0, 20.0, 10.0, 8.0, 10.0, 13.0, 9.0, 6.0, 0.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-58.50265121459961, -56.67827224731445, -54.85389709472656, -53.029518127441406, -51.20513916015625, -49.380760192871094, -47.5563850402832, -45.73200607299805, -43.907630920410156, -42.083251953125, -40.25887680053711, -38.43449783325195, -36.6101188659668, -34.785743713378906, -32.96136474609375, -31.136985778808594, -29.312606811523438, -27.488229751586914, -25.663850784301758, -23.839473724365234, -22.015094757080078, -20.190717697143555, -18.36634063720703, -16.541961669921875, -14.717584609985352, -12.893206596374512, -11.068828582763672, -9.244451522827148, -7.420073509216309, -5.595695495605469, -3.7713184356689453, -1.9469404220581055, -0.12255859375, 1.7018191814422607, 3.5261969566345215, 5.350574493408203, 7.174952507019043, 8.999330520629883, 10.823707580566406, 12.648085594177246, 14.472463607788086, 16.29684066772461, 18.121219635009766, 19.94559669494629, 21.769973754882812, 23.59435272216797, 25.418729782104492, 27.243106842041016, 29.067485809326172, 30.891862869262695, 32.71623992919922, 34.540618896484375, 36.36499786376953, 38.18937683105469, 40.01375198364258, 41.838130950927734, 43.662506103515625, 45.48688507080078, 47.31126022338867, 49.13563919067383, 50.960018157958984, 52.784393310546875, 54.60877227783203, 56.43315124511719, 58.257530212402344]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 14.0, 17.0, 15.0, 28.0, 55.0, 68.0, 94.0, 132.0, 178.0, 237.0, 337.0, 474.0, 639.0, 821.0, 1188.0, 1516.0, 1887.0, 2581.0, 3189.0, 4227.0, 6303.0, 997455.0, 7945.0, 5431.0, 3668.0, 2981.0, 2193.0, 1769.0, 1343.0, 1102.0, 775.0, 540.0, 376.0, 289.0, 212.0, 153.0, 93.0, 82.0, 60.0, 36.0, 34.0, 19.0, 11.0, 9.0, 11.0, 4.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-523.710693359375, -508.21435546875, -492.718017578125, -477.2217102050781, -461.7253723144531, -446.2290344238281, -430.7326965332031, -415.23638916015625, -399.74005126953125, -384.24371337890625, -368.74737548828125, -353.2510681152344, -337.7547302246094, -322.2583923339844, -306.7620544433594, -291.2657470703125, -275.7694091796875, -260.2730712890625, -244.77674865722656, -229.28041076660156, -213.78408813476562, -198.28775024414062, -182.79141235351562, -167.2950897216797, -151.79873657226562, -136.30239868164062, -120.80607604980469, -105.30973815917969, -89.81341552734375, -74.31707763671875, -58.82074737548828, -43.32441711425781, -27.828094482421875, -12.33176326751709, 3.1645679473876953, 18.660900115966797, 34.157230377197266, 49.653564453125, 65.14989471435547, 80.64622497558594, 96.1425552368164, 111.63888549804688, 127.13521575927734, 142.6315460205078, 158.1278839111328, 173.62420654296875, 189.12054443359375, 204.61688232421875, 220.1132049560547, 235.6095428466797, 251.10586547851562, 266.6022033691406, 282.0985412597656, 297.5948486328125, 313.0911865234375, 328.5875244140625, 344.0838623046875, 359.5802001953125, 375.0765380859375, 390.5728454589844, 406.0691833496094, 421.5655212402344, 437.0618591308594, 452.55816650390625, 468.05450439453125]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 8.0, 12.0, 12.0, 19.0, 29.0, 41.0, 77.0, 108.0, 125.0, 203.0, 314.0, 413.0, 638.0, 1020.0, 1646.0, 2551.0, 4466.0, 7486.0, 11797.0, 18430.0, 26933.0, 48969.0, 51201664.0, 62414.0, 29003.0, 19525.0, 12665.0, 7963.0, 4876.0, 2846.0, 1754.0, 1129.0, 742.0, 447.0, 323.0, 209.0, 130.0, 120.0, 74.0, 54.0, 30.0, 28.0, 23.0, 9.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-671.0728149414062, -652.2144775390625, -633.3560791015625, -614.4976806640625, -595.6393432617188, -576.781005859375, -557.922607421875, -539.064208984375, -520.2058715820312, -501.3475036621094, -482.4891357421875, -463.6307678222656, -444.77239990234375, -425.9140319824219, -407.0556640625, -388.1972961425781, -369.33892822265625, -350.4805603027344, -331.6221923828125, -312.7638244628906, -293.90545654296875, -275.0470886230469, -256.188720703125, -237.33035278320312, -218.47198486328125, -199.61361694335938, -180.7552490234375, -161.89688110351562, -143.03851318359375, -124.18014526367188, -105.32177734375, -86.46340942382812, -67.6051025390625, -48.746734619140625, -29.88836669921875, -11.029998779296875, 7.828369140625, 26.686737060546875, 45.54510498046875, 64.40347290039062, 83.2618408203125, 102.12020874023438, 120.97857666015625, 139.83694458007812, 158.6953125, 177.55368041992188, 196.41204833984375, 215.27041625976562, 234.1287841796875, 252.98715209960938, 271.84552001953125, 290.7038879394531, 309.562255859375, 328.4206237792969, 347.27899169921875, 366.1373596191406, 384.9957275390625, 403.8540954589844, 422.71246337890625, 441.5708312988281, 460.42919921875, 479.2875671386719, 498.14593505859375, 517.0042724609375, 535.8626708984375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 10.0, 20.0, 33.0, 37.0, 49.0, 88.0, 137.0, 252.0, 327.0, 560.0, 952.0, 1634.0, 2688.0, 4351.0, 7376.0, 12192.0, 20207.0, 33627.0, 56659.0, 93429.0, 152521.0, 250886.0, 428531.0, 950910.0, 2266198.0, 947666.0, 428124.0, 249244.0, 151735.0, 92349.0, 55448.0, 33094.0, 19942.0, 11947.0, 7121.0, 4271.0, 2669.0, 1581.0, 959.0, 590.0, 391.0, 233.0, 136.0, 97.0, 54.0, 36.0, 25.0, 21.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-9.875, -9.5511474609375, -9.227294921875, -8.9034423828125, -8.57958984375, -8.2557373046875, -7.931884765625, -7.6080322265625, -7.2841796875, -6.9603271484375, -6.636474609375, -6.3126220703125, -5.98876953125, -5.6649169921875, -5.341064453125, -5.0172119140625, -4.693359375, -4.3695068359375, -4.045654296875, -3.7218017578125, -3.39794921875, -3.0740966796875, -2.750244140625, -2.4263916015625, -2.1025390625, -1.7786865234375, -1.454833984375, -1.1309814453125, -0.80712890625, -0.4832763671875, -0.159423828125, 0.1644287109375, 0.48828125, 0.8121337890625, 1.135986328125, 1.4598388671875, 1.78369140625, 2.1075439453125, 2.431396484375, 2.7552490234375, 3.0791015625, 3.4029541015625, 3.726806640625, 4.0506591796875, 4.37451171875, 4.6983642578125, 5.022216796875, 5.3460693359375, 5.669921875, 5.9937744140625, 6.317626953125, 6.6414794921875, 6.96533203125, 7.2891845703125, 7.613037109375, 7.9368896484375, 8.2607421875, 8.5845947265625, 8.908447265625, 9.2322998046875, 9.55615234375, 9.8800048828125, 10.203857421875, 10.5277099609375, 10.8515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 4.0, 8.0, 6.0, 16.0, 5.0, 8.0, 19.0, 9.0, 19.0, 23.0, 15.0, 24.0, 35.0, 35.0, 30.0, 41.0, 46.0, 49.0, 87.0, 199.0, 354.0, 361.0, 145.0, 56.0, 43.0, 32.0, 32.0, 49.0, 33.0, 34.0, 21.0, 22.0, 19.0, 23.0, 18.0, 15.0, 16.0, 10.0, 14.0, 8.0, 6.0, 7.0, 3.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-34.84375, -33.75830078125, -32.6728515625, -31.58740234375, -30.501953125, -29.41650390625, -28.3310546875, -27.24560546875, -26.16015625, -25.07470703125, -23.9892578125, -22.90380859375, -21.818359375, -20.73291015625, -19.6474609375, -18.56201171875, -17.4765625, -16.39111328125, -15.3056640625, -14.22021484375, -13.134765625, -12.04931640625, -10.9638671875, -9.87841796875, -8.79296875, -7.70751953125, -6.6220703125, -5.53662109375, -4.451171875, -3.36572265625, -2.2802734375, -1.19482421875, -0.109375, 0.97607421875, 2.0615234375, 3.14697265625, 4.232421875, 5.31787109375, 6.4033203125, 7.48876953125, 8.57421875, 9.65966796875, 10.7451171875, 11.83056640625, 12.916015625, 14.00146484375, 15.0869140625, 16.17236328125, 17.2578125, 18.34326171875, 19.4287109375, 20.51416015625, 21.599609375, 22.68505859375, 23.7705078125, 24.85595703125, 25.94140625, 27.02685546875, 28.1123046875, 29.19775390625, 30.283203125, 31.36865234375, 32.4541015625, 33.53955078125, 34.625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 8.0, 24.0, 34.0, 44.0, 95.0, 154.0, 266.0, 466.0, 817.0, 1450.0, 2442.0, 4272.0, 7893.0, 13934.0, 24792.0, 43255.0, 74332.0, 126022.0, 208800.0, 334919.0, 646842.0, 2752526.0, 1040173.0, 400537.0, 246183.0, 150989.0, 90207.0, 51521.0, 29778.0, 16807.0, 9778.0, 5296.0, 2904.0, 1596.0, 914.0, 576.0, 315.0, 177.0, 109.0, 70.0, 37.0, 34.0, 12.0, 19.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.4296875, -10.1199951171875, -9.810302734375, -9.5006103515625, -9.19091796875, -8.8812255859375, -8.571533203125, -8.2618408203125, -7.9521484375, -7.6424560546875, -7.332763671875, -7.0230712890625, -6.71337890625, -6.4036865234375, -6.093994140625, -5.7843017578125, -5.474609375, -5.1649169921875, -4.855224609375, -4.5455322265625, -4.23583984375, -3.9261474609375, -3.616455078125, -3.3067626953125, -2.9970703125, -2.6873779296875, -2.377685546875, -2.0679931640625, -1.75830078125, -1.4486083984375, -1.138916015625, -0.8292236328125, -0.51953125, -0.2098388671875, 0.099853515625, 0.4095458984375, 0.71923828125, 1.0289306640625, 1.338623046875, 1.6483154296875, 1.9580078125, 2.2677001953125, 2.577392578125, 2.8870849609375, 3.19677734375, 3.5064697265625, 3.816162109375, 4.1258544921875, 4.435546875, 4.7452392578125, 5.054931640625, 5.3646240234375, 5.67431640625, 5.9840087890625, 6.293701171875, 6.6033935546875, 6.9130859375, 7.2227783203125, 7.532470703125, 7.8421630859375, 8.15185546875, 8.4615478515625, 8.771240234375, 9.0809326171875, 9.390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 7.0, 6.0, 1.0, 5.0, 10.0, 8.0, 17.0, 10.0, 13.0, 21.0, 17.0, 20.0, 27.0, 20.0, 30.0, 27.0, 31.0, 34.0, 33.0, 39.0, 86.0, 194.0, 513.0, 312.0, 95.0, 53.0, 34.0, 32.0, 37.0, 43.0, 35.0, 23.0, 25.0, 23.0, 29.0, 17.0, 13.0, 10.0, 10.0, 11.0, 10.0, 12.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-38.78125, -37.48291015625, -36.1845703125, -34.88623046875, -33.587890625, -32.28955078125, -30.9912109375, -29.69287109375, -28.39453125, -27.09619140625, -25.7978515625, -24.49951171875, -23.201171875, -21.90283203125, -20.6044921875, -19.30615234375, -18.0078125, -16.70947265625, -15.4111328125, -14.11279296875, -12.814453125, -11.51611328125, -10.2177734375, -8.91943359375, -7.62109375, -6.32275390625, -5.0244140625, -3.72607421875, -2.427734375, -1.12939453125, 0.1689453125, 1.46728515625, 2.765625, 4.06396484375, 5.3623046875, 6.66064453125, 7.958984375, 9.25732421875, 10.5556640625, 11.85400390625, 13.15234375, 14.45068359375, 15.7490234375, 17.04736328125, 18.345703125, 19.64404296875, 20.9423828125, 22.24072265625, 23.5390625, 24.83740234375, 26.1357421875, 27.43408203125, 28.732421875, 30.03076171875, 31.3291015625, 32.62744140625, 33.92578125, 35.22412109375, 36.5224609375, 37.82080078125, 39.119140625, 40.41748046875, 41.7158203125, 43.01416015625, 44.3125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 6.0, 12.0, 11.0, 17.0, 25.0, 40.0, 54.0, 70.0, 102.0, 136.0, 234.0, 283.0, 474.0, 620.0, 912.0, 1301.0, 1977.0, 2969.0, 4372.0, 6650.0, 10072.0, 15180.0, 23323.0, 36299.0, 59569.0, 110446.0, 5058934.0, 688596.0, 106428.0, 57757.0, 36137.0, 23169.0, 14896.0, 9649.0, 6570.0, 4570.0, 3017.0, 1981.0, 1462.0, 954.0, 662.0, 453.0, 326.0, 227.0, 169.0, 84.0, 79.0, 37.0, 34.0, 25.0, 27.0, 10.0, 8.0, 13.0, 9.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-24.84375, -24.04150390625, -23.2392578125, -22.43701171875, -21.634765625, -20.83251953125, -20.0302734375, -19.22802734375, -18.42578125, -17.62353515625, -16.8212890625, -16.01904296875, -15.216796875, -14.41455078125, -13.6123046875, -12.81005859375, -12.0078125, -11.20556640625, -10.4033203125, -9.60107421875, -8.798828125, -7.99658203125, -7.1943359375, -6.39208984375, -5.58984375, -4.78759765625, -3.9853515625, -3.18310546875, -2.380859375, -1.57861328125, -0.7763671875, 0.02587890625, 0.828125, 1.63037109375, 2.4326171875, 3.23486328125, 4.037109375, 4.83935546875, 5.6416015625, 6.44384765625, 7.24609375, 8.04833984375, 8.8505859375, 9.65283203125, 10.455078125, 11.25732421875, 12.0595703125, 12.86181640625, 13.6640625, 14.46630859375, 15.2685546875, 16.07080078125, 16.873046875, 17.67529296875, 18.4775390625, 19.27978515625, 20.08203125, 20.88427734375, 21.6865234375, 22.48876953125, 23.291015625, 24.09326171875, 24.8955078125, 25.69775390625, 26.5]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 10.0, 20.0, 14.0, 13.0, 13.0, 17.0, 17.0, 18.0, 32.0, 28.0, 35.0, 45.0, 39.0, 49.0, 54.0, 202.0, 737.0, 201.0, 57.0, 58.0, 37.0, 46.0, 39.0, 26.0, 39.0, 22.0, 28.0, 18.0, 24.0, 15.0, 14.0, 12.0, 6.0, 6.0, 4.0, 9.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-69.3125, -67.1865234375, -65.060546875, -62.9345703125, -60.80859375, -58.6826171875, -56.556640625, -54.4306640625, -52.3046875, -50.1787109375, -48.052734375, -45.9267578125, -43.80078125, -41.6748046875, -39.548828125, -37.4228515625, -35.296875, -33.1708984375, -31.044921875, -28.9189453125, -26.79296875, -24.6669921875, -22.541015625, -20.4150390625, -18.2890625, -16.1630859375, -14.037109375, -11.9111328125, -9.78515625, -7.6591796875, -5.533203125, -3.4072265625, -1.28125, 0.8447265625, 2.970703125, 5.0966796875, 7.22265625, 9.3486328125, 11.474609375, 13.6005859375, 15.7265625, 17.8525390625, 19.978515625, 22.1044921875, 24.23046875, 26.3564453125, 28.482421875, 30.6083984375, 32.734375, 34.8603515625, 36.986328125, 39.1123046875, 41.23828125, 43.3642578125, 45.490234375, 47.6162109375, 49.7421875, 51.8681640625, 53.994140625, 56.1201171875, 58.24609375, 60.3720703125, 62.498046875, 64.6240234375, 66.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 8.0, 5.0, 10.0, 19.0, 36.0, 42.0, 122.0, 489.0, 133.0, 58.0, 24.0, 23.0, 9.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-973.1376953125, -944.1845092773438, -915.2312622070312, -886.278076171875, -857.3248901367188, -828.3717041015625, -799.41845703125, -770.4652709960938, -741.5120849609375, -712.5588989257812, -683.6056518554688, -654.6524658203125, -625.6992797851562, -596.74609375, -567.7928466796875, -538.8396606445312, -509.8864440917969, -480.9332275390625, -451.98004150390625, -423.0268249511719, -394.0736389160156, -365.12042236328125, -336.167236328125, -307.2140197753906, -278.26080322265625, -249.30760192871094, -220.35440063476562, -191.40118408203125, -162.447998046875, -133.49478149414062, -104.54158020019531, -75.58837890625, -46.63519287109375, -17.681989669799805, 11.27121353149414, 40.22441864013672, 69.17761993408203, 98.13082885742188, 127.08403015136719, 156.0372314453125, 184.9904327392578, 213.94363403320312, 242.89683532714844, 271.85003662109375, 300.8032531738281, 329.7564697265625, 358.70965576171875, 387.662841796875, 416.6160583496094, 445.56927490234375, 474.5224609375, 503.4756774902344, 532.4288940429688, 561.382080078125, 590.3352661132812, 619.2884521484375, 648.24169921875, 677.1948852539062, 706.1481323242188, 735.101318359375, 764.0545043945312, 793.0076904296875, 821.9609375, 850.9141235351562, 879.8673095703125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 7.0, 10.0, 11.0, 17.0, 18.0, 30.0, 50.0, 82.0, 231.0, 263.0, 66.0, 63.0, 31.0, 23.0, 13.0, 9.0, 5.0, 10.0, 10.0, 5.0, 6.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-990.4898681640625, -958.5414428710938, -926.593017578125, -894.64453125, -862.6961059570312, -830.7476806640625, -798.7992553710938, -766.850830078125, -734.90234375, -702.9539184570312, -671.0054931640625, -639.0570068359375, -607.1085815429688, -575.16015625, -543.2117309570312, -511.2633056640625, -479.31488037109375, -447.366455078125, -415.4179992675781, -383.4695739746094, -351.5211181640625, -319.57269287109375, -287.624267578125, -255.6758270263672, -223.72738647460938, -191.77894592285156, -159.83050537109375, -127.882080078125, -95.93363952636719, -63.985198974609375, -32.036773681640625, -0.0883331298828125, 31.860107421875, 63.80854415893555, 95.7569808959961, 127.70541381835938, 159.6538543701172, 191.602294921875, 223.55072021484375, 255.49916076660156, 287.4476013183594, 319.3960266113281, 351.344482421875, 383.29290771484375, 415.2413330078125, 447.1897888183594, 479.1382141113281, 511.086669921875, 543.0350952148438, 574.9835205078125, 606.9319458007812, 638.88037109375, 670.828857421875, 702.7772827148438, 734.7257080078125, 766.6741333007812, 798.62255859375, 830.5709838867188, 862.5194091796875, 894.4678955078125, 926.4163208007812, 958.36474609375, 990.3131713867188, 1022.2615966796875, 1054.2100830078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 13.0, 9.0, 30.0, 29.0, 52.0, 76.0, 120.0, 179.0, 266.0, 336.0, 579.0, 978.0, 1482.0, 2341.0, 3889.0, 6932.0, 13450.0, 27790.0, 69558.0, 355910.0, 3479609.0, 126428.0, 48347.0, 23413.0, 12720.0, 7195.0, 4493.0, 2645.0, 1795.0, 1130.0, 743.0, 561.0, 362.0, 220.0, 169.0, 147.0, 77.0, 57.0, 33.0, 28.0, 32.0, 17.0, 13.0, 10.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.44140625, -4.28955078125, -4.1376953125, -3.98583984375, -3.833984375, -3.68212890625, -3.5302734375, -3.37841796875, -3.2265625, -3.07470703125, -2.9228515625, -2.77099609375, -2.619140625, -2.46728515625, -2.3154296875, -2.16357421875, -2.01171875, -1.85986328125, -1.7080078125, -1.55615234375, -1.404296875, -1.25244140625, -1.1005859375, -0.94873046875, -0.796875, -0.64501953125, -0.4931640625, -0.34130859375, -0.189453125, -0.03759765625, 0.1142578125, 0.26611328125, 0.41796875, 0.56982421875, 0.7216796875, 0.87353515625, 1.025390625, 1.17724609375, 1.3291015625, 1.48095703125, 1.6328125, 1.78466796875, 1.9365234375, 2.08837890625, 2.240234375, 2.39208984375, 2.5439453125, 2.69580078125, 2.84765625, 2.99951171875, 3.1513671875, 3.30322265625, 3.455078125, 3.60693359375, 3.7587890625, 3.91064453125, 4.0625, 4.21435546875, 4.3662109375, 4.51806640625, 4.669921875, 4.82177734375, 4.9736328125, 5.12548828125, 5.27734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 9.0, 10.0, 9.0, 10.0, 23.0, 23.0, 44.0, 656.0, 73.0, 25.0, 13.0, 14.0, 9.0, 5.0, 8.0, 8.0, 6.0, 3.0, 1.0, 5.0, 5.0, 6.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.351898193359375, -1.30145263671875, -1.251007080078125, -1.2005615234375, -1.150115966796875, -1.09967041015625, -1.049224853515625, -0.998779296875, -0.948333740234375, -0.89788818359375, -0.847442626953125, -0.7969970703125, -0.746551513671875, -0.69610595703125, -0.645660400390625, -0.59521484375, -0.544769287109375, -0.49432373046875, -0.443878173828125, -0.3934326171875, -0.342987060546875, -0.29254150390625, -0.242095947265625, -0.191650390625, -0.141204833984375, -0.09075927734375, -0.040313720703125, 0.0101318359375, 0.060577392578125, 0.11102294921875, 0.161468505859375, 0.2119140625, 0.262359619140625, 0.31280517578125, 0.363250732421875, 0.4136962890625, 0.464141845703125, 0.51458740234375, 0.565032958984375, 0.615478515625, 0.665924072265625, 0.71636962890625, 0.766815185546875, 0.8172607421875, 0.867706298828125, 0.91815185546875, 0.968597412109375, 1.01904296875, 1.069488525390625, 1.11993408203125, 1.170379638671875, 1.2208251953125, 1.271270751953125, 1.32171630859375, 1.372161865234375, 1.422607421875, 1.473052978515625, 1.52349853515625, 1.573944091796875, 1.6243896484375, 1.674835205078125, 1.72528076171875, 1.775726318359375, 1.826171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 18.0, 24.0, 39.0, 50.0, 61.0, 101.0, 101.0, 184.0, 318.0, 449.0, 776.0, 1450.0, 2611.0, 5263.0, 11767.0, 28612.0, 79701.0, 266181.0, 1261261.0, 1972261.0, 385226.0, 108581.0, 38550.0, 15617.0, 7137.0, 3511.0, 1796.0, 952.0, 586.0, 362.0, 230.0, 155.0, 109.0, 64.0, 52.0, 37.0, 28.0, 12.0, 14.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.744140625, -3.627655029296875, -3.51116943359375, -3.394683837890625, -3.2781982421875, -3.161712646484375, -3.04522705078125, -2.928741455078125, -2.812255859375, -2.695770263671875, -2.57928466796875, -2.462799072265625, -2.3463134765625, -2.229827880859375, -2.11334228515625, -1.996856689453125, -1.88037109375, -1.763885498046875, -1.64739990234375, -1.530914306640625, -1.4144287109375, -1.297943115234375, -1.18145751953125, -1.064971923828125, -0.948486328125, -0.832000732421875, -0.71551513671875, -0.599029541015625, -0.4825439453125, -0.366058349609375, -0.24957275390625, -0.133087158203125, -0.0166015625, 0.099884033203125, 0.21636962890625, 0.332855224609375, 0.4493408203125, 0.565826416015625, 0.68231201171875, 0.798797607421875, 0.915283203125, 1.031768798828125, 1.14825439453125, 1.264739990234375, 1.3812255859375, 1.497711181640625, 1.61419677734375, 1.730682373046875, 1.84716796875, 1.963653564453125, 2.08013916015625, 2.196624755859375, 2.3131103515625, 2.429595947265625, 2.54608154296875, 2.662567138671875, 2.779052734375, 2.895538330078125, 3.01202392578125, 3.128509521484375, 3.2449951171875, 3.361480712890625, 3.47796630859375, 3.594451904296875, 3.7109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 3.0, 5.0, 9.0, 7.0, 14.0, 10.0, 25.0, 24.0, 30.0, 37.0, 48.0, 56.0, 77.0, 83.0, 103.0, 151.0, 195.0, 264.0, 350.0, 460.0, 573.0, 360.0, 279.0, 187.0, 168.0, 108.0, 79.0, 74.0, 45.0, 36.0, 36.0, 24.0, 36.0, 30.0, 15.0, 17.0, 13.0, 9.0, 9.0, 5.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.326171875, -1.2774658203125, -1.228759765625, -1.1800537109375, -1.13134765625, -1.0826416015625, -1.033935546875, -0.9852294921875, -0.9365234375, -0.8878173828125, -0.839111328125, -0.7904052734375, -0.74169921875, -0.6929931640625, -0.644287109375, -0.5955810546875, -0.546875, -0.4981689453125, -0.449462890625, -0.4007568359375, -0.35205078125, -0.3033447265625, -0.254638671875, -0.2059326171875, -0.1572265625, -0.1085205078125, -0.059814453125, -0.0111083984375, 0.03759765625, 0.0863037109375, 0.135009765625, 0.1837158203125, 0.232421875, 0.2811279296875, 0.329833984375, 0.3785400390625, 0.42724609375, 0.4759521484375, 0.524658203125, 0.5733642578125, 0.6220703125, 0.6707763671875, 0.719482421875, 0.7681884765625, 0.81689453125, 0.8656005859375, 0.914306640625, 0.9630126953125, 1.01171875, 1.0604248046875, 1.109130859375, 1.1578369140625, 1.20654296875, 1.2552490234375, 1.303955078125, 1.3526611328125, 1.4013671875, 1.4500732421875, 1.498779296875, 1.5474853515625, 1.59619140625, 1.6448974609375, 1.693603515625, 1.7423095703125, 1.791015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 9.0, 16.0, 40.0, 65.0, 111.0, 181.0, 211.0, 150.0, 106.0, 45.0, 23.0, 12.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.602636337280273, -23.034021377563477, -22.46540641784668, -21.896791458129883, -21.328176498413086, -20.75956153869629, -20.190946578979492, -19.622333526611328, -19.05371856689453, -18.485103607177734, -17.916488647460938, -17.34787368774414, -16.779258728027344, -16.210643768310547, -15.642029762268066, -15.07341480255127, -14.504798889160156, -13.93618392944336, -13.367568969726562, -12.798954010009766, -12.230339050292969, -11.661724090576172, -11.093110084533691, -10.524495124816895, -9.955880165100098, -9.3872652053833, -8.818650245666504, -8.250035285949707, -7.681420803070068, -7.1128058433532715, -6.544191360473633, -5.975576400756836, -5.4069623947143555, -4.838347434997559, -4.269732475280762, -3.701117992401123, -3.132503032684326, -2.5638880729675293, -1.9952733516693115, -1.4266586303710938, -0.8580436706542969, -0.28942883014678955, 0.2791860103607178, 0.8478008508682251, 1.4164156913757324, 1.9850306510925293, 2.553645372390747, 3.122260093688965, 3.6908750534057617, 4.259490013122559, 4.8281049728393555, 5.396719455718994, 5.965334415435791, 6.533949375152588, 7.102563858032227, 7.671178817749023, 8.23979377746582, 8.808408737182617, 9.377023696899414, 9.945638656616211, 10.514253616333008, 11.082868576049805, 11.651482582092285, 12.220097541809082, 12.788712501525879]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 12.0, 15.0, 17.0, 23.0, 20.0, 28.0, 33.0, 34.0, 50.0, 43.0, 49.0, 45.0, 49.0, 52.0, 58.0, 51.0, 51.0, 53.0, 55.0, 26.0, 35.0, 41.0, 30.0, 22.0, 16.0, 10.0, 19.0, 10.0, 6.0, 5.0, 4.0, 4.0, 1.0, 6.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4104642868042, -9.095338821411133, -8.78021240234375, -8.465086936950684, -8.1499605178833, -7.834834575653076, -7.519708633422852, -7.204583168029785, -6.889456748962402, -6.574330806732178, -6.259204864501953, -5.9440789222717285, -5.628952980041504, -5.313827037811279, -4.998701095581055, -4.683575630187988, -4.368449687957764, -4.053323745727539, -3.7381978034973145, -3.42307186126709, -3.1079459190368652, -2.7928199768066406, -2.477694272994995, -2.1625683307647705, -1.847442388534546, -1.5323164463043213, -1.2171905040740967, -0.9020646810531616, -0.586938738822937, -0.2718127965927124, 0.043313026428222656, 0.35843896865844727, 0.6735649108886719, 0.9886908531188965, 1.303816795349121, 1.6189426183700562, 1.9340685606002808, 2.249194622039795, 2.5643203258514404, 2.879446268081665, 3.1945722103118896, 3.5096981525421143, 3.824824094772339, 4.139949798583984, 4.455075740814209, 4.770201683044434, 5.085327625274658, 5.400453567504883, 5.715579509735107, 6.030705451965332, 6.345831394195557, 6.660957336425781, 6.976083278656006, 7.2912092208862305, 7.606334686279297, 7.92146110534668, 8.236586570739746, 8.551712036132812, 8.866838455200195, 9.181963920593262, 9.497090339660645, 9.812215805053711, 10.127342224121094, 10.44246768951416, 10.757594108581543]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 9.0, 15.0, 22.0, 36.0, 31.0, 56.0, 58.0, 100.0, 148.0, 171.0, 309.0, 421.0, 591.0, 960.0, 1423.0, 2303.0, 3656.0, 5781.0, 10277.0, 18446.0, 39971.0, 410275.0, 465898.0, 41551.0, 18900.0, 10369.0, 6204.0, 3797.0, 2302.0, 1427.0, 976.0, 650.0, 436.0, 298.0, 184.0, 143.0, 118.0, 57.0, 55.0, 34.0, 23.0, 24.0, 20.0, 9.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.6796875, -4.5379638671875, -4.396240234375, -4.2545166015625, -4.11279296875, -3.9710693359375, -3.829345703125, -3.6876220703125, -3.5458984375, -3.4041748046875, -3.262451171875, -3.1207275390625, -2.97900390625, -2.8372802734375, -2.695556640625, -2.5538330078125, -2.412109375, -2.2703857421875, -2.128662109375, -1.9869384765625, -1.84521484375, -1.7034912109375, -1.561767578125, -1.4200439453125, -1.2783203125, -1.1365966796875, -0.994873046875, -0.8531494140625, -0.71142578125, -0.5697021484375, -0.427978515625, -0.2862548828125, -0.14453125, -0.0028076171875, 0.138916015625, 0.2806396484375, 0.42236328125, 0.5640869140625, 0.705810546875, 0.8475341796875, 0.9892578125, 1.1309814453125, 1.272705078125, 1.4144287109375, 1.55615234375, 1.6978759765625, 1.839599609375, 1.9813232421875, 2.123046875, 2.2647705078125, 2.406494140625, 2.5482177734375, 2.68994140625, 2.8316650390625, 2.973388671875, 3.1151123046875, 3.2568359375, 3.3985595703125, 3.540283203125, 3.6820068359375, 3.82373046875, 3.9654541015625, 4.107177734375, 4.2489013671875, 4.390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 7.0, 1.0, 3.0, 7.0, 8.0, 9.0, 14.0, 27.0, 50.0, 160.0, 328.0, 204.0, 55.0, 24.0, 14.0, 12.0, 14.0, 6.0, 7.0, 5.0, 4.0, 6.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5087890625, -1.458251953125, -1.40771484375, -1.357177734375, -1.306640625, -1.256103515625, -1.20556640625, -1.155029296875, -1.1044921875, -1.053955078125, -1.00341796875, -0.952880859375, -0.90234375, -0.851806640625, -0.80126953125, -0.750732421875, -0.7001953125, -0.649658203125, -0.59912109375, -0.548583984375, -0.498046875, -0.447509765625, -0.39697265625, -0.346435546875, -0.2958984375, -0.245361328125, -0.19482421875, -0.144287109375, -0.09375, -0.043212890625, 0.00732421875, 0.057861328125, 0.1083984375, 0.158935546875, 0.20947265625, 0.260009765625, 0.310546875, 0.361083984375, 0.41162109375, 0.462158203125, 0.5126953125, 0.563232421875, 0.61376953125, 0.664306640625, 0.71484375, 0.765380859375, 0.81591796875, 0.866455078125, 0.9169921875, 0.967529296875, 1.01806640625, 1.068603515625, 1.119140625, 1.169677734375, 1.22021484375, 1.270751953125, 1.3212890625, 1.371826171875, 1.42236328125, 1.472900390625, 1.5234375, 1.573974609375, 1.62451171875, 1.675048828125, 1.7255859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 8.0, 12.0, 11.0, 26.0, 29.0, 39.0, 87.0, 143.0, 379.0, 1302.0, 6247.0, 38724.0, 391215.0, 544776.0, 54972.0, 7896.0, 1773.0, 504.0, 182.0, 70.0, 49.0, 32.0, 19.0, 17.0, 8.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.6640625, -11.288818359375, -10.91357421875, -10.538330078125, -10.1630859375, -9.787841796875, -9.41259765625, -9.037353515625, -8.662109375, -8.286865234375, -7.91162109375, -7.536376953125, -7.1611328125, -6.785888671875, -6.41064453125, -6.035400390625, -5.66015625, -5.284912109375, -4.90966796875, -4.534423828125, -4.1591796875, -3.783935546875, -3.40869140625, -3.033447265625, -2.658203125, -2.282958984375, -1.90771484375, -1.532470703125, -1.1572265625, -0.781982421875, -0.40673828125, -0.031494140625, 0.34375, 0.718994140625, 1.09423828125, 1.469482421875, 1.8447265625, 2.219970703125, 2.59521484375, 2.970458984375, 3.345703125, 3.720947265625, 4.09619140625, 4.471435546875, 4.8466796875, 5.221923828125, 5.59716796875, 5.972412109375, 6.34765625, 6.722900390625, 7.09814453125, 7.473388671875, 7.8486328125, 8.223876953125, 8.59912109375, 8.974365234375, 9.349609375, 9.724853515625, 10.10009765625, 10.475341796875, 10.8505859375, 11.225830078125, 11.60107421875, 11.976318359375, 12.3515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 2.0, 9.0, 7.0, 5.0, 9.0, 19.0, 16.0, 22.0, 25.0, 29.0, 30.0, 26.0, 30.0, 36.0, 43.0, 37.0, 52.0, 37.0, 45.0, 48.0, 41.0, 46.0, 31.0, 48.0, 36.0, 36.0, 30.0, 26.0, 25.0, 32.0, 21.0, 18.0, 19.0, 14.0, 10.0, 11.0, 6.0, 3.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.21875, -7.01922607421875, -6.8197021484375, -6.62017822265625, -6.420654296875, -6.22113037109375, -6.0216064453125, -5.82208251953125, -5.62255859375, -5.42303466796875, -5.2235107421875, -5.02398681640625, -4.824462890625, -4.62493896484375, -4.4254150390625, -4.22589111328125, -4.0263671875, -3.82684326171875, -3.6273193359375, -3.42779541015625, -3.228271484375, -3.02874755859375, -2.8292236328125, -2.62969970703125, -2.43017578125, -2.23065185546875, -2.0311279296875, -1.83160400390625, -1.632080078125, -1.43255615234375, -1.2330322265625, -1.03350830078125, -0.833984375, -0.63446044921875, -0.4349365234375, -0.23541259765625, -0.035888671875, 0.16363525390625, 0.3631591796875, 0.56268310546875, 0.76220703125, 0.96173095703125, 1.1612548828125, 1.36077880859375, 1.560302734375, 1.75982666015625, 1.9593505859375, 2.15887451171875, 2.3583984375, 2.55792236328125, 2.7574462890625, 2.95697021484375, 3.156494140625, 3.35601806640625, 3.5555419921875, 3.75506591796875, 3.95458984375, 4.15411376953125, 4.3536376953125, 4.55316162109375, 4.752685546875, 4.95220947265625, 5.1517333984375, 5.35125732421875, 5.55078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 6.0, 10.0, 10.0, 15.0, 19.0, 33.0, 40.0, 78.0, 133.0, 253.0, 545.0, 1582.0, 7334.0, 255132.0, 769470.0, 10494.0, 2047.0, 697.0, 269.0, 144.0, 78.0, 51.0, 33.0, 22.0, 19.0, 10.0, 15.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8858642578125, -13.373291015625, -12.8607177734375, -12.34814453125, -11.8355712890625, -11.322998046875, -10.8104248046875, -10.2978515625, -9.7852783203125, -9.272705078125, -8.7601318359375, -8.24755859375, -7.7349853515625, -7.222412109375, -6.7098388671875, -6.197265625, -5.6846923828125, -5.172119140625, -4.6595458984375, -4.14697265625, -3.6343994140625, -3.121826171875, -2.6092529296875, -2.0966796875, -1.5841064453125, -1.071533203125, -0.5589599609375, -0.04638671875, 0.4661865234375, 0.978759765625, 1.4913330078125, 2.00390625, 2.5164794921875, 3.029052734375, 3.5416259765625, 4.05419921875, 4.5667724609375, 5.079345703125, 5.5919189453125, 6.1044921875, 6.6170654296875, 7.129638671875, 7.6422119140625, 8.15478515625, 8.6673583984375, 9.179931640625, 9.6925048828125, 10.205078125, 10.7176513671875, 11.230224609375, 11.7427978515625, 12.25537109375, 12.7679443359375, 13.280517578125, 13.7930908203125, 14.3056640625, 14.8182373046875, 15.330810546875, 15.8433837890625, 16.35595703125, 16.8685302734375, 17.381103515625, 17.8936767578125, 18.40625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 9.0, 6.0, 5.0, 5.0, 8.0, 17.0, 23.0, 21.0, 30.0, 45.0, 50.0, 58.0, 65.0, 93.0, 58.0, 90.0, 93.0, 73.0, 57.0, 43.0, 32.0, 27.0, 26.0, 18.0, 12.0, 11.0, 7.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00022339820861816406, -0.00021733343601226807, -0.00021126866340637207, -0.00020520389080047607, -0.00019913911819458008, -0.00019307434558868408, -0.00018700957298278809, -0.0001809448003768921, -0.0001748800277709961, -0.0001688152551651001, -0.0001627504825592041, -0.0001566857099533081, -0.0001506209373474121, -0.0001445561647415161, -0.00013849139213562012, -0.00013242661952972412, -0.00012636184692382812, -0.00012029707431793213, -0.00011423230171203613, -0.00010816752910614014, -0.00010210275650024414, -9.603798389434814e-05, -8.997321128845215e-05, -8.390843868255615e-05, -7.784366607666016e-05, -7.177889347076416e-05, -6.571412086486816e-05, -5.964934825897217e-05, -5.358457565307617e-05, -4.7519803047180176e-05, -4.145503044128418e-05, -3.5390257835388184e-05, -2.9325485229492188e-05, -2.326071262359619e-05, -1.7195940017700195e-05, -1.11311674118042e-05, -5.066394805908203e-06, 9.98377799987793e-07, 7.063150405883789e-06, 1.3127923011779785e-05, 1.919269561767578e-05, 2.5257468223571777e-05, 3.1322240829467773e-05, 3.738701343536377e-05, 4.3451786041259766e-05, 4.951655864715576e-05, 5.558133125305176e-05, 6.164610385894775e-05, 6.771087646484375e-05, 7.377564907073975e-05, 7.984042167663574e-05, 8.590519428253174e-05, 9.196996688842773e-05, 9.803473949432373e-05, 0.00010409951210021973, 0.00011016428470611572, 0.00011622905731201172, 0.00012229382991790771, 0.0001283586025238037, 0.0001344233751296997, 0.0001404881477355957, 0.0001465529203414917, 0.0001526176929473877, 0.0001586824655532837, 0.0001647472381591797]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 20.0, 20.0, 23.0, 41.0, 47.0, 78.0, 98.0, 166.0, 267.0, 408.0, 690.0, 1239.0, 2408.0, 5085.0, 12348.0, 39309.0, 193371.0, 593964.0, 146467.0, 32322.0, 10891.0, 4429.0, 2107.0, 1115.0, 633.0, 335.0, 206.0, 148.0, 99.0, 62.0, 46.0, 26.0, 21.0, 16.0, 10.0, 12.0, 10.0, 0.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.03009033203125, -3.8883056640625, -3.74652099609375, -3.604736328125, -3.46295166015625, -3.3211669921875, -3.17938232421875, -3.03759765625, -2.89581298828125, -2.7540283203125, -2.61224365234375, -2.470458984375, -2.32867431640625, -2.1868896484375, -2.04510498046875, -1.9033203125, -1.76153564453125, -1.6197509765625, -1.47796630859375, -1.336181640625, -1.19439697265625, -1.0526123046875, -0.91082763671875, -0.76904296875, -0.62725830078125, -0.4854736328125, -0.34368896484375, -0.201904296875, -0.06011962890625, 0.0816650390625, 0.22344970703125, 0.365234375, 0.50701904296875, 0.6488037109375, 0.79058837890625, 0.932373046875, 1.07415771484375, 1.2159423828125, 1.35772705078125, 1.49951171875, 1.64129638671875, 1.7830810546875, 1.92486572265625, 2.066650390625, 2.20843505859375, 2.3502197265625, 2.49200439453125, 2.6337890625, 2.77557373046875, 2.9173583984375, 3.05914306640625, 3.200927734375, 3.34271240234375, 3.4844970703125, 3.62628173828125, 3.76806640625, 3.90985107421875, 4.0516357421875, 4.19342041015625, 4.335205078125, 4.47698974609375, 4.6187744140625, 4.76055908203125, 4.90234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 2.0, 7.0, 7.0, 13.0, 28.0, 16.0, 43.0, 40.0, 47.0, 73.0, 98.0, 75.0, 66.0, 92.0, 75.0, 73.0, 59.0, 45.0, 25.0, 27.0, 22.0, 13.0, 10.0, 6.0, 7.0, 7.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.76171875, -5.6019287109375, -5.442138671875, -5.2823486328125, -5.12255859375, -4.9627685546875, -4.802978515625, -4.6431884765625, -4.4833984375, -4.3236083984375, -4.163818359375, -4.0040283203125, -3.84423828125, -3.6844482421875, -3.524658203125, -3.3648681640625, -3.205078125, -3.0452880859375, -2.885498046875, -2.7257080078125, -2.56591796875, -2.4061279296875, -2.246337890625, -2.0865478515625, -1.9267578125, -1.7669677734375, -1.607177734375, -1.4473876953125, -1.28759765625, -1.1278076171875, -0.968017578125, -0.8082275390625, -0.6484375, -0.4886474609375, -0.328857421875, -0.1690673828125, -0.00927734375, 0.1505126953125, 0.310302734375, 0.4700927734375, 0.6298828125, 0.7896728515625, 0.949462890625, 1.1092529296875, 1.26904296875, 1.4288330078125, 1.588623046875, 1.7484130859375, 1.908203125, 2.0679931640625, 2.227783203125, 2.3875732421875, 2.54736328125, 2.7071533203125, 2.866943359375, 3.0267333984375, 3.1865234375, 3.3463134765625, 3.506103515625, 3.6658935546875, 3.82568359375, 3.9854736328125, 4.145263671875, 4.3050537109375, 4.46484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 8.0, 17.0, 35.0, 73.0, 105.0, 216.0, 251.0, 140.0, 55.0, 32.0, 17.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-83.91691589355469, -81.30899810791016, -78.70108032226562, -76.0931625366211, -73.48524475097656, -70.87732696533203, -68.2694091796875, -65.66148376464844, -63.05356979370117, -60.44565200805664, -57.83773422241211, -55.22981643676758, -52.62189483642578, -50.01397705078125, -47.40605926513672, -44.79814147949219, -42.190223693847656, -39.582305908203125, -36.974388122558594, -34.36647033691406, -31.7585506439209, -29.150632858276367, -26.542713165283203, -23.934795379638672, -21.32687759399414, -18.71895980834961, -16.111042022705078, -13.503122329711914, -10.895204544067383, -8.287286758422852, -5.679368019104004, -3.0714492797851562, -0.463531494140625, 2.1443867683410645, 4.752305030822754, 7.360223293304443, 9.968141555786133, 12.576059341430664, 15.183978080749512, 17.79189682006836, 20.39981460571289, 23.007732391357422, 25.615650177001953, 28.223569869995117, 30.83148765563965, 33.43940734863281, 36.047325134277344, 38.655242919921875, 41.263160705566406, 43.87107849121094, 46.47899627685547, 49.0869140625, 51.69483184814453, 54.30274963378906, 56.91067123413086, 59.51858901977539, 62.12650680541992, 64.73442840576172, 67.34234619140625, 69.95026397705078, 72.55818176269531, 75.16609954833984, 77.77401733398438, 80.3819351196289, 82.98985290527344]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 7.0, 7.0, 11.0, 33.0, 69.0, 110.0, 180.0, 171.0, 132.0, 93.0, 46.0, 37.0, 17.0, 10.0, 8.0, 7.0, 5.0, 7.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-161.29098510742188, -157.19085693359375, -153.09072875976562, -148.99058532714844, -144.8904571533203, -140.7903289794922, -136.69020080566406, -132.59005737304688, -128.48992919921875, -124.38980102539062, -120.28966522216797, -116.18953704833984, -112.08940124511719, -107.98927307128906, -103.88914489746094, -99.78900909423828, -95.68888092041016, -91.58875274658203, -87.48861694335938, -83.38848876953125, -79.2883529663086, -75.18822479248047, -71.08808898925781, -66.98796081542969, -62.8878288269043, -58.787696838378906, -54.687564849853516, -50.587432861328125, -46.4873046875, -42.387168884277344, -38.28704071044922, -34.18690872192383, -30.086776733398438, -25.986644744873047, -21.886512756347656, -17.7863826751709, -13.686250686645508, -9.586118698120117, -5.485988616943359, -1.3858566284179688, 2.714275360107422, 6.814406871795654, 10.914538383483887, 15.014669418334961, 19.11480140686035, 23.214933395385742, 27.3150634765625, 31.41519546508789, 35.51532745361328, 39.61545944213867, 43.71559143066406, 47.81571960449219, 51.915855407714844, 56.01598358154297, 60.11611557006836, 64.21624755859375, 68.31637573242188, 72.41650390625, 76.51663970947266, 80.61676788330078, 84.71690368652344, 88.81703186035156, 92.91716003417969, 97.01729583740234, 101.117431640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 17.0, 19.0, 34.0, 35.0, 55.0, 66.0, 121.0, 211.0, 326.0, 567.0, 1065.0, 2156.0, 5061.0, 15492.0, 78502.0, 3841301.0, 206277.0, 26945.0, 8507.0, 3570.0, 1697.0, 888.0, 521.0, 270.0, 192.0, 95.0, 72.0, 48.0, 38.0, 31.0, 17.0, 13.0, 6.0, 13.0, 5.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.984375, -20.379150390625, -19.77392578125, -19.168701171875, -18.5634765625, -17.958251953125, -17.35302734375, -16.747802734375, -16.142578125, -15.537353515625, -14.93212890625, -14.326904296875, -13.7216796875, -13.116455078125, -12.51123046875, -11.906005859375, -11.30078125, -10.695556640625, -10.09033203125, -9.485107421875, -8.8798828125, -8.274658203125, -7.66943359375, -7.064208984375, -6.458984375, -5.853759765625, -5.24853515625, -4.643310546875, -4.0380859375, -3.432861328125, -2.82763671875, -2.222412109375, -1.6171875, -1.011962890625, -0.40673828125, 0.198486328125, 0.8037109375, 1.408935546875, 2.01416015625, 2.619384765625, 3.224609375, 3.829833984375, 4.43505859375, 5.040283203125, 5.6455078125, 6.250732421875, 6.85595703125, 7.461181640625, 8.06640625, 8.671630859375, 9.27685546875, 9.882080078125, 10.4873046875, 11.092529296875, 11.69775390625, 12.302978515625, 12.908203125, 13.513427734375, 14.11865234375, 14.723876953125, 15.3291015625, 15.934326171875, 16.53955078125, 17.144775390625, 17.75]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 4.0, 4.0, 5.0, 6.0, 12.0, 14.0, 15.0, 15.0, 32.0, 58.0, 154.0, 209.0, 157.0, 112.0, 56.0, 44.0, 16.0, 9.0, 10.0, 12.0, 8.0, 11.0, 5.0, 3.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.7060546875, -1.660064697265625, -1.61407470703125, -1.568084716796875, -1.5220947265625, -1.476104736328125, -1.43011474609375, -1.384124755859375, -1.338134765625, -1.292144775390625, -1.24615478515625, -1.200164794921875, -1.1541748046875, -1.108184814453125, -1.06219482421875, -1.016204833984375, -0.97021484375, -0.924224853515625, -0.87823486328125, -0.832244873046875, -0.7862548828125, -0.740264892578125, -0.69427490234375, -0.648284912109375, -0.602294921875, -0.556304931640625, -0.51031494140625, -0.464324951171875, -0.4183349609375, -0.372344970703125, -0.32635498046875, -0.280364990234375, -0.234375, -0.188385009765625, -0.14239501953125, -0.096405029296875, -0.0504150390625, -0.004425048828125, 0.04156494140625, 0.087554931640625, 0.133544921875, 0.179534912109375, 0.22552490234375, 0.271514892578125, 0.3175048828125, 0.363494873046875, 0.40948486328125, 0.455474853515625, 0.50146484375, 0.547454833984375, 0.59344482421875, 0.639434814453125, 0.6854248046875, 0.731414794921875, 0.77740478515625, 0.823394775390625, 0.869384765625, 0.915374755859375, 0.96136474609375, 1.007354736328125, 1.0533447265625, 1.099334716796875, 1.14532470703125, 1.191314697265625, 1.2373046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 21.0, 21.0, 22.0, 29.0, 56.0, 97.0, 98.0, 166.0, 300.0, 445.0, 700.0, 1216.0, 2175.0, 4348.0, 9663.0, 24559.0, 77554.0, 398960.0, 3105888.0, 441558.0, 81715.0, 25364.0, 9693.0, 4451.0, 2239.0, 1210.0, 655.0, 385.0, 223.0, 145.0, 104.0, 73.0, 36.0, 30.0, 26.0, 14.0, 8.0, 10.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0], "bins": [-10.1015625, -9.83935546875, -9.5771484375, -9.31494140625, -9.052734375, -8.79052734375, -8.5283203125, -8.26611328125, -8.00390625, -7.74169921875, -7.4794921875, -7.21728515625, -6.955078125, -6.69287109375, -6.4306640625, -6.16845703125, -5.90625, -5.64404296875, -5.3818359375, -5.11962890625, -4.857421875, -4.59521484375, -4.3330078125, -4.07080078125, -3.80859375, -3.54638671875, -3.2841796875, -3.02197265625, -2.759765625, -2.49755859375, -2.2353515625, -1.97314453125, -1.7109375, -1.44873046875, -1.1865234375, -0.92431640625, -0.662109375, -0.39990234375, -0.1376953125, 0.12451171875, 0.38671875, 0.64892578125, 0.9111328125, 1.17333984375, 1.435546875, 1.69775390625, 1.9599609375, 2.22216796875, 2.484375, 2.74658203125, 3.0087890625, 3.27099609375, 3.533203125, 3.79541015625, 4.0576171875, 4.31982421875, 4.58203125, 4.84423828125, 5.1064453125, 5.36865234375, 5.630859375, 5.89306640625, 6.1552734375, 6.41748046875, 6.6796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 6.0, 5.0, 7.0, 7.0, 4.0, 18.0, 24.0, 33.0, 54.0, 71.0, 116.0, 198.0, 413.0, 995.0, 1229.0, 402.0, 191.0, 106.0, 60.0, 42.0, 18.0, 28.0, 15.0, 7.0, 4.0, 3.0, 8.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.671875, -2.603515625, -2.53515625, -2.466796875, -2.3984375, -2.330078125, -2.26171875, -2.193359375, -2.125, -2.056640625, -1.98828125, -1.919921875, -1.8515625, -1.783203125, -1.71484375, -1.646484375, -1.578125, -1.509765625, -1.44140625, -1.373046875, -1.3046875, -1.236328125, -1.16796875, -1.099609375, -1.03125, -0.962890625, -0.89453125, -0.826171875, -0.7578125, -0.689453125, -0.62109375, -0.552734375, -0.484375, -0.416015625, -0.34765625, -0.279296875, -0.2109375, -0.142578125, -0.07421875, -0.005859375, 0.0625, 0.130859375, 0.19921875, 0.267578125, 0.3359375, 0.404296875, 0.47265625, 0.541015625, 0.609375, 0.677734375, 0.74609375, 0.814453125, 0.8828125, 0.951171875, 1.01953125, 1.087890625, 1.15625, 1.224609375, 1.29296875, 1.361328125, 1.4296875, 1.498046875, 1.56640625, 1.634765625, 1.703125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 9.0, 20.0, 29.0, 54.0, 118.0, 228.0, 253.0, 174.0, 62.0, 27.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.096309661865234, -29.46102523803711, -28.825742721557617, -28.190458297729492, -27.555173873901367, -26.919889450073242, -26.28460693359375, -25.649322509765625, -25.0140380859375, -24.378753662109375, -23.743471145629883, -23.108186721801758, -22.472902297973633, -21.837617874145508, -21.202335357666016, -20.56705093383789, -19.931766510009766, -19.29648208618164, -18.66119956970215, -18.025915145874023, -17.3906307220459, -16.755346298217773, -16.12006378173828, -15.484779357910156, -14.849496841430664, -14.214213371276855, -13.57892894744873, -12.943645477294922, -12.308361053466797, -11.673077583312988, -11.03779411315918, -10.402509689331055, -9.767226219177246, -9.131942749023438, -8.496658325195312, -7.861374855041504, -7.226090431213379, -6.59080696105957, -5.9555230140686035, -5.320239067077637, -4.68495512008667, -4.049671173095703, -3.4143872261047363, -2.7791035175323486, -2.143819570541382, -1.508535623550415, -0.8732519149780273, -0.23796796798706055, 0.39731597900390625, 1.032599925994873, 1.6678837537765503, 2.3031675815582275, 2.9384515285491943, 3.573735475540161, 4.209019184112549, 4.844303131103516, 5.479587078094482, 6.114871025085449, 6.750154972076416, 7.385438919067383, 8.020722389221191, 8.656006813049316, 9.291290283203125, 9.92657470703125, 10.561858177185059]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 3.0, 9.0, 15.0, 10.0, 21.0, 25.0, 41.0, 43.0, 57.0, 67.0, 84.0, 82.0, 106.0, 82.0, 71.0, 65.0, 51.0, 38.0, 39.0, 21.0, 14.0, 8.0, 14.0, 9.0, 4.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.332693099975586, -9.962347030639648, -9.592000007629395, -9.221653938293457, -8.851306915283203, -8.480960845947266, -8.110613822937012, -7.740267753601074, -7.36992073059082, -6.999574184417725, -6.629227638244629, -6.258881092071533, -5.8885345458984375, -5.518187999725342, -5.147841453552246, -4.777495384216309, -4.407148838043213, -4.036802291870117, -3.6664557456970215, -3.296109199523926, -2.92576265335083, -2.5554161071777344, -2.1850697994232178, -1.814723253250122, -1.4443767070770264, -1.0740301609039307, -0.7036836743354797, -0.3333371877670288, 0.037009358406066895, 0.4073559045791626, 0.7777023315429688, 1.1480488777160645, 1.5183954238891602, 1.8887419700622559, 2.2590885162353516, 2.6294350624084473, 2.999781608581543, 3.3701281547546387, 3.7404744625091553, 4.110820770263672, 4.481167793273926, 4.8515143394470215, 5.221860885620117, 5.592207431793213, 5.962553977966309, 6.332900524139404, 6.7032470703125, 7.0735931396484375, 7.443939685821533, 7.814286231994629, 8.184632301330566, 8.55497932434082, 8.925325393676758, 9.295672416687012, 9.66601848602295, 10.036365509033203, 10.40671157836914, 10.777057647705078, 11.147404670715332, 11.51775074005127, 11.888097763061523, 12.258443832397461, 12.628790855407715, 12.999136924743652, 13.369483947753906]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 11.0, 16.0, 31.0, 50.0, 110.0, 176.0, 387.0, 1032.0, 3137.0, 15404.0, 220528.0, 766906.0, 32970.0, 5289.0, 1460.0, 531.0, 220.0, 113.0, 70.0, 47.0, 20.0, 12.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.765625, -22.07958984375, -21.3935546875, -20.70751953125, -20.021484375, -19.33544921875, -18.6494140625, -17.96337890625, -17.27734375, -16.59130859375, -15.9052734375, -15.21923828125, -14.533203125, -13.84716796875, -13.1611328125, -12.47509765625, -11.7890625, -11.10302734375, -10.4169921875, -9.73095703125, -9.044921875, -8.35888671875, -7.6728515625, -6.98681640625, -6.30078125, -5.61474609375, -4.9287109375, -4.24267578125, -3.556640625, -2.87060546875, -2.1845703125, -1.49853515625, -0.8125, -0.12646484375, 0.5595703125, 1.24560546875, 1.931640625, 2.61767578125, 3.3037109375, 3.98974609375, 4.67578125, 5.36181640625, 6.0478515625, 6.73388671875, 7.419921875, 8.10595703125, 8.7919921875, 9.47802734375, 10.1640625, 10.85009765625, 11.5361328125, 12.22216796875, 12.908203125, 13.59423828125, 14.2802734375, 14.96630859375, 15.65234375, 16.33837890625, 17.0244140625, 17.71044921875, 18.396484375, 19.08251953125, 19.7685546875, 20.45458984375, 21.140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 6.0, 10.0, 12.0, 10.0, 13.0, 22.0, 43.0, 87.0, 125.0, 154.0, 171.0, 122.0, 73.0, 50.0, 28.0, 16.0, 15.0, 11.0, 8.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3896484375, -1.3437347412109375, -1.297821044921875, -1.2519073486328125, -1.20599365234375, -1.1600799560546875, -1.114166259765625, -1.0682525634765625, -1.0223388671875, -0.9764251708984375, -0.930511474609375, -0.8845977783203125, -0.83868408203125, -0.7927703857421875, -0.746856689453125, -0.7009429931640625, -0.655029296875, -0.6091156005859375, -0.563201904296875, -0.5172882080078125, -0.47137451171875, -0.4254608154296875, -0.379547119140625, -0.3336334228515625, -0.2877197265625, -0.2418060302734375, -0.195892333984375, -0.1499786376953125, -0.10406494140625, -0.0581512451171875, -0.012237548828125, 0.0336761474609375, 0.07958984375, 0.1255035400390625, 0.171417236328125, 0.2173309326171875, 0.26324462890625, 0.3091583251953125, 0.355072021484375, 0.4009857177734375, 0.4468994140625, 0.4928131103515625, 0.538726806640625, 0.5846405029296875, 0.63055419921875, 0.6764678955078125, 0.722381591796875, 0.7682952880859375, 0.814208984375, 0.8601226806640625, 0.906036376953125, 0.9519500732421875, 0.99786376953125, 1.0437774658203125, 1.089691162109375, 1.1356048583984375, 1.1815185546875, 1.2274322509765625, 1.273345947265625, 1.3192596435546875, 1.36517333984375, 1.4110870361328125, 1.457000732421875, 1.5029144287109375, 1.548828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 7.0, 4.0, 8.0, 13.0, 33.0, 107.0, 531.0, 3834.0, 62807.0, 866760.0, 108090.0, 5394.0, 711.0, 146.0, 41.0, 13.0, 10.0, 8.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.371337890625, -17.78955078125, -17.207763671875, -16.6259765625, -16.044189453125, -15.46240234375, -14.880615234375, -14.298828125, -13.717041015625, -13.13525390625, -12.553466796875, -11.9716796875, -11.389892578125, -10.80810546875, -10.226318359375, -9.64453125, -9.062744140625, -8.48095703125, -7.899169921875, -7.3173828125, -6.735595703125, -6.15380859375, -5.572021484375, -4.990234375, -4.408447265625, -3.82666015625, -3.244873046875, -2.6630859375, -2.081298828125, -1.49951171875, -0.917724609375, -0.3359375, 0.245849609375, 0.82763671875, 1.409423828125, 1.9912109375, 2.572998046875, 3.15478515625, 3.736572265625, 4.318359375, 4.900146484375, 5.48193359375, 6.063720703125, 6.6455078125, 7.227294921875, 7.80908203125, 8.390869140625, 8.97265625, 9.554443359375, 10.13623046875, 10.718017578125, 11.2998046875, 11.881591796875, 12.46337890625, 13.045166015625, 13.626953125, 14.208740234375, 14.79052734375, 15.372314453125, 15.9541015625, 16.535888671875, 17.11767578125, 17.699462890625, 18.28125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 10.0, 10.0, 13.0, 11.0, 15.0, 21.0, 14.0, 28.0, 36.0, 28.0, 33.0, 30.0, 47.0, 41.0, 46.0, 56.0, 56.0, 51.0, 56.0, 50.0, 52.0, 48.0, 46.0, 33.0, 33.0, 25.0, 21.0, 21.0, 18.0, 14.0, 6.0, 5.0, 3.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.97772216796875, -3.8343505859375, -3.69097900390625, -3.547607421875, -3.40423583984375, -3.2608642578125, -3.11749267578125, -2.97412109375, -2.83074951171875, -2.6873779296875, -2.54400634765625, -2.400634765625, -2.25726318359375, -2.1138916015625, -1.97052001953125, -1.8271484375, -1.68377685546875, -1.5404052734375, -1.39703369140625, -1.253662109375, -1.11029052734375, -0.9669189453125, -0.82354736328125, -0.68017578125, -0.53680419921875, -0.3934326171875, -0.25006103515625, -0.106689453125, 0.03668212890625, 0.1800537109375, 0.32342529296875, 0.466796875, 0.61016845703125, 0.7535400390625, 0.89691162109375, 1.040283203125, 1.18365478515625, 1.3270263671875, 1.47039794921875, 1.61376953125, 1.75714111328125, 1.9005126953125, 2.04388427734375, 2.187255859375, 2.33062744140625, 2.4739990234375, 2.61737060546875, 2.7607421875, 2.90411376953125, 3.0474853515625, 3.19085693359375, 3.334228515625, 3.47760009765625, 3.6209716796875, 3.76434326171875, 3.90771484375, 4.05108642578125, 4.1944580078125, 4.33782958984375, 4.481201171875, 4.62457275390625, 4.7679443359375, 4.91131591796875, 5.0546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 11.0, 15.0, 30.0, 76.0, 185.0, 733.0, 4037.0, 155385.0, 878791.0, 7775.0, 1009.0, 265.0, 116.0, 47.0, 27.0, 15.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.25, -30.79296875, -29.3359375, -27.87890625, -26.421875, -24.96484375, -23.5078125, -22.05078125, -20.59375, -19.13671875, -17.6796875, -16.22265625, -14.765625, -13.30859375, -11.8515625, -10.39453125, -8.9375, -7.48046875, -6.0234375, -4.56640625, -3.109375, -1.65234375, -0.1953125, 1.26171875, 2.71875, 4.17578125, 5.6328125, 7.08984375, 8.546875, 10.00390625, 11.4609375, 12.91796875, 14.375, 15.83203125, 17.2890625, 18.74609375, 20.203125, 21.66015625, 23.1171875, 24.57421875, 26.03125, 27.48828125, 28.9453125, 30.40234375, 31.859375, 33.31640625, 34.7734375, 36.23046875, 37.6875, 39.14453125, 40.6015625, 42.05859375, 43.515625, 44.97265625, 46.4296875, 47.88671875, 49.34375, 50.80078125, 52.2578125, 53.71484375, 55.171875, 56.62890625, 58.0859375, 59.54296875, 61.0]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 7.0, 7.0, 1.0, 8.0, 14.0, 17.0, 29.0, 49.0, 79.0, 143.0, 241.0, 173.0, 87.0, 60.0, 27.0, 18.0, 13.0, 9.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012063980102539062, -0.0011773556470870972, -0.001148313283920288, -0.001119270920753479, -0.00109022855758667, -0.0010611861944198608, -0.0010321438312530518, -0.0010031014680862427, -0.0009740591049194336, -0.0009450167417526245, -0.0009159743785858154, -0.0008869320154190063, -0.0008578896522521973, -0.0008288472890853882, -0.0007998049259185791, -0.00077076256275177, -0.0007417201995849609, -0.0007126778364181519, -0.0006836354732513428, -0.0006545931100845337, -0.0006255507469177246, -0.0005965083837509155, -0.0005674660205841064, -0.0005384236574172974, -0.0005093812942504883, -0.0004803389310836792, -0.0004512965679168701, -0.00042225420475006104, -0.00039321184158325195, -0.00036416947841644287, -0.0003351271152496338, -0.0003060847520828247, -0.0002770423889160156, -0.00024800002574920654, -0.00021895766258239746, -0.00018991529941558838, -0.0001608729362487793, -0.00013183057308197021, -0.00010278820991516113, -7.374584674835205e-05, -4.470348358154297e-05, -1.5661120414733887e-05, 1.3381242752075195e-05, 4.242360591888428e-05, 7.146596908569336e-05, 0.00010050833225250244, 0.00012955069541931152, 0.0001585930585861206, 0.0001876354217529297, 0.00021667778491973877, 0.00024572014808654785, 0.00027476251125335693, 0.000303804874420166, 0.0003328472375869751, 0.0003618896007537842, 0.00039093196392059326, 0.00041997432708740234, 0.0004490166902542114, 0.0004780590534210205, 0.0005071014165878296, 0.0005361437797546387, 0.0005651861429214478, 0.0005942285060882568, 0.0006232708692550659, 0.000652313232421875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 5.0, 7.0, 18.0, 27.0, 45.0, 68.0, 130.0, 164.0, 272.0, 403.0, 686.0, 1204.0, 2242.0, 4320.0, 9727.0, 27851.0, 127414.0, 617365.0, 196164.0, 36843.0, 12159.0, 5148.0, 2682.0, 1410.0, 808.0, 493.0, 337.0, 197.0, 112.0, 75.0, 52.0, 40.0, 22.0, 22.0, 11.0, 3.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.88037109375, -9.5576171875, -9.23486328125, -8.912109375, -8.58935546875, -8.2666015625, -7.94384765625, -7.62109375, -7.29833984375, -6.9755859375, -6.65283203125, -6.330078125, -6.00732421875, -5.6845703125, -5.36181640625, -5.0390625, -4.71630859375, -4.3935546875, -4.07080078125, -3.748046875, -3.42529296875, -3.1025390625, -2.77978515625, -2.45703125, -2.13427734375, -1.8115234375, -1.48876953125, -1.166015625, -0.84326171875, -0.5205078125, -0.19775390625, 0.125, 0.44775390625, 0.7705078125, 1.09326171875, 1.416015625, 1.73876953125, 2.0615234375, 2.38427734375, 2.70703125, 3.02978515625, 3.3525390625, 3.67529296875, 3.998046875, 4.32080078125, 4.6435546875, 4.96630859375, 5.2890625, 5.61181640625, 5.9345703125, 6.25732421875, 6.580078125, 6.90283203125, 7.2255859375, 7.54833984375, 7.87109375, 8.19384765625, 8.5166015625, 8.83935546875, 9.162109375, 9.48486328125, 9.8076171875, 10.13037109375, 10.453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 8.0, 6.0, 12.0, 19.0, 38.0, 73.0, 87.0, 136.0, 151.0, 156.0, 97.0, 72.0, 53.0, 24.0, 12.0, 10.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.859375, -10.505859375, -10.15234375, -9.798828125, -9.4453125, -9.091796875, -8.73828125, -8.384765625, -8.03125, -7.677734375, -7.32421875, -6.970703125, -6.6171875, -6.263671875, -5.91015625, -5.556640625, -5.203125, -4.849609375, -4.49609375, -4.142578125, -3.7890625, -3.435546875, -3.08203125, -2.728515625, -2.375, -2.021484375, -1.66796875, -1.314453125, -0.9609375, -0.607421875, -0.25390625, 0.099609375, 0.453125, 0.806640625, 1.16015625, 1.513671875, 1.8671875, 2.220703125, 2.57421875, 2.927734375, 3.28125, 3.634765625, 3.98828125, 4.341796875, 4.6953125, 5.048828125, 5.40234375, 5.755859375, 6.109375, 6.462890625, 6.81640625, 7.169921875, 7.5234375, 7.876953125, 8.23046875, 8.583984375, 8.9375, 9.291015625, 9.64453125, 9.998046875, 10.3515625, 10.705078125, 11.05859375, 11.412109375, 11.765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 18.0, 60.0, 166.0, 346.0, 254.0, 91.0, 37.0, 13.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.65475463867188, -130.00514221191406, -126.35552215576172, -122.7059097290039, -119.05628967285156, -115.40667724609375, -111.75706481933594, -108.1074447631836, -104.45782470703125, -100.80821228027344, -97.1585922241211, -93.50897979736328, -89.85935974121094, -86.20974731445312, -82.56013488769531, -78.91051483154297, -75.26090240478516, -71.61128997802734, -67.961669921875, -64.31205749511719, -60.662437438964844, -57.01282501220703, -53.36320877075195, -49.713592529296875, -46.0639762878418, -42.41436004638672, -38.76474380493164, -35.11512756347656, -31.465513229370117, -27.81589698791504, -24.166282653808594, -20.516666412353516, -16.867050170898438, -13.21743392944336, -9.567818641662598, -5.918203353881836, -2.268587112426758, 1.3810291290283203, 5.030643463134766, 8.680259704589844, 12.329875946044922, 15.9794921875, 19.629108428955078, 23.278722763061523, 26.9283390045166, 30.57795524597168, 34.227569580078125, 37.8771858215332, 41.52680206298828, 45.17641830444336, 48.82603454589844, 52.47564697265625, 56.125267028808594, 59.774879455566406, 63.424495697021484, 67.07411193847656, 70.72372436523438, 74.37333679199219, 78.02295684814453, 81.67256927490234, 85.32218933105469, 88.9718017578125, 92.62141418457031, 96.27103424072266, 99.920654296875]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 19.0, 20.0, 23.0, 45.0, 57.0, 36.0, 64.0, 93.0, 82.0, 91.0, 82.0, 73.0, 61.0, 64.0, 41.0, 39.0, 23.0, 22.0, 11.0, 9.0, 6.0, 9.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-66.91558074951172, -65.18614196777344, -63.456703186035156, -61.727264404296875, -59.997825622558594, -58.26838684082031, -56.53894805908203, -54.80950927734375, -53.08007049560547, -51.35063171386719, -49.621192932128906, -47.891754150390625, -46.162315368652344, -44.43287658691406, -42.70343780517578, -40.9739990234375, -39.24456024169922, -37.51512145996094, -35.785682678222656, -34.056243896484375, -32.326805114746094, -30.597366333007812, -28.86792755126953, -27.13848876953125, -25.409046173095703, -23.679607391357422, -21.95016860961914, -20.22072982788086, -18.491291046142578, -16.761852264404297, -15.0324125289917, -13.302973747253418, -11.573535919189453, -9.844097137451172, -8.11465835571289, -6.385219097137451, -4.65578031539917, -2.9263410568237305, -1.1969022750854492, 0.532536506652832, 2.2619752883911133, 3.9914140701293945, 5.720852851867676, 7.450292110443115, 9.179731369018555, 10.909170150756836, 12.638608932495117, 14.368047714233398, 16.09748649597168, 17.82692527770996, 19.556364059448242, 21.285802841186523, 23.015241622924805, 24.74468231201172, 26.47412109375, 28.20355987548828, 29.932998657226562, 31.662437438964844, 33.391876220703125, 35.121315002441406, 36.85075378417969, 38.58019256591797, 40.30963134765625, 42.03907012939453, 43.76850891113281]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 11.0, 12.0, 15.0, 18.0, 21.0, 37.0, 37.0, 63.0, 87.0, 131.0, 216.0, 432.0, 753.0, 1428.0, 3189.0, 8415.0, 32362.0, 420418.0, 3619435.0, 80148.0, 15984.0, 5430.0, 2398.0, 1249.0, 661.0, 405.0, 245.0, 172.0, 121.0, 81.0, 57.0, 64.0, 44.0, 23.0, 22.0, 21.0, 19.0, 14.0, 5.0, 10.0, 7.0, 4.0, 5.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.025146484375, -19.31591796875, -18.606689453125, -17.8974609375, -17.188232421875, -16.47900390625, -15.769775390625, -15.060546875, -14.351318359375, -13.64208984375, -12.932861328125, -12.2236328125, -11.514404296875, -10.80517578125, -10.095947265625, -9.38671875, -8.677490234375, -7.96826171875, -7.259033203125, -6.5498046875, -5.840576171875, -5.13134765625, -4.422119140625, -3.712890625, -3.003662109375, -2.29443359375, -1.585205078125, -0.8759765625, -0.166748046875, 0.54248046875, 1.251708984375, 1.9609375, 2.670166015625, 3.37939453125, 4.088623046875, 4.7978515625, 5.507080078125, 6.21630859375, 6.925537109375, 7.634765625, 8.343994140625, 9.05322265625, 9.762451171875, 10.4716796875, 11.180908203125, 11.89013671875, 12.599365234375, 13.30859375, 14.017822265625, 14.72705078125, 15.436279296875, 16.1455078125, 16.854736328125, 17.56396484375, 18.273193359375, 18.982421875, 19.691650390625, 20.40087890625, 21.110107421875, 21.8193359375, 22.528564453125, 23.23779296875, 23.947021484375, 24.65625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 6.0, 14.0, 16.0, 17.0, 23.0, 37.0, 48.0, 72.0, 125.0, 115.0, 121.0, 106.0, 91.0, 56.0, 59.0, 29.0, 17.0, 11.0, 10.0, 11.0, 4.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.24609375, -1.2022857666015625, -1.158477783203125, -1.1146697998046875, -1.07086181640625, -1.0270538330078125, -0.983245849609375, -0.9394378662109375, -0.8956298828125, -0.8518218994140625, -0.808013916015625, -0.7642059326171875, -0.72039794921875, -0.6765899658203125, -0.632781982421875, -0.5889739990234375, -0.545166015625, -0.5013580322265625, -0.457550048828125, -0.4137420654296875, -0.36993408203125, -0.3261260986328125, -0.282318115234375, -0.2385101318359375, -0.1947021484375, -0.1508941650390625, -0.107086181640625, -0.0632781982421875, -0.01947021484375, 0.0243377685546875, 0.068145751953125, 0.1119537353515625, 0.15576171875, 0.1995697021484375, 0.243377685546875, 0.2871856689453125, 0.33099365234375, 0.3748016357421875, 0.418609619140625, 0.4624176025390625, 0.5062255859375, 0.5500335693359375, 0.593841552734375, 0.6376495361328125, 0.68145751953125, 0.7252655029296875, 0.769073486328125, 0.8128814697265625, 0.856689453125, 0.9004974365234375, 0.944305419921875, 0.9881134033203125, 1.03192138671875, 1.0757293701171875, 1.119537353515625, 1.1633453369140625, 1.2071533203125, 1.2509613037109375, 1.294769287109375, 1.3385772705078125, 1.38238525390625, 1.4261932373046875, 1.470001220703125, 1.5138092041015625, 1.5576171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 6.0, 8.0, 14.0, 13.0, 12.0, 24.0, 29.0, 66.0, 83.0, 175.0, 558.0, 7848.0, 4049973.0, 132920.0, 1924.0, 307.0, 135.0, 72.0, 38.0, 15.0, 20.0, 10.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -49.49462890625, -47.6455078125, -45.79638671875, -43.947265625, -42.09814453125, -40.2490234375, -38.39990234375, -36.55078125, -34.70166015625, -32.8525390625, -31.00341796875, -29.154296875, -27.30517578125, -25.4560546875, -23.60693359375, -21.7578125, -19.90869140625, -18.0595703125, -16.21044921875, -14.361328125, -12.51220703125, -10.6630859375, -8.81396484375, -6.96484375, -5.11572265625, -3.2666015625, -1.41748046875, 0.431640625, 2.28076171875, 4.1298828125, 5.97900390625, 7.828125, 9.67724609375, 11.5263671875, 13.37548828125, 15.224609375, 17.07373046875, 18.9228515625, 20.77197265625, 22.62109375, 24.47021484375, 26.3193359375, 28.16845703125, 30.017578125, 31.86669921875, 33.7158203125, 35.56494140625, 37.4140625, 39.26318359375, 41.1123046875, 42.96142578125, 44.810546875, 46.65966796875, 48.5087890625, 50.35791015625, 52.20703125, 54.05615234375, 55.9052734375, 57.75439453125, 59.603515625, 61.45263671875, 63.3017578125, 65.15087890625, 67.0]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 6.0, 12.0, 15.0, 12.0, 26.0, 37.0, 66.0, 106.0, 187.0, 349.0, 866.0, 1206.0, 534.0, 233.0, 132.0, 87.0, 63.0, 37.0, 24.0, 14.0, 17.0, 15.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.327728271484375, -2.24530029296875, -2.162872314453125, -2.0804443359375, -1.998016357421875, -1.91558837890625, -1.833160400390625, -1.750732421875, -1.668304443359375, -1.58587646484375, -1.503448486328125, -1.4210205078125, -1.338592529296875, -1.25616455078125, -1.173736572265625, -1.09130859375, -1.008880615234375, -0.92645263671875, -0.844024658203125, -0.7615966796875, -0.679168701171875, -0.59674072265625, -0.514312744140625, -0.431884765625, -0.349456787109375, -0.26702880859375, -0.184600830078125, -0.1021728515625, -0.019744873046875, 0.06268310546875, 0.145111083984375, 0.2275390625, 0.309967041015625, 0.39239501953125, 0.474822998046875, 0.5572509765625, 0.639678955078125, 0.72210693359375, 0.804534912109375, 0.886962890625, 0.969390869140625, 1.05181884765625, 1.134246826171875, 1.2166748046875, 1.299102783203125, 1.38153076171875, 1.463958740234375, 1.54638671875, 1.628814697265625, 1.71124267578125, 1.793670654296875, 1.8760986328125, 1.958526611328125, 2.04095458984375, 2.123382568359375, 2.205810546875, 2.288238525390625, 2.37066650390625, 2.453094482421875, 2.5355224609375, 2.617950439453125, 2.70037841796875, 2.782806396484375, 2.865234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 12.0, 29.0, 113.0, 236.0, 295.0, 188.0, 76.0, 32.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.84351348876953, -23.994565963745117, -23.145618438720703, -22.29667091369629, -21.447723388671875, -20.598773956298828, -19.749828338623047, -18.90087890625, -18.051931381225586, -17.202983856201172, -16.354036331176758, -15.505088806152344, -14.656140327453613, -13.8071928024292, -12.958245277404785, -12.109296798706055, -11.260350227355957, -10.411402702331543, -9.562455177307129, -8.713506698608398, -7.864559173583984, -7.01561164855957, -6.166664123535156, -5.317716121673584, -4.46876859664917, -3.6198208332061768, -2.7708730697631836, -1.9219255447387695, -1.0729777812957764, -0.2240300178527832, 0.6249175071716309, 1.4738655090332031, 2.322813034057617, 3.1717607975006104, 4.0207085609436035, 4.869656085968018, 5.71860408782959, 6.567551612854004, 7.416499137878418, 8.265447616577148, 9.114395141601562, 9.963342666625977, 10.81229019165039, 11.661237716674805, 12.510186195373535, 13.35913372039795, 14.208081245422363, 15.057029724121094, 15.905976295471191, 16.754924774169922, 17.603872299194336, 18.45281982421875, 19.301767349243164, 20.150714874267578, 20.999662399291992, 21.848609924316406, 22.69755744934082, 23.546504974365234, 24.39545249938965, 25.244400024414062, 26.093347549438477, 26.94229507446289, 27.791244506835938, 28.64019203186035, 29.489139556884766]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 13.0, 15.0, 18.0, 20.0, 22.0, 37.0, 30.0, 60.0, 51.0, 50.0, 51.0, 74.0, 79.0, 74.0, 76.0, 63.0, 59.0, 43.0, 32.0, 27.0, 21.0, 23.0, 14.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.948840141296387, -9.580921173095703, -9.21300220489502, -8.845083236694336, -8.477164268493652, -8.109245300292969, -7.741326332092285, -7.373407363891602, -7.005488395690918, -6.637569427490234, -6.269650459289551, -5.901731491088867, -5.533812522888184, -5.1658935546875, -4.797974586486816, -4.430055618286133, -4.062136650085449, -3.6942176818847656, -3.326298713684082, -2.9583797454833984, -2.590460777282715, -2.2225418090820312, -1.8546228408813477, -1.486703872680664, -1.1187849044799805, -0.7508659362792969, -0.3829469680786133, -0.015027999877929688, 0.3528909683227539, 0.7208099365234375, 1.088728904724121, 1.4566478729248047, 1.8245658874511719, 2.1924848556518555, 2.560403823852539, 2.9283227920532227, 3.2962417602539062, 3.66416072845459, 4.032079696655273, 4.399998664855957, 4.767917633056641, 5.135836601257324, 5.503755569458008, 5.871674537658691, 6.239593505859375, 6.607512474060059, 6.975431442260742, 7.343350410461426, 7.711269378662109, 8.079188346862793, 8.447107315063477, 8.81502628326416, 9.182945251464844, 9.550864219665527, 9.918783187866211, 10.286702156066895, 10.654621124267578, 11.022540092468262, 11.390459060668945, 11.758378028869629, 12.126296997070312, 12.494215965270996, 12.86213493347168, 13.230053901672363, 13.597972869873047]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 5.0, 11.0, 8.0, 6.0, 10.0, 12.0, 26.0, 19.0, 30.0, 33.0, 53.0, 66.0, 109.0, 191.0, 334.0, 669.0, 1509.0, 4855.0, 24701.0, 241548.0, 652006.0, 103899.0, 12809.0, 3157.0, 1170.0, 487.0, 270.0, 156.0, 106.0, 60.0, 43.0, 37.0, 35.0, 22.0, 24.0, 13.0, 12.0, 11.0, 6.0, 6.0, 2.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.642578125, -13.20703125, -12.771484375, -12.3359375, -11.900390625, -11.46484375, -11.029296875, -10.59375, -10.158203125, -9.72265625, -9.287109375, -8.8515625, -8.416015625, -7.98046875, -7.544921875, -7.109375, -6.673828125, -6.23828125, -5.802734375, -5.3671875, -4.931640625, -4.49609375, -4.060546875, -3.625, -3.189453125, -2.75390625, -2.318359375, -1.8828125, -1.447265625, -1.01171875, -0.576171875, -0.140625, 0.294921875, 0.73046875, 1.166015625, 1.6015625, 2.037109375, 2.47265625, 2.908203125, 3.34375, 3.779296875, 4.21484375, 4.650390625, 5.0859375, 5.521484375, 5.95703125, 6.392578125, 6.828125, 7.263671875, 7.69921875, 8.134765625, 8.5703125, 9.005859375, 9.44140625, 9.876953125, 10.3125, 10.748046875, 11.18359375, 11.619140625, 12.0546875, 12.490234375, 12.92578125, 13.361328125, 13.796875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 17.0, 28.0, 37.0, 93.0, 108.0, 146.0, 168.0, 140.0, 103.0, 71.0, 38.0, 25.0, 11.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4296875, -2.3681640625, -2.306640625, -2.2451171875, -2.18359375, -2.1220703125, -2.060546875, -1.9990234375, -1.9375, -1.8759765625, -1.814453125, -1.7529296875, -1.69140625, -1.6298828125, -1.568359375, -1.5068359375, -1.4453125, -1.3837890625, -1.322265625, -1.2607421875, -1.19921875, -1.1376953125, -1.076171875, -1.0146484375, -0.953125, -0.8916015625, -0.830078125, -0.7685546875, -0.70703125, -0.6455078125, -0.583984375, -0.5224609375, -0.4609375, -0.3994140625, -0.337890625, -0.2763671875, -0.21484375, -0.1533203125, -0.091796875, -0.0302734375, 0.03125, 0.0927734375, 0.154296875, 0.2158203125, 0.27734375, 0.3388671875, 0.400390625, 0.4619140625, 0.5234375, 0.5849609375, 0.646484375, 0.7080078125, 0.76953125, 0.8310546875, 0.892578125, 0.9541015625, 1.015625, 1.0771484375, 1.138671875, 1.2001953125, 1.26171875, 1.3232421875, 1.384765625, 1.4462890625, 1.5078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 11.0, 9.0, 17.0, 23.0, 19.0, 28.0, 37.0, 48.0, 72.0, 117.0, 145.0, 198.0, 314.0, 411.0, 669.0, 1048.0, 1906.0, 3445.0, 6630.0, 14205.0, 32300.0, 74746.0, 165110.0, 276588.0, 243224.0, 125076.0, 54878.0, 24028.0, 10801.0, 5299.0, 2756.0, 1609.0, 926.0, 558.0, 377.0, 262.0, 194.0, 133.0, 118.0, 70.0, 36.0, 39.0, 20.0, 10.0, 13.0, 7.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.78125, -5.59954833984375, -5.4178466796875, -5.23614501953125, -5.054443359375, -4.87274169921875, -4.6910400390625, -4.50933837890625, -4.32763671875, -4.14593505859375, -3.9642333984375, -3.78253173828125, -3.600830078125, -3.41912841796875, -3.2374267578125, -3.05572509765625, -2.8740234375, -2.69232177734375, -2.5106201171875, -2.32891845703125, -2.147216796875, -1.96551513671875, -1.7838134765625, -1.60211181640625, -1.42041015625, -1.23870849609375, -1.0570068359375, -0.87530517578125, -0.693603515625, -0.51190185546875, -0.3302001953125, -0.14849853515625, 0.033203125, 0.21490478515625, 0.3966064453125, 0.57830810546875, 0.760009765625, 0.94171142578125, 1.1234130859375, 1.30511474609375, 1.48681640625, 1.66851806640625, 1.8502197265625, 2.03192138671875, 2.213623046875, 2.39532470703125, 2.5770263671875, 2.75872802734375, 2.9404296875, 3.12213134765625, 3.3038330078125, 3.48553466796875, 3.667236328125, 3.84893798828125, 4.0306396484375, 4.21234130859375, 4.39404296875, 4.57574462890625, 4.7574462890625, 4.93914794921875, 5.120849609375, 5.30255126953125, 5.4842529296875, 5.66595458984375, 5.84765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 8.0, 9.0, 10.0, 12.0, 16.0, 15.0, 21.0, 27.0, 36.0, 39.0, 29.0, 48.0, 36.0, 44.0, 38.0, 37.0, 29.0, 53.0, 48.0, 37.0, 44.0, 45.0, 44.0, 32.0, 29.0, 23.0, 31.0, 24.0, 23.0, 17.0, 14.0, 10.0, 14.0, 12.0, 8.0, 9.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.50732421875, -4.3466796875, -4.18603515625, -4.025390625, -3.86474609375, -3.7041015625, -3.54345703125, -3.3828125, -3.22216796875, -3.0615234375, -2.90087890625, -2.740234375, -2.57958984375, -2.4189453125, -2.25830078125, -2.09765625, -1.93701171875, -1.7763671875, -1.61572265625, -1.455078125, -1.29443359375, -1.1337890625, -0.97314453125, -0.8125, -0.65185546875, -0.4912109375, -0.33056640625, -0.169921875, -0.00927734375, 0.1513671875, 0.31201171875, 0.47265625, 0.63330078125, 0.7939453125, 0.95458984375, 1.115234375, 1.27587890625, 1.4365234375, 1.59716796875, 1.7578125, 1.91845703125, 2.0791015625, 2.23974609375, 2.400390625, 2.56103515625, 2.7216796875, 2.88232421875, 3.04296875, 3.20361328125, 3.3642578125, 3.52490234375, 3.685546875, 3.84619140625, 4.0068359375, 4.16748046875, 4.328125, 4.48876953125, 4.6494140625, 4.81005859375, 4.970703125, 5.13134765625, 5.2919921875, 5.45263671875, 5.61328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 15.0, 12.0, 24.0, 51.0, 59.0, 92.0, 150.0, 314.0, 571.0, 1093.0, 2366.0, 5590.0, 15140.0, 49947.0, 199039.0, 472469.0, 219869.0, 54501.0, 16211.0, 5950.0, 2563.0, 1181.0, 573.0, 323.0, 170.0, 110.0, 61.0, 33.0, 24.0, 13.0, 6.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.109375, -8.85302734375, -8.5966796875, -8.34033203125, -8.083984375, -7.82763671875, -7.5712890625, -7.31494140625, -7.05859375, -6.80224609375, -6.5458984375, -6.28955078125, -6.033203125, -5.77685546875, -5.5205078125, -5.26416015625, -5.0078125, -4.75146484375, -4.4951171875, -4.23876953125, -3.982421875, -3.72607421875, -3.4697265625, -3.21337890625, -2.95703125, -2.70068359375, -2.4443359375, -2.18798828125, -1.931640625, -1.67529296875, -1.4189453125, -1.16259765625, -0.90625, -0.64990234375, -0.3935546875, -0.13720703125, 0.119140625, 0.37548828125, 0.6318359375, 0.88818359375, 1.14453125, 1.40087890625, 1.6572265625, 1.91357421875, 2.169921875, 2.42626953125, 2.6826171875, 2.93896484375, 3.1953125, 3.45166015625, 3.7080078125, 3.96435546875, 4.220703125, 4.47705078125, 4.7333984375, 4.98974609375, 5.24609375, 5.50244140625, 5.7587890625, 6.01513671875, 6.271484375, 6.52783203125, 6.7841796875, 7.04052734375, 7.296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 8.0, 15.0, 27.0, 32.0, 26.0, 31.0, 45.0, 57.0, 73.0, 73.0, 102.0, 87.0, 90.0, 62.0, 53.0, 41.0, 28.0, 31.0, 29.0, 10.0, 12.0, 10.0, 11.0, 5.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0008268356323242188, -0.0007970333099365234, -0.0007672309875488281, -0.0007374286651611328, -0.0007076263427734375, -0.0006778240203857422, -0.0006480216979980469, -0.0006182193756103516, -0.0005884170532226562, -0.0005586147308349609, -0.0005288124084472656, -0.0004990100860595703, -0.000469207763671875, -0.0004394054412841797, -0.0004096031188964844, -0.00037980079650878906, -0.00034999847412109375, -0.00032019615173339844, -0.0002903938293457031, -0.0002605915069580078, -0.0002307891845703125, -0.0002009868621826172, -0.00017118453979492188, -0.00014138221740722656, -0.00011157989501953125, -8.177757263183594e-05, -5.1975250244140625e-05, -2.2172927856445312e-05, 7.62939453125e-06, 3.743171691894531e-05, 6.723403930664062e-05, 9.703636169433594e-05, 0.00012683868408203125, 0.00015664100646972656, 0.00018644332885742188, 0.0002162456512451172, 0.0002460479736328125, 0.0002758502960205078, 0.0003056526184082031, 0.00033545494079589844, 0.00036525726318359375, 0.00039505958557128906, 0.0004248619079589844, 0.0004546642303466797, 0.000484466552734375, 0.0005142688751220703, 0.0005440711975097656, 0.0005738735198974609, 0.0006036758422851562, 0.0006334781646728516, 0.0006632804870605469, 0.0006930828094482422, 0.0007228851318359375, 0.0007526874542236328, 0.0007824897766113281, 0.0008122920989990234, 0.0008420944213867188, 0.0008718967437744141, 0.0009016990661621094, 0.0009315013885498047, 0.0009613037109375, 0.0009911060333251953, 0.0010209083557128906, 0.001050710678100586, 0.0010805130004882812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 9.0, 11.0, 26.0, 23.0, 38.0, 62.0, 78.0, 145.0, 267.0, 512.0, 1005.0, 2257.0, 5951.0, 21560.0, 129201.0, 648739.0, 196573.0, 29294.0, 7616.0, 2704.0, 1174.0, 547.0, 302.0, 169.0, 96.0, 66.0, 46.0, 17.0, 19.0, 16.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.83056640625, -13.4189453125, -13.00732421875, -12.595703125, -12.18408203125, -11.7724609375, -11.36083984375, -10.94921875, -10.53759765625, -10.1259765625, -9.71435546875, -9.302734375, -8.89111328125, -8.4794921875, -8.06787109375, -7.65625, -7.24462890625, -6.8330078125, -6.42138671875, -6.009765625, -5.59814453125, -5.1865234375, -4.77490234375, -4.36328125, -3.95166015625, -3.5400390625, -3.12841796875, -2.716796875, -2.30517578125, -1.8935546875, -1.48193359375, -1.0703125, -0.65869140625, -0.2470703125, 0.16455078125, 0.576171875, 0.98779296875, 1.3994140625, 1.81103515625, 2.22265625, 2.63427734375, 3.0458984375, 3.45751953125, 3.869140625, 4.28076171875, 4.6923828125, 5.10400390625, 5.515625, 5.92724609375, 6.3388671875, 6.75048828125, 7.162109375, 7.57373046875, 7.9853515625, 8.39697265625, 8.80859375, 9.22021484375, 9.6318359375, 10.04345703125, 10.455078125, 10.86669921875, 11.2783203125, 11.68994140625, 12.1015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 11.0, 17.0, 19.0, 36.0, 46.0, 63.0, 77.0, 114.0, 122.0, 111.0, 112.0, 76.0, 53.0, 37.0, 31.0, 19.0, 14.0, 11.0, 4.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-10.234375, -9.98455810546875, -9.7347412109375, -9.48492431640625, -9.235107421875, -8.98529052734375, -8.7354736328125, -8.48565673828125, -8.23583984375, -7.98602294921875, -7.7362060546875, -7.48638916015625, -7.236572265625, -6.98675537109375, -6.7369384765625, -6.48712158203125, -6.2373046875, -5.98748779296875, -5.7376708984375, -5.48785400390625, -5.238037109375, -4.98822021484375, -4.7384033203125, -4.48858642578125, -4.23876953125, -3.98895263671875, -3.7391357421875, -3.48931884765625, -3.239501953125, -2.98968505859375, -2.7398681640625, -2.49005126953125, -2.240234375, -1.99041748046875, -1.7406005859375, -1.49078369140625, -1.240966796875, -0.99114990234375, -0.7413330078125, -0.49151611328125, -0.24169921875, 0.00811767578125, 0.2579345703125, 0.50775146484375, 0.757568359375, 1.00738525390625, 1.2572021484375, 1.50701904296875, 1.7568359375, 2.00665283203125, 2.2564697265625, 2.50628662109375, 2.756103515625, 3.00592041015625, 3.2557373046875, 3.50555419921875, 3.75537109375, 4.00518798828125, 4.2550048828125, 4.50482177734375, 4.754638671875, 5.00445556640625, 5.2542724609375, 5.50408935546875, 5.75390625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 12.0, 33.0, 51.0, 102.0, 189.0, 197.0, 167.0, 105.0, 62.0, 30.0, 16.0, 10.0, 3.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.81666564941406, -84.31334686279297, -81.81002807617188, -79.30670166015625, -76.80338287353516, -74.30006408691406, -71.79674530029297, -69.29342651367188, -66.79010009765625, -64.28678131103516, -61.7834587097168, -59.2801399230957, -56.776817321777344, -54.27349853515625, -51.770179748535156, -49.26686096191406, -46.76354217529297, -44.260223388671875, -41.756900787353516, -39.25358200073242, -36.75025939941406, -34.24694061279297, -31.743621826171875, -29.24030113220215, -26.736980438232422, -24.233659744262695, -21.73033905029297, -19.227020263671875, -16.72369956970215, -14.220378875732422, -11.717059135437012, -9.213739395141602, -6.710411071777344, -4.207090854644775, -1.703770637512207, 0.7995495796203613, 3.3028697967529297, 5.806190490722656, 8.309510231018066, 10.812829971313477, 13.316150665283203, 15.81947135925293, 18.322792053222656, 20.82611083984375, 23.329431533813477, 25.832752227783203, 28.336071014404297, 30.839391708374023, 33.34271240234375, 35.846031188964844, 38.3493537902832, 40.8526725769043, 43.355995178222656, 45.85931396484375, 48.362632751464844, 50.86595153808594, 53.3692741394043, 55.87259292602539, 58.37591552734375, 60.879234313964844, 63.38255310058594, 65.88587951660156, 68.38919830322266, 70.89251708984375, 73.39583587646484]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 9.0, 9.0, 17.0, 15.0, 33.0, 34.0, 27.0, 43.0, 51.0, 56.0, 70.0, 71.0, 69.0, 73.0, 49.0, 60.0, 63.0, 52.0, 40.0, 40.0, 37.0, 32.0, 16.0, 13.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.86215209960938, -64.96086120605469, -63.0595703125, -61.15827941894531, -59.25699234008789, -57.3557014465332, -55.454410552978516, -53.55311965942383, -51.651832580566406, -49.75054168701172, -47.84925079345703, -45.947959899902344, -44.04667282104492, -42.145381927490234, -40.24409103393555, -38.34280014038086, -36.44150924682617, -34.540218353271484, -32.6389274597168, -30.737638473510742, -28.836349487304688, -26.93505859375, -25.033767700195312, -23.132476806640625, -21.23118782043457, -19.329896926879883, -17.428607940673828, -15.52731704711914, -13.62602710723877, -11.724737167358398, -9.823446273803711, -7.92215633392334, -6.020870208740234, -4.119580268859863, -2.218289852142334, -0.3169994354248047, 1.5842905044555664, 3.4855804443359375, 5.386871337890625, 7.288161277770996, 9.189451217651367, 11.090741157531738, 12.99203109741211, 14.893321990966797, 16.794612884521484, 18.69590187072754, 20.597192764282227, 22.49848175048828, 24.39977264404297, 26.301063537597656, 28.20235252380371, 30.1036434173584, 32.00493240356445, 33.90622329711914, 35.80751419067383, 37.708805084228516, 39.61009216308594, 41.511383056640625, 43.41267395019531, 45.31396484375, 47.21525192260742, 49.11654281616211, 51.0178337097168, 52.919124603271484, 54.82041549682617]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 11.0, 9.0, 18.0, 24.0, 34.0, 58.0, 83.0, 118.0, 202.0, 411.0, 980.0, 3208.0, 21349.0, 3292826.0, 852016.0, 17218.0, 3393.0, 1132.0, 504.0, 267.0, 159.0, 79.0, 62.0, 34.0, 22.0, 14.0, 18.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.21875, -36.94189453125, -35.6650390625, -34.38818359375, -33.111328125, -31.83447265625, -30.5576171875, -29.28076171875, -28.00390625, -26.72705078125, -25.4501953125, -24.17333984375, -22.896484375, -21.61962890625, -20.3427734375, -19.06591796875, -17.7890625, -16.51220703125, -15.2353515625, -13.95849609375, -12.681640625, -11.40478515625, -10.1279296875, -8.85107421875, -7.57421875, -6.29736328125, -5.0205078125, -3.74365234375, -2.466796875, -1.18994140625, 0.0869140625, 1.36376953125, 2.640625, 3.91748046875, 5.1943359375, 6.47119140625, 7.748046875, 9.02490234375, 10.3017578125, 11.57861328125, 12.85546875, 14.13232421875, 15.4091796875, 16.68603515625, 17.962890625, 19.23974609375, 20.5166015625, 21.79345703125, 23.0703125, 24.34716796875, 25.6240234375, 26.90087890625, 28.177734375, 29.45458984375, 30.7314453125, 32.00830078125, 33.28515625, 34.56201171875, 35.8388671875, 37.11572265625, 38.392578125, 39.66943359375, 40.9462890625, 42.22314453125, 43.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 6.0, 19.0, 22.0, 43.0, 43.0, 63.0, 69.0, 88.0, 102.0, 85.0, 95.0, 74.0, 70.0, 56.0, 51.0, 35.0, 19.0, 15.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.7880859375, -1.731353759765625, -1.67462158203125, -1.617889404296875, -1.5611572265625, -1.504425048828125, -1.44769287109375, -1.390960693359375, -1.334228515625, -1.277496337890625, -1.22076416015625, -1.164031982421875, -1.1072998046875, -1.050567626953125, -0.99383544921875, -0.937103271484375, -0.88037109375, -0.823638916015625, -0.76690673828125, -0.710174560546875, -0.6534423828125, -0.596710205078125, -0.53997802734375, -0.483245849609375, -0.426513671875, -0.369781494140625, -0.31304931640625, -0.256317138671875, -0.1995849609375, -0.142852783203125, -0.08612060546875, -0.029388427734375, 0.02734375, 0.084075927734375, 0.14080810546875, 0.197540283203125, 0.2542724609375, 0.311004638671875, 0.36773681640625, 0.424468994140625, 0.481201171875, 0.537933349609375, 0.59466552734375, 0.651397705078125, 0.7081298828125, 0.764862060546875, 0.82159423828125, 0.878326416015625, 0.93505859375, 0.991790771484375, 1.04852294921875, 1.105255126953125, 1.1619873046875, 1.218719482421875, 1.27545166015625, 1.332183837890625, 1.388916015625, 1.445648193359375, 1.50238037109375, 1.559112548828125, 1.6158447265625, 1.672576904296875, 1.72930908203125, 1.786041259765625, 1.8427734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 16.0, 9.0, 24.0, 27.0, 39.0, 69.0, 98.0, 105.0, 174.0, 279.0, 997.0, 284819.0, 3904130.0, 2591.0, 360.0, 166.0, 111.0, 81.0, 64.0, 41.0, 28.0, 22.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0], "bins": [-120.0625, -117.51513671875, -114.9677734375, -112.42041015625, -109.873046875, -107.32568359375, -104.7783203125, -102.23095703125, -99.68359375, -97.13623046875, -94.5888671875, -92.04150390625, -89.494140625, -86.94677734375, -84.3994140625, -81.85205078125, -79.3046875, -76.75732421875, -74.2099609375, -71.66259765625, -69.115234375, -66.56787109375, -64.0205078125, -61.47314453125, -58.92578125, -56.37841796875, -53.8310546875, -51.28369140625, -48.736328125, -46.18896484375, -43.6416015625, -41.09423828125, -38.546875, -35.99951171875, -33.4521484375, -30.90478515625, -28.357421875, -25.81005859375, -23.2626953125, -20.71533203125, -18.16796875, -15.62060546875, -13.0732421875, -10.52587890625, -7.978515625, -5.43115234375, -2.8837890625, -0.33642578125, 2.2109375, 4.75830078125, 7.3056640625, 9.85302734375, 12.400390625, 14.94775390625, 17.4951171875, 20.04248046875, 22.58984375, 25.13720703125, 27.6845703125, 30.23193359375, 32.779296875, 35.32666015625, 37.8740234375, 40.42138671875, 42.96875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 16.0, 33.0, 58.0, 140.0, 369.0, 1557.0, 1325.0, 338.0, 130.0, 55.0, 22.0, 18.0, 11.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.3203125, -11.10235595703125, -10.8843994140625, -10.66644287109375, -10.448486328125, -10.23052978515625, -10.0125732421875, -9.79461669921875, -9.57666015625, -9.35870361328125, -9.1407470703125, -8.92279052734375, -8.704833984375, -8.48687744140625, -8.2689208984375, -8.05096435546875, -7.8330078125, -7.61505126953125, -7.3970947265625, -7.17913818359375, -6.961181640625, -6.74322509765625, -6.5252685546875, -6.30731201171875, -6.08935546875, -5.87139892578125, -5.6534423828125, -5.43548583984375, -5.217529296875, -4.99957275390625, -4.7816162109375, -4.56365966796875, -4.345703125, -4.12774658203125, -3.9097900390625, -3.69183349609375, -3.473876953125, -3.25592041015625, -3.0379638671875, -2.82000732421875, -2.60205078125, -2.38409423828125, -2.1661376953125, -1.94818115234375, -1.730224609375, -1.51226806640625, -1.2943115234375, -1.07635498046875, -0.8583984375, -0.64044189453125, -0.4224853515625, -0.20452880859375, 0.013427734375, 0.23138427734375, 0.4493408203125, 0.66729736328125, 0.88525390625, 1.10321044921875, 1.3211669921875, 1.53912353515625, 1.757080078125, 1.97503662109375, 2.1929931640625, 2.41094970703125, 2.62890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 110.0, 824.0, 66.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.94189453125, -177.99920654296875, -170.0565185546875, -162.11383056640625, -154.171142578125, -146.22845458984375, -138.2857666015625, -130.34307861328125, -122.40038299560547, -114.45769500732422, -106.51500701904297, -98.57231140136719, -90.62962341308594, -82.68693542480469, -74.74424743652344, -66.80155944824219, -58.85887145996094, -50.91618347167969, -42.97349548339844, -35.03080368041992, -27.088115692138672, -19.145427703857422, -11.202735900878906, -3.2600479125976562, 4.682640075683594, 12.62532901763916, 20.568017959594727, 28.51070785522461, 36.45339584350586, 44.39608383178711, 52.338775634765625, 60.281463623046875, 68.22415161132812, 76.16683959960938, 84.10952758789062, 92.05221557617188, 99.99490356445312, 107.93759155273438, 115.88028717041016, 123.8229751586914, 131.76565551757812, 139.70834350585938, 147.65103149414062, 155.59371948242188, 163.53640747070312, 171.47909545898438, 179.42178344726562, 187.36447143554688, 195.3071746826172, 203.24986267089844, 211.1925506591797, 219.13523864746094, 227.0779266357422, 235.02061462402344, 242.96331787109375, 250.906005859375, 258.84869384765625, 266.7913818359375, 274.73406982421875, 282.6767578125, 290.61944580078125, 298.5621337890625, 306.50482177734375, 314.447509765625, 322.39019775390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 13.0, 24.0, 21.0, 35.0, 51.0, 70.0, 80.0, 97.0, 106.0, 92.0, 98.0, 67.0, 60.0, 59.0, 45.0, 26.0, 22.0, 12.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.453672409057617, -27.52790069580078, -26.602128982543945, -25.67635726928711, -24.75058364868164, -23.824811935424805, -22.89904022216797, -21.973268508911133, -21.047496795654297, -20.12172508239746, -19.195953369140625, -18.270179748535156, -17.34440803527832, -16.418636322021484, -15.492864608764648, -14.567092895507812, -13.641319274902344, -12.715547561645508, -11.789774894714355, -10.86400318145752, -9.938230514526367, -9.012458801269531, -8.086687088012695, -7.160914897918701, -6.235142707824707, -5.309370517730713, -4.383598327636719, -3.457826614379883, -2.5320544242858887, -1.6062822341918945, -0.6805105209350586, 0.24526166915893555, 1.1710319519042969, 2.096804141998291, 3.022576093673706, 3.948348045349121, 4.874120235443115, 5.799892425537109, 6.725664138793945, 7.6514363288879395, 8.577208518981934, 9.50298023223877, 10.428752899169922, 11.354524612426758, 12.280296325683594, 13.206068992614746, 14.131840705871582, 15.057613372802734, 15.98338508605957, 16.909156799316406, 17.834928512573242, 18.760700225830078, 19.686473846435547, 20.612245559692383, 21.53801727294922, 22.463788986206055, 23.38956069946289, 24.315332412719727, 25.241104125976562, 26.16687774658203, 27.092649459838867, 28.018421173095703, 28.94419288635254, 29.869964599609375, 30.795738220214844]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 5.0, 12.0, 13.0, 12.0, 17.0, 42.0, 58.0, 88.0, 153.0, 250.0, 500.0, 956.0, 2486.0, 7635.0, 44403.0, 381318.0, 521750.0, 72469.0, 10856.0, 3049.0, 1205.0, 529.0, 278.0, 147.0, 108.0, 65.0, 27.0, 26.0, 17.0, 11.0, 13.0, 9.0, 4.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.828125, -21.188232421875, -20.54833984375, -19.908447265625, -19.2685546875, -18.628662109375, -17.98876953125, -17.348876953125, -16.708984375, -16.069091796875, -15.42919921875, -14.789306640625, -14.1494140625, -13.509521484375, -12.86962890625, -12.229736328125, -11.58984375, -10.949951171875, -10.31005859375, -9.670166015625, -9.0302734375, -8.390380859375, -7.75048828125, -7.110595703125, -6.470703125, -5.830810546875, -5.19091796875, -4.551025390625, -3.9111328125, -3.271240234375, -2.63134765625, -1.991455078125, -1.3515625, -0.711669921875, -0.07177734375, 0.568115234375, 1.2080078125, 1.847900390625, 2.48779296875, 3.127685546875, 3.767578125, 4.407470703125, 5.04736328125, 5.687255859375, 6.3271484375, 6.967041015625, 7.60693359375, 8.246826171875, 8.88671875, 9.526611328125, 10.16650390625, 10.806396484375, 11.4462890625, 12.086181640625, 12.72607421875, 13.365966796875, 14.005859375, 14.645751953125, 15.28564453125, 15.925537109375, 16.5654296875, 17.205322265625, 17.84521484375, 18.485107421875, 19.125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 12.0, 22.0, 31.0, 45.0, 79.0, 91.0, 111.0, 117.0, 117.0, 108.0, 85.0, 62.0, 43.0, 24.0, 12.0, 15.0, 1.0, 3.0, 4.0, 1.0, 0.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.246185302734375, -3.16033935546875, -3.074493408203125, -2.9886474609375, -2.902801513671875, -2.81695556640625, -2.731109619140625, -2.645263671875, -2.559417724609375, -2.47357177734375, -2.387725830078125, -2.3018798828125, -2.216033935546875, -2.13018798828125, -2.044342041015625, -1.95849609375, -1.872650146484375, -1.78680419921875, -1.700958251953125, -1.6151123046875, -1.529266357421875, -1.44342041015625, -1.357574462890625, -1.271728515625, -1.185882568359375, -1.10003662109375, -1.014190673828125, -0.9283447265625, -0.842498779296875, -0.75665283203125, -0.670806884765625, -0.5849609375, -0.499114990234375, -0.41326904296875, -0.327423095703125, -0.2415771484375, -0.155731201171875, -0.06988525390625, 0.015960693359375, 0.101806640625, 0.187652587890625, 0.27349853515625, 0.359344482421875, 0.4451904296875, 0.531036376953125, 0.61688232421875, 0.702728271484375, 0.78857421875, 0.874420166015625, 0.96026611328125, 1.046112060546875, 1.1319580078125, 1.217803955078125, 1.30364990234375, 1.389495849609375, 1.475341796875, 1.561187744140625, 1.64703369140625, 1.732879638671875, 1.8187255859375, 1.904571533203125, 1.99041748046875, 2.076263427734375, 2.162109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 5.0, 15.0, 13.0, 26.0, 20.0, 38.0, 51.0, 64.0, 99.0, 145.0, 212.0, 271.0, 444.0, 681.0, 1186.0, 2093.0, 4235.0, 9549.0, 24911.0, 69597.0, 186457.0, 328423.0, 251996.0, 105221.0, 36795.0, 13591.0, 5724.0, 2790.0, 1451.0, 840.0, 530.0, 312.0, 202.0, 154.0, 141.0, 70.0, 57.0, 35.0, 27.0, 17.0, 19.0, 7.0, 11.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-9.34375, -9.074462890625, -8.80517578125, -8.535888671875, -8.2666015625, -7.997314453125, -7.72802734375, -7.458740234375, -7.189453125, -6.920166015625, -6.65087890625, -6.381591796875, -6.1123046875, -5.843017578125, -5.57373046875, -5.304443359375, -5.03515625, -4.765869140625, -4.49658203125, -4.227294921875, -3.9580078125, -3.688720703125, -3.41943359375, -3.150146484375, -2.880859375, -2.611572265625, -2.34228515625, -2.072998046875, -1.8037109375, -1.534423828125, -1.26513671875, -0.995849609375, -0.7265625, -0.457275390625, -0.18798828125, 0.081298828125, 0.3505859375, 0.619873046875, 0.88916015625, 1.158447265625, 1.427734375, 1.697021484375, 1.96630859375, 2.235595703125, 2.5048828125, 2.774169921875, 3.04345703125, 3.312744140625, 3.58203125, 3.851318359375, 4.12060546875, 4.389892578125, 4.6591796875, 4.928466796875, 5.19775390625, 5.467041015625, 5.736328125, 6.005615234375, 6.27490234375, 6.544189453125, 6.8134765625, 7.082763671875, 7.35205078125, 7.621337890625, 7.890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 5.0, 6.0, 12.0, 9.0, 13.0, 14.0, 17.0, 18.0, 19.0, 27.0, 29.0, 38.0, 35.0, 39.0, 49.0, 51.0, 45.0, 54.0, 54.0, 56.0, 43.0, 37.0, 41.0, 50.0, 34.0, 30.0, 24.0, 22.0, 21.0, 30.0, 13.0, 10.0, 9.0, 13.0, 6.0, 6.0, 5.0, 7.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0234375, -7.77581787109375, -7.5281982421875, -7.28057861328125, -7.032958984375, -6.78533935546875, -6.5377197265625, -6.29010009765625, -6.04248046875, -5.79486083984375, -5.5472412109375, -5.29962158203125, -5.052001953125, -4.80438232421875, -4.5567626953125, -4.30914306640625, -4.0615234375, -3.81390380859375, -3.5662841796875, -3.31866455078125, -3.071044921875, -2.82342529296875, -2.5758056640625, -2.32818603515625, -2.08056640625, -1.83294677734375, -1.5853271484375, -1.33770751953125, -1.090087890625, -0.84246826171875, -0.5948486328125, -0.34722900390625, -0.099609375, 0.14801025390625, 0.3956298828125, 0.64324951171875, 0.890869140625, 1.13848876953125, 1.3861083984375, 1.63372802734375, 1.88134765625, 2.12896728515625, 2.3765869140625, 2.62420654296875, 2.871826171875, 3.11944580078125, 3.3670654296875, 3.61468505859375, 3.8623046875, 4.10992431640625, 4.3575439453125, 4.60516357421875, 4.852783203125, 5.10040283203125, 5.3480224609375, 5.59564208984375, 5.84326171875, 6.09088134765625, 6.3385009765625, 6.58612060546875, 6.833740234375, 7.08135986328125, 7.3289794921875, 7.57659912109375, 7.82421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 6.0, 3.0, 9.0, 12.0, 19.0, 27.0, 30.0, 66.0, 116.0, 213.0, 469.0, 1358.0, 4852.0, 27945.0, 271324.0, 626333.0, 99358.0, 12275.0, 2565.0, 844.0, 313.0, 147.0, 88.0, 58.0, 41.0, 26.0, 14.0, 16.0, 6.0, 4.0, 2.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.804931640625, -9.34423828125, -8.883544921875, -8.4228515625, -7.962158203125, -7.50146484375, -7.040771484375, -6.580078125, -6.119384765625, -5.65869140625, -5.197998046875, -4.7373046875, -4.276611328125, -3.81591796875, -3.355224609375, -2.89453125, -2.433837890625, -1.97314453125, -1.512451171875, -1.0517578125, -0.591064453125, -0.13037109375, 0.330322265625, 0.791015625, 1.251708984375, 1.71240234375, 2.173095703125, 2.6337890625, 3.094482421875, 3.55517578125, 4.015869140625, 4.4765625, 4.937255859375, 5.39794921875, 5.858642578125, 6.3193359375, 6.780029296875, 7.24072265625, 7.701416015625, 8.162109375, 8.622802734375, 9.08349609375, 9.544189453125, 10.0048828125, 10.465576171875, 10.92626953125, 11.386962890625, 11.84765625, 12.308349609375, 12.76904296875, 13.229736328125, 13.6904296875, 14.151123046875, 14.61181640625, 15.072509765625, 15.533203125, 15.993896484375, 16.45458984375, 16.915283203125, 17.3759765625, 17.836669921875, 18.29736328125, 18.758056640625, 19.21875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 7.0, 7.0, 12.0, 10.0, 12.0, 11.0, 17.0, 16.0, 31.0, 29.0, 36.0, 62.0, 54.0, 61.0, 71.0, 71.0, 74.0, 57.0, 63.0, 52.0, 36.0, 37.0, 26.0, 28.0, 26.0, 20.0, 12.0, 14.0, 7.0, 11.0, 10.0, 8.0, 3.0, 3.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009431838989257812, -0.0009156465530395508, -0.0008881092071533203, -0.0008605718612670898, -0.0008330345153808594, -0.0008054971694946289, -0.0007779598236083984, -0.000750422477722168, -0.0007228851318359375, -0.000695347785949707, -0.0006678104400634766, -0.0006402730941772461, -0.0006127357482910156, -0.0005851984024047852, -0.0005576610565185547, -0.0005301237106323242, -0.0005025863647460938, -0.0004750490188598633, -0.0004475116729736328, -0.00041997432708740234, -0.0003924369812011719, -0.0003648996353149414, -0.00033736228942871094, -0.00030982494354248047, -0.00028228759765625, -0.00025475025177001953, -0.00022721290588378906, -0.0001996755599975586, -0.00017213821411132812, -0.00014460086822509766, -0.00011706352233886719, -8.952617645263672e-05, -6.198883056640625e-05, -3.445148468017578e-05, -6.9141387939453125e-06, 2.0623207092285156e-05, 4.8160552978515625e-05, 7.56978988647461e-05, 0.00010323524475097656, 0.00013077259063720703, 0.0001583099365234375, 0.00018584728240966797, 0.00021338462829589844, 0.0002409219741821289, 0.0002684593200683594, 0.00029599666595458984, 0.0003235340118408203, 0.0003510713577270508, 0.00037860870361328125, 0.0004061460494995117, 0.0004336833953857422, 0.00046122074127197266, 0.0004887580871582031, 0.0005162954330444336, 0.0005438327789306641, 0.0005713701248168945, 0.000598907470703125, 0.0006264448165893555, 0.0006539821624755859, 0.0006815195083618164, 0.0007090568542480469, 0.0007365942001342773, 0.0007641315460205078, 0.0007916688919067383, 0.0008192062377929688]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 9.0, 6.0, 14.0, 29.0, 30.0, 61.0, 95.0, 152.0, 293.0, 613.0, 1323.0, 3401.0, 11868.0, 60745.0, 384877.0, 479444.0, 83254.0, 15173.0, 4095.0, 1518.0, 658.0, 340.0, 207.0, 120.0, 66.0, 38.0, 34.0, 14.0, 14.0, 14.0, 7.0, 5.0, 8.0, 2.0, 4.0, 5.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.125, -10.698486328125, -10.27197265625, -9.845458984375, -9.4189453125, -8.992431640625, -8.56591796875, -8.139404296875, -7.712890625, -7.286376953125, -6.85986328125, -6.433349609375, -6.0068359375, -5.580322265625, -5.15380859375, -4.727294921875, -4.30078125, -3.874267578125, -3.44775390625, -3.021240234375, -2.5947265625, -2.168212890625, -1.74169921875, -1.315185546875, -0.888671875, -0.462158203125, -0.03564453125, 0.390869140625, 0.8173828125, 1.243896484375, 1.67041015625, 2.096923828125, 2.5234375, 2.949951171875, 3.37646484375, 3.802978515625, 4.2294921875, 4.656005859375, 5.08251953125, 5.509033203125, 5.935546875, 6.362060546875, 6.78857421875, 7.215087890625, 7.6416015625, 8.068115234375, 8.49462890625, 8.921142578125, 9.34765625, 9.774169921875, 10.20068359375, 10.627197265625, 11.0537109375, 11.480224609375, 11.90673828125, 12.333251953125, 12.759765625, 13.186279296875, 13.61279296875, 14.039306640625, 14.4658203125, 14.892333984375, 15.31884765625, 15.745361328125, 16.171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 15.0, 15.0, 30.0, 55.0, 56.0, 111.0, 115.0, 128.0, 113.0, 115.0, 91.0, 40.0, 30.0, 19.0, 35.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04296875, -5.71893310546875, -5.3948974609375, -5.07086181640625, -4.746826171875, -4.42279052734375, -4.0987548828125, -3.77471923828125, -3.45068359375, -3.12664794921875, -2.8026123046875, -2.47857666015625, -2.154541015625, -1.83050537109375, -1.5064697265625, -1.18243408203125, -0.8583984375, -0.53436279296875, -0.2103271484375, 0.11370849609375, 0.437744140625, 0.76177978515625, 1.0858154296875, 1.40985107421875, 1.73388671875, 2.05792236328125, 2.3819580078125, 2.70599365234375, 3.030029296875, 3.35406494140625, 3.6781005859375, 4.00213623046875, 4.326171875, 4.65020751953125, 4.9742431640625, 5.29827880859375, 5.622314453125, 5.94635009765625, 6.2703857421875, 6.59442138671875, 6.91845703125, 7.24249267578125, 7.5665283203125, 7.89056396484375, 8.214599609375, 8.53863525390625, 8.8626708984375, 9.18670654296875, 9.5107421875, 9.83477783203125, 10.1588134765625, 10.48284912109375, 10.806884765625, 11.13092041015625, 11.4549560546875, 11.77899169921875, 12.10302734375, 12.42706298828125, 12.7510986328125, 13.07513427734375, 13.399169921875, 13.72320556640625, 14.0472412109375, 14.37127685546875, 14.6953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 11.0, 35.0, 82.0, 202.0, 303.0, 216.0, 90.0, 32.0, 17.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.82984924316406, -220.74945068359375, -215.66903686523438, -210.588623046875, -205.5082244873047, -200.42782592773438, -195.347412109375, -190.26699829101562, -185.1865997314453, -180.106201171875, -175.02578735351562, -169.94537353515625, -164.86497497558594, -159.78457641601562, -154.70416259765625, -149.62374877929688, -144.54335021972656, -139.46295166015625, -134.38253784179688, -129.3021240234375, -124.22172546386719, -119.14131927490234, -114.0609130859375, -108.98050689697266, -103.90010070800781, -98.81969451904297, -93.73928833007812, -88.65888214111328, -83.57847595214844, -78.4980697631836, -73.41766357421875, -68.3372573852539, -63.256858825683594, -58.17645263671875, -53.096046447753906, -48.01564025878906, -42.93523406982422, -37.854827880859375, -32.77442169189453, -27.694015502929688, -22.613609313964844, -17.533203125, -12.452796936035156, -7.3723907470703125, -2.2919845581054688, 2.788421630859375, 7.868827819824219, 12.949234008789062, 18.029640197753906, 23.11004638671875, 28.190452575683594, 33.27085876464844, 38.35126495361328, 43.431671142578125, 48.51207733154297, 53.59248352050781, 58.672889709472656, 63.7532958984375, 68.83370208740234, 73.91410827636719, 78.99451446533203, 84.07492065429688, 89.15532684326172, 94.23573303222656, 99.3161392211914]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 6.0, 10.0, 7.0, 12.0, 19.0, 24.0, 29.0, 27.0, 33.0, 41.0, 39.0, 51.0, 63.0, 53.0, 52.0, 51.0, 53.0, 48.0, 54.0, 42.0, 38.0, 42.0, 35.0, 30.0, 24.0, 22.0, 14.0, 14.0, 10.0, 15.0, 9.0, 10.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-77.57233428955078, -75.47307586669922, -73.37381744384766, -71.2745590209961, -69.17530059814453, -67.07604217529297, -64.9767837524414, -62.877525329589844, -60.77826690673828, -58.67900848388672, -56.579750061035156, -54.480491638183594, -52.38123321533203, -50.28197479248047, -48.182716369628906, -46.083457946777344, -43.98419952392578, -41.88494110107422, -39.785682678222656, -37.686424255371094, -35.58716583251953, -33.48790740966797, -31.388648986816406, -29.289390563964844, -27.19013214111328, -25.09087371826172, -22.991615295410156, -20.892356872558594, -18.79309844970703, -16.69384002685547, -14.594581604003906, -12.495323181152344, -10.396072387695312, -8.29681396484375, -6.1975555419921875, -4.098297119140625, -1.9990386962890625, 0.1002197265625, 2.1994781494140625, 4.298736572265625, 6.3979949951171875, 8.49725341796875, 10.596511840820312, 12.695770263671875, 14.795028686523438, 16.894287109375, 18.993545532226562, 21.092803955078125, 23.192062377929688, 25.29132080078125, 27.390579223632812, 29.489837646484375, 31.589096069335938, 33.6883544921875, 35.78761291503906, 37.886871337890625, 39.98612976074219, 42.08538818359375, 44.18464660644531, 46.283905029296875, 48.38316345214844, 50.482421875, 52.58168029785156, 54.680938720703125, 56.78019714355469]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 16.0, 10.0, 11.0, 22.0, 22.0, 38.0, 39.0, 37.0, 93.0, 135.0, 221.0, 379.0, 705.0, 1517.0, 3936.0, 15207.0, 101104.0, 3651623.0, 373664.0, 33619.0, 7446.0, 2408.0, 983.0, 436.0, 236.0, 145.0, 66.0, 46.0, 30.0, 17.0, 17.0, 11.0, 11.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.078125, -30.254150390625, -29.43017578125, -28.606201171875, -27.7822265625, -26.958251953125, -26.13427734375, -25.310302734375, -24.486328125, -23.662353515625, -22.83837890625, -22.014404296875, -21.1904296875, -20.366455078125, -19.54248046875, -18.718505859375, -17.89453125, -17.070556640625, -16.24658203125, -15.422607421875, -14.5986328125, -13.774658203125, -12.95068359375, -12.126708984375, -11.302734375, -10.478759765625, -9.65478515625, -8.830810546875, -8.0068359375, -7.182861328125, -6.35888671875, -5.534912109375, -4.7109375, -3.886962890625, -3.06298828125, -2.239013671875, -1.4150390625, -0.591064453125, 0.23291015625, 1.056884765625, 1.880859375, 2.704833984375, 3.52880859375, 4.352783203125, 5.1767578125, 6.000732421875, 6.82470703125, 7.648681640625, 8.47265625, 9.296630859375, 10.12060546875, 10.944580078125, 11.7685546875, 12.592529296875, 13.41650390625, 14.240478515625, 15.064453125, 15.888427734375, 16.71240234375, 17.536376953125, 18.3603515625, 19.184326171875, 20.00830078125, 20.832275390625, 21.65625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 17.0, 7.0, 12.0, 23.0, 38.0, 56.0, 51.0, 73.0, 49.0, 77.0, 72.0, 84.0, 83.0, 78.0, 55.0, 50.0, 47.0, 40.0, 25.0, 25.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.503265380859375, -2.42254638671875, -2.341827392578125, -2.2611083984375, -2.180389404296875, -2.09967041015625, -2.018951416015625, -1.938232421875, -1.857513427734375, -1.77679443359375, -1.696075439453125, -1.6153564453125, -1.534637451171875, -1.45391845703125, -1.373199462890625, -1.29248046875, -1.211761474609375, -1.13104248046875, -1.050323486328125, -0.9696044921875, -0.888885498046875, -0.80816650390625, -0.727447509765625, -0.646728515625, -0.566009521484375, -0.48529052734375, -0.404571533203125, -0.3238525390625, -0.243133544921875, -0.16241455078125, -0.081695556640625, -0.0009765625, 0.079742431640625, 0.16046142578125, 0.241180419921875, 0.3218994140625, 0.402618408203125, 0.48333740234375, 0.564056396484375, 0.644775390625, 0.725494384765625, 0.80621337890625, 0.886932373046875, 0.9676513671875, 1.048370361328125, 1.12908935546875, 1.209808349609375, 1.29052734375, 1.371246337890625, 1.45196533203125, 1.532684326171875, 1.6134033203125, 1.694122314453125, 1.77484130859375, 1.855560302734375, 1.936279296875, 2.016998291015625, 2.09771728515625, 2.178436279296875, 2.2591552734375, 2.339874267578125, 2.42059326171875, 2.501312255859375, 2.58203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 11.0, 15.0, 25.0, 35.0, 54.0, 91.0, 121.0, 179.0, 385.0, 843.0, 3254.0, 324884.0, 3856394.0, 5998.0, 1052.0, 427.0, 204.0, 121.0, 64.0, 48.0, 38.0, 22.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-108.3125, -105.8583984375, -103.404296875, -100.9501953125, -98.49609375, -96.0419921875, -93.587890625, -91.1337890625, -88.6796875, -86.2255859375, -83.771484375, -81.3173828125, -78.86328125, -76.4091796875, -73.955078125, -71.5009765625, -69.046875, -66.5927734375, -64.138671875, -61.6845703125, -59.23046875, -56.7763671875, -54.322265625, -51.8681640625, -49.4140625, -46.9599609375, -44.505859375, -42.0517578125, -39.59765625, -37.1435546875, -34.689453125, -32.2353515625, -29.78125, -27.3271484375, -24.873046875, -22.4189453125, -19.96484375, -17.5107421875, -15.056640625, -12.6025390625, -10.1484375, -7.6943359375, -5.240234375, -2.7861328125, -0.33203125, 2.1220703125, 4.576171875, 7.0302734375, 9.484375, 11.9384765625, 14.392578125, 16.8466796875, 19.30078125, 21.7548828125, 24.208984375, 26.6630859375, 29.1171875, 31.5712890625, 34.025390625, 36.4794921875, 38.93359375, 41.3876953125, 43.841796875, 46.2958984375, 48.75]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 28.0, 49.0, 123.0, 377.0, 1977.0, 1136.0, 234.0, 79.0, 42.0, 12.0, 9.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.578125, -17.239013671875, -16.89990234375, -16.560791015625, -16.2216796875, -15.882568359375, -15.54345703125, -15.204345703125, -14.865234375, -14.526123046875, -14.18701171875, -13.847900390625, -13.5087890625, -13.169677734375, -12.83056640625, -12.491455078125, -12.15234375, -11.813232421875, -11.47412109375, -11.135009765625, -10.7958984375, -10.456787109375, -10.11767578125, -9.778564453125, -9.439453125, -9.100341796875, -8.76123046875, -8.422119140625, -8.0830078125, -7.743896484375, -7.40478515625, -7.065673828125, -6.7265625, -6.387451171875, -6.04833984375, -5.709228515625, -5.3701171875, -5.031005859375, -4.69189453125, -4.352783203125, -4.013671875, -3.674560546875, -3.33544921875, -2.996337890625, -2.6572265625, -2.318115234375, -1.97900390625, -1.639892578125, -1.30078125, -0.961669921875, -0.62255859375, -0.283447265625, 0.0556640625, 0.394775390625, 0.73388671875, 1.072998046875, 1.412109375, 1.751220703125, 2.09033203125, 2.429443359375, 2.7685546875, 3.107666015625, 3.44677734375, 3.785888671875, 4.125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 18.0, 30.0, 123.0, 289.0, 314.0, 136.0, 43.0, 23.0, 15.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.5068130493164, -98.84917449951172, -96.1915283203125, -93.53388977050781, -90.87625122070312, -88.21861267089844, -85.56097412109375, -82.90332794189453, -80.24568939208984, -77.58805084228516, -74.93040466308594, -72.27276611328125, -69.61512756347656, -66.95748901367188, -64.29985046386719, -61.64220428466797, -58.98456573486328, -56.326927185058594, -53.66928482055664, -51.01164245605469, -48.35400390625, -45.69636535644531, -43.03872299194336, -40.381080627441406, -37.72344207763672, -35.06580352783203, -32.40816116333008, -29.750520706176758, -27.092880249023438, -24.435239791870117, -21.777599334716797, -19.119958877563477, -16.462326049804688, -13.804685592651367, -11.147045135498047, -8.489404678344727, -5.831764221191406, -3.174123764038086, -0.5164833068847656, 2.1411571502685547, 4.798797607421875, 7.456438064575195, 10.114078521728516, 12.771718978881836, 15.429359436035156, 18.086999893188477, 20.744640350341797, 23.402280807495117, 26.059921264648438, 28.717561721801758, 31.375202178955078, 34.03284454345703, 36.69048309326172, 39.348121643066406, 42.00576400756836, 44.66340637207031, 47.321044921875, 49.97868347167969, 52.63632583618164, 55.293968200683594, 57.95160675048828, 60.60924530029297, 63.26688766479492, 65.92453002929688, 68.58216857910156]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 1.0, 3.0, 5.0, 12.0, 13.0, 19.0, 34.0, 34.0, 45.0, 43.0, 55.0, 66.0, 62.0, 62.0, 78.0, 80.0, 66.0, 68.0, 65.0, 47.0, 32.0, 29.0, 24.0, 17.0, 8.0, 8.0, 13.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.922222137451172, -30.00249481201172, -29.082765579223633, -28.16303825378418, -27.243309020996094, -26.32358169555664, -25.403854370117188, -24.4841251373291, -23.564395904541016, -22.644668579101562, -21.724939346313477, -20.805212020874023, -19.885482788085938, -18.965755462646484, -18.04602813720703, -17.126298904418945, -16.206571578979492, -15.286843299865723, -14.367115020751953, -13.4473876953125, -12.527658462524414, -11.607931137084961, -10.688202857971191, -9.768474578857422, -8.848746299743652, -7.929018020629883, -7.009289741516113, -6.089561939239502, -5.169833660125732, -4.250105381011963, -3.3303775787353516, -2.410649299621582, -1.4909210205078125, -0.5711928606033325, 0.34853529930114746, 1.268263339996338, 2.1879916191101074, 3.107719898223877, 4.027447700500488, 4.947175979614258, 5.866904258728027, 6.786632537841797, 7.706360816955566, 8.626089096069336, 9.545816421508789, 10.465545654296875, 11.385272979736328, 12.305001258850098, 13.224729537963867, 14.144457817077637, 15.064186096191406, 15.98391342163086, 16.903642654418945, 17.8233699798584, 18.743099212646484, 19.662826538085938, 20.58255386352539, 21.502281188964844, 22.42201042175293, 23.341737747192383, 24.26146697998047, 25.181194305419922, 26.100921630859375, 27.02065086364746, 27.940380096435547]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 10.0, 11.0, 15.0, 38.0, 54.0, 110.0, 136.0, 259.0, 436.0, 871.0, 1904.0, 5426.0, 20251.0, 102728.0, 446840.0, 370878.0, 75164.0, 15480.0, 4461.0, 1676.0, 818.0, 418.0, 214.0, 141.0, 84.0, 45.0, 29.0, 17.0, 17.0, 9.0, 9.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.71875, -17.211181640625, -16.70361328125, -16.196044921875, -15.6884765625, -15.180908203125, -14.67333984375, -14.165771484375, -13.658203125, -13.150634765625, -12.64306640625, -12.135498046875, -11.6279296875, -11.120361328125, -10.61279296875, -10.105224609375, -9.59765625, -9.090087890625, -8.58251953125, -8.074951171875, -7.5673828125, -7.059814453125, -6.55224609375, -6.044677734375, -5.537109375, -5.029541015625, -4.52197265625, -4.014404296875, -3.5068359375, -2.999267578125, -2.49169921875, -1.984130859375, -1.4765625, -0.968994140625, -0.46142578125, 0.046142578125, 0.5537109375, 1.061279296875, 1.56884765625, 2.076416015625, 2.583984375, 3.091552734375, 3.59912109375, 4.106689453125, 4.6142578125, 5.121826171875, 5.62939453125, 6.136962890625, 6.64453125, 7.152099609375, 7.65966796875, 8.167236328125, 8.6748046875, 9.182373046875, 9.68994140625, 10.197509765625, 10.705078125, 11.212646484375, 11.72021484375, 12.227783203125, 12.7353515625, 13.242919921875, 13.75048828125, 14.258056640625, 14.765625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 3.0, 7.0, 14.0, 19.0, 25.0, 42.0, 47.0, 52.0, 55.0, 61.0, 83.0, 77.0, 80.0, 70.0, 75.0, 67.0, 51.0, 51.0, 33.0, 17.0, 14.0, 21.0, 6.0, 5.0, 5.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.25390625, -3.160919189453125, -3.06793212890625, -2.974945068359375, -2.8819580078125, -2.788970947265625, -2.69598388671875, -2.602996826171875, -2.510009765625, -2.417022705078125, -2.32403564453125, -2.231048583984375, -2.1380615234375, -2.045074462890625, -1.95208740234375, -1.859100341796875, -1.76611328125, -1.673126220703125, -1.58013916015625, -1.487152099609375, -1.3941650390625, -1.301177978515625, -1.20819091796875, -1.115203857421875, -1.022216796875, -0.929229736328125, -0.83624267578125, -0.743255615234375, -0.6502685546875, -0.557281494140625, -0.46429443359375, -0.371307373046875, -0.2783203125, -0.185333251953125, -0.09234619140625, 0.000640869140625, 0.0936279296875, 0.186614990234375, 0.27960205078125, 0.372589111328125, 0.465576171875, 0.558563232421875, 0.65155029296875, 0.744537353515625, 0.8375244140625, 0.930511474609375, 1.02349853515625, 1.116485595703125, 1.20947265625, 1.302459716796875, 1.39544677734375, 1.488433837890625, 1.5814208984375, 1.674407958984375, 1.76739501953125, 1.860382080078125, 1.953369140625, 2.046356201171875, 2.13934326171875, 2.232330322265625, 2.3253173828125, 2.418304443359375, 2.51129150390625, 2.604278564453125, 2.697265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 11.0, 14.0, 31.0, 27.0, 43.0, 56.0, 87.0, 103.0, 196.0, 276.0, 449.0, 812.0, 1776.0, 3973.0, 10439.0, 31431.0, 105631.0, 305083.0, 368524.0, 150565.0, 44627.0, 14557.0, 5156.0, 2155.0, 1053.0, 520.0, 316.0, 208.0, 119.0, 76.0, 57.0, 50.0, 27.0, 22.0, 22.0, 14.0, 13.0, 9.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.28955078125, -7.9462890625, -7.60302734375, -7.259765625, -6.91650390625, -6.5732421875, -6.22998046875, -5.88671875, -5.54345703125, -5.2001953125, -4.85693359375, -4.513671875, -4.17041015625, -3.8271484375, -3.48388671875, -3.140625, -2.79736328125, -2.4541015625, -2.11083984375, -1.767578125, -1.42431640625, -1.0810546875, -0.73779296875, -0.39453125, -0.05126953125, 0.2919921875, 0.63525390625, 0.978515625, 1.32177734375, 1.6650390625, 2.00830078125, 2.3515625, 2.69482421875, 3.0380859375, 3.38134765625, 3.724609375, 4.06787109375, 4.4111328125, 4.75439453125, 5.09765625, 5.44091796875, 5.7841796875, 6.12744140625, 6.470703125, 6.81396484375, 7.1572265625, 7.50048828125, 7.84375, 8.18701171875, 8.5302734375, 8.87353515625, 9.216796875, 9.56005859375, 9.9033203125, 10.24658203125, 10.58984375, 10.93310546875, 11.2763671875, 11.61962890625, 11.962890625, 12.30615234375, 12.6494140625, 12.99267578125, 13.3359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 6.0, 11.0, 6.0, 7.0, 11.0, 10.0, 12.0, 17.0, 15.0, 19.0, 24.0, 26.0, 27.0, 38.0, 52.0, 33.0, 45.0, 41.0, 40.0, 47.0, 50.0, 31.0, 44.0, 40.0, 34.0, 38.0, 31.0, 35.0, 37.0, 20.0, 25.0, 22.0, 18.0, 17.0, 13.0, 10.0, 12.0, 5.0, 7.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8671875, -8.573486328125, -8.27978515625, -7.986083984375, -7.6923828125, -7.398681640625, -7.10498046875, -6.811279296875, -6.517578125, -6.223876953125, -5.93017578125, -5.636474609375, -5.3427734375, -5.049072265625, -4.75537109375, -4.461669921875, -4.16796875, -3.874267578125, -3.58056640625, -3.286865234375, -2.9931640625, -2.699462890625, -2.40576171875, -2.112060546875, -1.818359375, -1.524658203125, -1.23095703125, -0.937255859375, -0.6435546875, -0.349853515625, -0.05615234375, 0.237548828125, 0.53125, 0.824951171875, 1.11865234375, 1.412353515625, 1.7060546875, 1.999755859375, 2.29345703125, 2.587158203125, 2.880859375, 3.174560546875, 3.46826171875, 3.761962890625, 4.0556640625, 4.349365234375, 4.64306640625, 4.936767578125, 5.23046875, 5.524169921875, 5.81787109375, 6.111572265625, 6.4052734375, 6.698974609375, 6.99267578125, 7.286376953125, 7.580078125, 7.873779296875, 8.16748046875, 8.461181640625, 8.7548828125, 9.048583984375, 9.34228515625, 9.635986328125, 9.9296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 8.0, 3.0, 15.0, 15.0, 18.0, 42.0, 67.0, 161.0, 298.0, 844.0, 3158.0, 18366.0, 153419.0, 651189.0, 192975.0, 22496.0, 3832.0, 954.0, 351.0, 160.0, 71.0, 36.0, 29.0, 16.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0625, -8.72119140625, -8.3798828125, -8.03857421875, -7.697265625, -7.35595703125, -7.0146484375, -6.67333984375, -6.33203125, -5.99072265625, -5.6494140625, -5.30810546875, -4.966796875, -4.62548828125, -4.2841796875, -3.94287109375, -3.6015625, -3.26025390625, -2.9189453125, -2.57763671875, -2.236328125, -1.89501953125, -1.5537109375, -1.21240234375, -0.87109375, -0.52978515625, -0.1884765625, 0.15283203125, 0.494140625, 0.83544921875, 1.1767578125, 1.51806640625, 1.859375, 2.20068359375, 2.5419921875, 2.88330078125, 3.224609375, 3.56591796875, 3.9072265625, 4.24853515625, 4.58984375, 4.93115234375, 5.2724609375, 5.61376953125, 5.955078125, 6.29638671875, 6.6376953125, 6.97900390625, 7.3203125, 7.66162109375, 8.0029296875, 8.34423828125, 8.685546875, 9.02685546875, 9.3681640625, 9.70947265625, 10.05078125, 10.39208984375, 10.7333984375, 11.07470703125, 11.416015625, 11.75732421875, 12.0986328125, 12.43994140625, 12.78125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 6.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 6.0, 13.0, 9.0, 18.0, 10.0, 15.0, 26.0, 23.0, 28.0, 29.0, 42.0, 52.0, 70.0, 62.0, 73.0, 74.0, 51.0, 41.0, 48.0, 61.0, 33.0, 35.0, 23.0, 20.0, 24.0, 14.0, 18.0, 14.0, 8.0, 6.0, 7.0, 9.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0008306503295898438, -0.0008045434951782227, -0.0007784366607666016, -0.0007523298263549805, -0.0007262229919433594, -0.0007001161575317383, -0.0006740093231201172, -0.0006479024887084961, -0.000621795654296875, -0.0005956888198852539, -0.0005695819854736328, -0.0005434751510620117, -0.0005173683166503906, -0.0004912614822387695, -0.00046515464782714844, -0.00043904781341552734, -0.00041294097900390625, -0.00038683414459228516, -0.00036072731018066406, -0.00033462047576904297, -0.0003085136413574219, -0.0002824068069458008, -0.0002562999725341797, -0.0002301931381225586, -0.0002040863037109375, -0.0001779794692993164, -0.0001518726348876953, -0.00012576580047607422, -9.965896606445312e-05, -7.355213165283203e-05, -4.744529724121094e-05, -2.1338462829589844e-05, 4.76837158203125e-06, 3.0875205993652344e-05, 5.698204040527344e-05, 8.308887481689453e-05, 0.00010919570922851562, 0.00013530254364013672, 0.0001614093780517578, 0.0001875162124633789, 0.000213623046875, 0.0002397298812866211, 0.0002658367156982422, 0.0002919435501098633, 0.0003180503845214844, 0.00034415721893310547, 0.00037026405334472656, 0.00039637088775634766, 0.00042247772216796875, 0.00044858455657958984, 0.00047469139099121094, 0.000500798225402832, 0.0005269050598144531, 0.0005530118942260742, 0.0005791187286376953, 0.0006052255630493164, 0.0006313323974609375, 0.0006574392318725586, 0.0006835460662841797, 0.0007096529006958008, 0.0007357597351074219, 0.000761866569519043, 0.0007879734039306641, 0.0008140802383422852, 0.0008401870727539062]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 8.0, 10.0, 11.0, 8.0, 29.0, 45.0, 54.0, 57.0, 110.0, 161.0, 299.0, 591.0, 1177.0, 2526.0, 6698.0, 19450.0, 68759.0, 265063.0, 461088.0, 160046.0, 41498.0, 12557.0, 4538.0, 1818.0, 854.0, 416.0, 241.0, 156.0, 88.0, 46.0, 41.0, 33.0, 19.0, 10.0, 10.0, 12.0, 8.0, 2.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.15625, -7.91851806640625, -7.6807861328125, -7.44305419921875, -7.205322265625, -6.96759033203125, -6.7298583984375, -6.49212646484375, -6.25439453125, -6.01666259765625, -5.7789306640625, -5.54119873046875, -5.303466796875, -5.06573486328125, -4.8280029296875, -4.59027099609375, -4.3525390625, -4.11480712890625, -3.8770751953125, -3.63934326171875, -3.401611328125, -3.16387939453125, -2.9261474609375, -2.68841552734375, -2.45068359375, -2.21295166015625, -1.9752197265625, -1.73748779296875, -1.499755859375, -1.26202392578125, -1.0242919921875, -0.78656005859375, -0.548828125, -0.31109619140625, -0.0733642578125, 0.16436767578125, 0.402099609375, 0.63983154296875, 0.8775634765625, 1.11529541015625, 1.35302734375, 1.59075927734375, 1.8284912109375, 2.06622314453125, 2.303955078125, 2.54168701171875, 2.7794189453125, 3.01715087890625, 3.2548828125, 3.49261474609375, 3.7303466796875, 3.96807861328125, 4.205810546875, 4.44354248046875, 4.6812744140625, 4.91900634765625, 5.15673828125, 5.39447021484375, 5.6322021484375, 5.86993408203125, 6.107666015625, 6.34539794921875, 6.5831298828125, 6.82086181640625, 7.05859375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 4.0, 8.0, 18.0, 10.0, 7.0, 21.0, 13.0, 24.0, 24.0, 29.0, 41.0, 34.0, 40.0, 36.0, 54.0, 51.0, 66.0, 41.0, 51.0, 48.0, 49.0, 48.0, 28.0, 43.0, 36.0, 25.0, 24.0, 24.0, 18.0, 14.0, 13.0, 9.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.371246337890625, -3.25225830078125, -3.133270263671875, -3.0142822265625, -2.895294189453125, -2.77630615234375, -2.657318115234375, -2.538330078125, -2.419342041015625, -2.30035400390625, -2.181365966796875, -2.0623779296875, -1.943389892578125, -1.82440185546875, -1.705413818359375, -1.58642578125, -1.467437744140625, -1.34844970703125, -1.229461669921875, -1.1104736328125, -0.991485595703125, -0.87249755859375, -0.753509521484375, -0.634521484375, -0.515533447265625, -0.39654541015625, -0.277557373046875, -0.1585693359375, -0.039581298828125, 0.07940673828125, 0.198394775390625, 0.3173828125, 0.436370849609375, 0.55535888671875, 0.674346923828125, 0.7933349609375, 0.912322998046875, 1.03131103515625, 1.150299072265625, 1.269287109375, 1.388275146484375, 1.50726318359375, 1.626251220703125, 1.7452392578125, 1.864227294921875, 1.98321533203125, 2.102203369140625, 2.22119140625, 2.340179443359375, 2.45916748046875, 2.578155517578125, 2.6971435546875, 2.816131591796875, 2.93511962890625, 3.054107666015625, 3.173095703125, 3.292083740234375, 3.41107177734375, 3.530059814453125, 3.6490478515625, 3.768035888671875, 3.88702392578125, 4.006011962890625, 4.125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 16.0, 22.0, 27.0, 55.0, 57.0, 94.0, 113.0, 132.0, 126.0, 96.0, 72.0, 58.0, 49.0, 21.0, 16.0, 9.0, 15.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.24492645263672, -87.00086975097656, -84.7568130493164, -82.51275634765625, -80.26869201660156, -78.0246353149414, -75.78057861328125, -73.5365219116211, -71.29246520996094, -69.04840850830078, -66.80435180664062, -64.56029510498047, -62.31623458862305, -60.07217788696289, -57.82811737060547, -55.58406066894531, -53.340003967285156, -51.095947265625, -48.851890563964844, -46.60783004760742, -44.363773345947266, -42.11971664428711, -39.87565612792969, -37.63159942626953, -35.387542724609375, -33.14348602294922, -30.89942741394043, -28.65536880493164, -26.411312103271484, -24.167255401611328, -21.92319679260254, -19.67913818359375, -17.435077667236328, -15.191020011901855, -12.946962356567383, -10.70290470123291, -8.458847045898438, -6.214789390563965, -3.970731735229492, -1.7266740798950195, 0.5173835754394531, 2.761441230773926, 5.005498886108398, 7.249556541442871, 9.493614196777344, 11.737671852111816, 13.981729507446289, 16.225788116455078, 18.469844818115234, 20.71390151977539, 22.95796012878418, 25.20201873779297, 27.446075439453125, 29.69013214111328, 31.93419075012207, 34.17824935913086, 36.422306060791016, 38.66636276245117, 40.910423278808594, 43.15447998046875, 45.398536682128906, 47.64259338378906, 49.88665008544922, 52.13071060180664, 54.3747673034668]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 3.0, 18.0, 12.0, 13.0, 21.0, 20.0, 22.0, 35.0, 34.0, 54.0, 53.0, 61.0, 54.0, 75.0, 70.0, 70.0, 60.0, 49.0, 43.0, 42.0, 36.0, 29.0, 27.0, 24.0, 16.0, 9.0, 14.0, 6.0, 8.0, 3.0, 8.0, 2.0, 0.0, 3.0, 3.0], "bins": [-111.98564147949219, -109.38790130615234, -106.79015350341797, -104.19241333007812, -101.59466552734375, -98.9969253540039, -96.39917755126953, -93.80143737792969, -91.20368957519531, -88.60594940185547, -86.0082015991211, -83.41046142578125, -80.81271362304688, -78.21497344970703, -75.61722564697266, -73.01948547363281, -70.42173767089844, -67.8239974975586, -65.22624969482422, -62.62850570678711, -60.03076171875, -57.43301773071289, -54.83527374267578, -52.23753356933594, -49.639793395996094, -47.042049407958984, -44.444305419921875, -41.846561431884766, -39.248817443847656, -36.65107345581055, -34.05332946777344, -31.45558738708496, -28.85784149169922, -26.26009750366211, -23.662353515625, -21.06460952758789, -18.46686553955078, -15.869122505187988, -13.271379470825195, -10.673635482788086, -8.075891494750977, -5.478147506713867, -2.880403995513916, -0.28266048431396484, 2.3150835037231445, 4.912827491760254, 7.510570526123047, 10.108314514160156, 12.706058502197266, 15.303802490234375, 17.901546478271484, 20.499290466308594, 23.097034454345703, 25.694778442382812, 28.29252052307129, 30.8902645111084, 33.488006591796875, 36.085750579833984, 38.683494567871094, 41.2812385559082, 43.87898254394531, 46.47672653198242, 49.07447052001953, 51.672210693359375, 54.26995849609375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 7.0, 19.0, 19.0, 23.0, 51.0, 54.0, 105.0, 181.0, 321.0, 668.0, 1886.0, 7921.0, 73054.0, 4006669.0, 90985.0, 9103.0, 1994.0, 620.0, 249.0, 145.0, 79.0, 30.0, 23.0, 20.0, 14.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.375, -40.21044921875, -39.0458984375, -37.88134765625, -36.716796875, -35.55224609375, -34.3876953125, -33.22314453125, -32.05859375, -30.89404296875, -29.7294921875, -28.56494140625, -27.400390625, -26.23583984375, -25.0712890625, -23.90673828125, -22.7421875, -21.57763671875, -20.4130859375, -19.24853515625, -18.083984375, -16.91943359375, -15.7548828125, -14.59033203125, -13.42578125, -12.26123046875, -11.0966796875, -9.93212890625, -8.767578125, -7.60302734375, -6.4384765625, -5.27392578125, -4.109375, -2.94482421875, -1.7802734375, -0.61572265625, 0.548828125, 1.71337890625, 2.8779296875, 4.04248046875, 5.20703125, 6.37158203125, 7.5361328125, 8.70068359375, 9.865234375, 11.02978515625, 12.1943359375, 13.35888671875, 14.5234375, 15.68798828125, 16.8525390625, 18.01708984375, 19.181640625, 20.34619140625, 21.5107421875, 22.67529296875, 23.83984375, 25.00439453125, 26.1689453125, 27.33349609375, 28.498046875, 29.66259765625, 30.8271484375, 31.99169921875, 33.15625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 10.0, 15.0, 18.0, 30.0, 37.0, 53.0, 72.0, 59.0, 73.0, 93.0, 91.0, 90.0, 73.0, 70.0, 54.0, 49.0, 35.0, 24.0, 12.0, 12.0, 6.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.48828125, -4.37396240234375, -4.2596435546875, -4.14532470703125, -4.031005859375, -3.91668701171875, -3.8023681640625, -3.68804931640625, -3.57373046875, -3.45941162109375, -3.3450927734375, -3.23077392578125, -3.116455078125, -3.00213623046875, -2.8878173828125, -2.77349853515625, -2.6591796875, -2.54486083984375, -2.4305419921875, -2.31622314453125, -2.201904296875, -2.08758544921875, -1.9732666015625, -1.85894775390625, -1.74462890625, -1.63031005859375, -1.5159912109375, -1.40167236328125, -1.287353515625, -1.17303466796875, -1.0587158203125, -0.94439697265625, -0.830078125, -0.71575927734375, -0.6014404296875, -0.48712158203125, -0.372802734375, -0.25848388671875, -0.1441650390625, -0.02984619140625, 0.08447265625, 0.19879150390625, 0.3131103515625, 0.42742919921875, 0.541748046875, 0.65606689453125, 0.7703857421875, 0.88470458984375, 0.9990234375, 1.11334228515625, 1.2276611328125, 1.34197998046875, 1.456298828125, 1.57061767578125, 1.6849365234375, 1.79925537109375, 1.91357421875, 2.02789306640625, 2.1422119140625, 2.25653076171875, 2.370849609375, 2.48516845703125, 2.5994873046875, 2.71380615234375, 2.828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 19.0, 26.0, 21.0, 38.0, 65.0, 95.0, 135.0, 253.0, 570.0, 1373.0, 4479.0, 20799.0, 261151.0, 3796117.0, 92048.0, 11907.0, 2865.0, 1135.0, 513.0, 263.0, 135.0, 93.0, 46.0, 47.0, 19.0, 19.0, 12.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.337890625, -32.39453125, -31.451171875, -30.5078125, -29.564453125, -28.62109375, -27.677734375, -26.734375, -25.791015625, -24.84765625, -23.904296875, -22.9609375, -22.017578125, -21.07421875, -20.130859375, -19.1875, -18.244140625, -17.30078125, -16.357421875, -15.4140625, -14.470703125, -13.52734375, -12.583984375, -11.640625, -10.697265625, -9.75390625, -8.810546875, -7.8671875, -6.923828125, -5.98046875, -5.037109375, -4.09375, -3.150390625, -2.20703125, -1.263671875, -0.3203125, 0.623046875, 1.56640625, 2.509765625, 3.453125, 4.396484375, 5.33984375, 6.283203125, 7.2265625, 8.169921875, 9.11328125, 10.056640625, 11.0, 11.943359375, 12.88671875, 13.830078125, 14.7734375, 15.716796875, 16.66015625, 17.603515625, 18.546875, 19.490234375, 20.43359375, 21.376953125, 22.3203125, 23.263671875, 24.20703125, 25.150390625, 26.09375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 11.0, 9.0, 13.0, 22.0, 45.0, 53.0, 87.0, 152.0, 317.0, 884.0, 1445.0, 492.0, 194.0, 118.0, 57.0, 44.0, 36.0, 16.0, 19.0, 11.0, 10.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.78924560546875, -4.6253662109375, -4.46148681640625, -4.297607421875, -4.13372802734375, -3.9698486328125, -3.80596923828125, -3.64208984375, -3.47821044921875, -3.3143310546875, -3.15045166015625, -2.986572265625, -2.82269287109375, -2.6588134765625, -2.49493408203125, -2.3310546875, -2.16717529296875, -2.0032958984375, -1.83941650390625, -1.675537109375, -1.51165771484375, -1.3477783203125, -1.18389892578125, -1.02001953125, -0.85614013671875, -0.6922607421875, -0.52838134765625, -0.364501953125, -0.20062255859375, -0.0367431640625, 0.12713623046875, 0.291015625, 0.45489501953125, 0.6187744140625, 0.78265380859375, 0.946533203125, 1.11041259765625, 1.2742919921875, 1.43817138671875, 1.60205078125, 1.76593017578125, 1.9298095703125, 2.09368896484375, 2.257568359375, 2.42144775390625, 2.5853271484375, 2.74920654296875, 2.9130859375, 3.07696533203125, 3.2408447265625, 3.40472412109375, 3.568603515625, 3.73248291015625, 3.8963623046875, 4.06024169921875, 4.22412109375, 4.38800048828125, 4.5518798828125, 4.71575927734375, 4.879638671875, 5.04351806640625, 5.2073974609375, 5.37127685546875, 5.53515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 20.0, 79.0, 250.0, 420.0, 171.0, 54.0, 17.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.04430389404297, -35.18310546875, -32.32190704345703, -29.460708618164062, -26.599510192871094, -23.738311767578125, -20.877113342285156, -18.015914916992188, -15.154716491699219, -12.29351806640625, -9.432319641113281, -6.5711212158203125, -3.7099227905273438, -0.848724365234375, 2.0124740600585938, 4.8736724853515625, 7.734870910644531, 10.5960693359375, 13.457267761230469, 16.318466186523438, 19.179664611816406, 22.040863037109375, 24.902061462402344, 27.763259887695312, 30.62445831298828, 33.48565673828125, 36.34685516357422, 39.20805358886719, 42.069252014160156, 44.930450439453125, 47.791648864746094, 50.65284729003906, 53.5140380859375, 56.37523651123047, 59.23643493652344, 62.097633361816406, 64.95883178710938, 67.82003021240234, 70.68122863769531, 73.54242706298828, 76.40362548828125, 79.26482391357422, 82.12602233886719, 84.98722076416016, 87.84841918945312, 90.7096176147461, 93.57081604003906, 96.43201446533203, 99.293212890625, 102.15441131591797, 105.01560974121094, 107.8768081665039, 110.73800659179688, 113.59920501708984, 116.46040344238281, 119.32160186767578, 122.18280029296875, 125.04399871826172, 127.90519714355469, 130.76638793945312, 133.62759399414062, 136.48880004882812, 139.34999084472656, 142.211181640625, 145.0723876953125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 9.0, 8.0, 5.0, 10.0, 13.0, 27.0, 25.0, 26.0, 36.0, 42.0, 39.0, 39.0, 73.0, 55.0, 62.0, 78.0, 73.0, 67.0, 54.0, 52.0, 39.0, 38.0, 33.0, 28.0, 20.0, 16.0, 9.0, 9.0, 6.0, 7.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.02696418762207, -14.356404304504395, -13.685843467712402, -13.015283584594727, -12.344722747802734, -11.674162864685059, -11.003602981567383, -10.33304214477539, -9.662482261657715, -8.991922378540039, -8.321361541748047, -7.650801658630371, -6.980241298675537, -6.309680938720703, -5.639121055603027, -4.968560695648193, -4.298000335693359, -3.6274399757385254, -2.9568798542022705, -2.2863197326660156, -1.6157593727111816, -0.9451990127563477, -0.2746391296386719, 0.3959212303161621, 1.066481590270996, 1.7370418310165405, 2.407602071762085, 3.07816219329834, 3.748722553253174, 4.419282913208008, 5.089842796325684, 5.760403156280518, 6.430961608886719, 7.101521968841553, 7.772082328796387, 8.442642211914062, 9.113203048706055, 9.78376293182373, 10.454322814941406, 11.124883651733398, 11.795443534851074, 12.46600341796875, 13.136564254760742, 13.807124137878418, 14.477684020996094, 15.148244857788086, 15.818804740905762, 16.489364624023438, 17.15992546081543, 17.830486297607422, 18.50104522705078, 19.171606063842773, 19.842166900634766, 20.512725830078125, 21.183286666870117, 21.85384750366211, 22.52440643310547, 23.19496726989746, 23.86552619934082, 24.536087036132812, 25.206647872924805, 25.877208709716797, 26.547767639160156, 27.21832847595215, 27.88888931274414]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 3.0, 11.0, 7.0, 12.0, 27.0, 29.0, 39.0, 46.0, 58.0, 114.0, 140.0, 229.0, 371.0, 694.0, 1288.0, 2707.0, 6335.0, 18966.0, 72624.0, 289164.0, 446956.0, 152175.0, 37231.0, 10946.0, 4162.0, 1890.0, 888.0, 533.0, 325.0, 188.0, 112.0, 78.0, 36.0, 45.0, 26.0, 22.0, 8.0, 13.0, 13.0, 5.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-14.875, -14.4407958984375, -14.006591796875, -13.5723876953125, -13.13818359375, -12.7039794921875, -12.269775390625, -11.8355712890625, -11.4013671875, -10.9671630859375, -10.532958984375, -10.0987548828125, -9.66455078125, -9.2303466796875, -8.796142578125, -8.3619384765625, -7.927734375, -7.4935302734375, -7.059326171875, -6.6251220703125, -6.19091796875, -5.7567138671875, -5.322509765625, -4.8883056640625, -4.4541015625, -4.0198974609375, -3.585693359375, -3.1514892578125, -2.71728515625, -2.2830810546875, -1.848876953125, -1.4146728515625, -0.98046875, -0.5462646484375, -0.112060546875, 0.3221435546875, 0.75634765625, 1.1905517578125, 1.624755859375, 2.0589599609375, 2.4931640625, 2.9273681640625, 3.361572265625, 3.7957763671875, 4.22998046875, 4.6641845703125, 5.098388671875, 5.5325927734375, 5.966796875, 6.4010009765625, 6.835205078125, 7.2694091796875, 7.70361328125, 8.1378173828125, 8.572021484375, 9.0062255859375, 9.4404296875, 9.8746337890625, 10.308837890625, 10.7430419921875, 11.17724609375, 11.6114501953125, 12.045654296875, 12.4798583984375, 12.9140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 10.0, 10.0, 16.0, 21.0, 24.0, 31.0, 49.0, 51.0, 61.0, 65.0, 78.0, 85.0, 68.0, 71.0, 61.0, 54.0, 41.0, 53.0, 39.0, 27.0, 20.0, 23.0, 12.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.568359375, -3.469635009765625, -3.37091064453125, -3.272186279296875, -3.1734619140625, -3.074737548828125, -2.97601318359375, -2.877288818359375, -2.778564453125, -2.679840087890625, -2.58111572265625, -2.482391357421875, -2.3836669921875, -2.284942626953125, -2.18621826171875, -2.087493896484375, -1.98876953125, -1.890045166015625, -1.79132080078125, -1.692596435546875, -1.5938720703125, -1.495147705078125, -1.39642333984375, -1.297698974609375, -1.198974609375, -1.100250244140625, -1.00152587890625, -0.902801513671875, -0.8040771484375, -0.705352783203125, -0.60662841796875, -0.507904052734375, -0.4091796875, -0.310455322265625, -0.21173095703125, -0.113006591796875, -0.0142822265625, 0.084442138671875, 0.18316650390625, 0.281890869140625, 0.380615234375, 0.479339599609375, 0.57806396484375, 0.676788330078125, 0.7755126953125, 0.874237060546875, 0.97296142578125, 1.071685791015625, 1.17041015625, 1.269134521484375, 1.36785888671875, 1.466583251953125, 1.5653076171875, 1.664031982421875, 1.76275634765625, 1.861480712890625, 1.960205078125, 2.058929443359375, 2.15765380859375, 2.256378173828125, 2.3551025390625, 2.453826904296875, 2.55255126953125, 2.651275634765625, 2.75]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 3.0, 8.0, 11.0, 12.0, 14.0, 24.0, 30.0, 39.0, 55.0, 116.0, 185.0, 323.0, 601.0, 1299.0, 3195.0, 11056.0, 58278.0, 371118.0, 490866.0, 88745.0, 15452.0, 4010.0, 1498.0, 716.0, 326.0, 218.0, 112.0, 70.0, 41.0, 40.0, 19.0, 17.0, 8.0, 8.0, 9.0, 11.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.140625, -17.57568359375, -17.0107421875, -16.44580078125, -15.880859375, -15.31591796875, -14.7509765625, -14.18603515625, -13.62109375, -13.05615234375, -12.4912109375, -11.92626953125, -11.361328125, -10.79638671875, -10.2314453125, -9.66650390625, -9.1015625, -8.53662109375, -7.9716796875, -7.40673828125, -6.841796875, -6.27685546875, -5.7119140625, -5.14697265625, -4.58203125, -4.01708984375, -3.4521484375, -2.88720703125, -2.322265625, -1.75732421875, -1.1923828125, -0.62744140625, -0.0625, 0.50244140625, 1.0673828125, 1.63232421875, 2.197265625, 2.76220703125, 3.3271484375, 3.89208984375, 4.45703125, 5.02197265625, 5.5869140625, 6.15185546875, 6.716796875, 7.28173828125, 7.8466796875, 8.41162109375, 8.9765625, 9.54150390625, 10.1064453125, 10.67138671875, 11.236328125, 11.80126953125, 12.3662109375, 12.93115234375, 13.49609375, 14.06103515625, 14.6259765625, 15.19091796875, 15.755859375, 16.32080078125, 16.8857421875, 17.45068359375, 18.015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 3.0, 8.0, 4.0, 6.0, 13.0, 15.0, 22.0, 35.0, 20.0, 38.0, 39.0, 37.0, 37.0, 55.0, 50.0, 57.0, 46.0, 54.0, 66.0, 51.0, 29.0, 39.0, 43.0, 37.0, 32.0, 23.0, 24.0, 25.0, 14.0, 13.0, 11.0, 10.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.7421875, -12.3714599609375, -12.000732421875, -11.6300048828125, -11.25927734375, -10.8885498046875, -10.517822265625, -10.1470947265625, -9.7763671875, -9.4056396484375, -9.034912109375, -8.6641845703125, -8.29345703125, -7.9227294921875, -7.552001953125, -7.1812744140625, -6.810546875, -6.4398193359375, -6.069091796875, -5.6983642578125, -5.32763671875, -4.9569091796875, -4.586181640625, -4.2154541015625, -3.8447265625, -3.4739990234375, -3.103271484375, -2.7325439453125, -2.36181640625, -1.9910888671875, -1.620361328125, -1.2496337890625, -0.87890625, -0.5081787109375, -0.137451171875, 0.2332763671875, 0.60400390625, 0.9747314453125, 1.345458984375, 1.7161865234375, 2.0869140625, 2.4576416015625, 2.828369140625, 3.1990966796875, 3.56982421875, 3.9405517578125, 4.311279296875, 4.6820068359375, 5.052734375, 5.4234619140625, 5.794189453125, 6.1649169921875, 6.53564453125, 6.9063720703125, 7.277099609375, 7.6478271484375, 8.0185546875, 8.3892822265625, 8.760009765625, 9.1307373046875, 9.50146484375, 9.8721923828125, 10.242919921875, 10.6136474609375, 10.984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 6.0, 10.0, 16.0, 18.0, 34.0, 67.0, 110.0, 197.0, 437.0, 1191.0, 4167.0, 17999.0, 126777.0, 645932.0, 215863.0, 27332.0, 5618.0, 1648.0, 594.0, 246.0, 102.0, 72.0, 26.0, 33.0, 14.0, 13.0, 9.0, 7.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.4593505859375, -8.153076171875, -7.8468017578125, -7.54052734375, -7.2342529296875, -6.927978515625, -6.6217041015625, -6.3154296875, -6.0091552734375, -5.702880859375, -5.3966064453125, -5.09033203125, -4.7840576171875, -4.477783203125, -4.1715087890625, -3.865234375, -3.5589599609375, -3.252685546875, -2.9464111328125, -2.64013671875, -2.3338623046875, -2.027587890625, -1.7213134765625, -1.4150390625, -1.1087646484375, -0.802490234375, -0.4962158203125, -0.18994140625, 0.1163330078125, 0.422607421875, 0.7288818359375, 1.03515625, 1.3414306640625, 1.647705078125, 1.9539794921875, 2.26025390625, 2.5665283203125, 2.872802734375, 3.1790771484375, 3.4853515625, 3.7916259765625, 4.097900390625, 4.4041748046875, 4.71044921875, 5.0167236328125, 5.322998046875, 5.6292724609375, 5.935546875, 6.2418212890625, 6.548095703125, 6.8543701171875, 7.16064453125, 7.4669189453125, 7.773193359375, 8.0794677734375, 8.3857421875, 8.6920166015625, 8.998291015625, 9.3045654296875, 9.61083984375, 9.9171142578125, 10.223388671875, 10.5296630859375, 10.8359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 8.0, 7.0, 17.0, 13.0, 27.0, 39.0, 43.0, 56.0, 63.0, 91.0, 90.0, 107.0, 101.0, 86.0, 67.0, 41.0, 26.0, 30.0, 19.0, 12.0, 15.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010395050048828125, -0.0010012388229370117, -0.0009629726409912109, -0.0009247064590454102, -0.0008864402770996094, -0.0008481740951538086, -0.0008099079132080078, -0.000771641731262207, -0.0007333755493164062, -0.0006951093673706055, -0.0006568431854248047, -0.0006185770034790039, -0.0005803108215332031, -0.0005420446395874023, -0.0005037784576416016, -0.0004655122756958008, -0.00042724609375, -0.0003889799118041992, -0.00035071372985839844, -0.00031244754791259766, -0.0002741813659667969, -0.0002359151840209961, -0.0001976490020751953, -0.00015938282012939453, -0.00012111663818359375, -8.285045623779297e-05, -4.458427429199219e-05, -6.318092346191406e-06, 3.1948089599609375e-05, 7.021427154541016e-05, 0.00010848045349121094, 0.00014674663543701172, 0.0001850128173828125, 0.00022327899932861328, 0.00026154518127441406, 0.00029981136322021484, 0.0003380775451660156, 0.0003763437271118164, 0.0004146099090576172, 0.00045287609100341797, 0.0004911422729492188, 0.0005294084548950195, 0.0005676746368408203, 0.0006059408187866211, 0.0006442070007324219, 0.0006824731826782227, 0.0007207393646240234, 0.0007590055465698242, 0.000797271728515625, 0.0008355379104614258, 0.0008738040924072266, 0.0009120702743530273, 0.0009503364562988281, 0.000988602638244629, 0.0010268688201904297, 0.0010651350021362305, 0.0011034011840820312, 0.001141667366027832, 0.0011799335479736328, 0.0012181997299194336, 0.0012564659118652344, 0.0012947320938110352, 0.001332998275756836, 0.0013712644577026367, 0.0014095306396484375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 2.0, 4.0, 6.0, 16.0, 18.0, 37.0, 47.0, 116.0, 188.0, 465.0, 1181.0, 4350.0, 30477.0, 430308.0, 534977.0, 38944.0, 5151.0, 1290.0, 485.0, 229.0, 105.0, 71.0, 32.0, 24.0, 5.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -13.083984375, -12.67578125, -12.267578125, -11.859375, -11.451171875, -11.04296875, -10.634765625, -10.2265625, -9.818359375, -9.41015625, -9.001953125, -8.59375, -8.185546875, -7.77734375, -7.369140625, -6.9609375, -6.552734375, -6.14453125, -5.736328125, -5.328125, -4.919921875, -4.51171875, -4.103515625, -3.6953125, -3.287109375, -2.87890625, -2.470703125, -2.0625, -1.654296875, -1.24609375, -0.837890625, -0.4296875, -0.021484375, 0.38671875, 0.794921875, 1.203125, 1.611328125, 2.01953125, 2.427734375, 2.8359375, 3.244140625, 3.65234375, 4.060546875, 4.46875, 4.876953125, 5.28515625, 5.693359375, 6.1015625, 6.509765625, 6.91796875, 7.326171875, 7.734375, 8.142578125, 8.55078125, 8.958984375, 9.3671875, 9.775390625, 10.18359375, 10.591796875, 11.0, 11.408203125, 11.81640625, 12.224609375, 12.6328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 5.0, 5.0, 18.0, 23.0, 33.0, 46.0, 56.0, 67.0, 73.0, 99.0, 101.0, 84.0, 84.0, 66.0, 62.0, 52.0, 26.0, 24.0, 14.0, 20.0, 7.0, 5.0, 5.0, 8.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4140625, -5.21759033203125, -5.0211181640625, -4.82464599609375, -4.628173828125, -4.43170166015625, -4.2352294921875, -4.03875732421875, -3.84228515625, -3.64581298828125, -3.4493408203125, -3.25286865234375, -3.056396484375, -2.85992431640625, -2.6634521484375, -2.46697998046875, -2.2705078125, -2.07403564453125, -1.8775634765625, -1.68109130859375, -1.484619140625, -1.28814697265625, -1.0916748046875, -0.89520263671875, -0.69873046875, -0.50225830078125, -0.3057861328125, -0.10931396484375, 0.087158203125, 0.28363037109375, 0.4801025390625, 0.67657470703125, 0.873046875, 1.06951904296875, 1.2659912109375, 1.46246337890625, 1.658935546875, 1.85540771484375, 2.0518798828125, 2.24835205078125, 2.44482421875, 2.64129638671875, 2.8377685546875, 3.03424072265625, 3.230712890625, 3.42718505859375, 3.6236572265625, 3.82012939453125, 4.0166015625, 4.21307373046875, 4.4095458984375, 4.60601806640625, 4.802490234375, 4.99896240234375, 5.1954345703125, 5.39190673828125, 5.58837890625, 5.78485107421875, 5.9813232421875, 6.17779541015625, 6.374267578125, 6.57073974609375, 6.7672119140625, 6.96368408203125, 7.16015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 13.0, 48.0, 184.0, 400.0, 256.0, 76.0, 23.0, 9.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.12338256835938, -157.109130859375, -149.09487915039062, -141.08062744140625, -133.06637573242188, -125.05211639404297, -117.03785705566406, -109.02360534667969, -101.00935363769531, -92.99510192871094, -84.98085021972656, -76.96659088134766, -68.95233917236328, -60.938087463378906, -52.923831939697266, -44.909576416015625, -36.89532470703125, -28.881071090698242, -20.866817474365234, -12.852563858032227, -4.838310241699219, 3.1759414672851562, 11.190196990966797, 19.204452514648438, 27.218704223632812, 35.23295593261719, 43.24721145629883, 51.26146697998047, 59.275718688964844, 67.28997039794922, 75.30422973632812, 83.3184814453125, 91.332763671875, 99.34701538085938, 107.36126708984375, 115.37552642822266, 123.38977813720703, 131.40402221679688, 139.4182891845703, 147.4325408935547, 155.44679260253906, 163.46104431152344, 171.4752960205078, 179.4895477294922, 187.50381469726562, 195.51806640625, 203.53231811523438, 211.54656982421875, 219.56082153320312, 227.5750732421875, 235.58932495117188, 243.60357666015625, 251.61782836914062, 259.632080078125, 267.6463317871094, 275.66058349609375, 283.67486572265625, 291.6891174316406, 299.703369140625, 307.7176208496094, 315.73187255859375, 323.7461242675781, 331.7603759765625, 339.774658203125, 347.78887939453125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 7.0, 5.0, 17.0, 10.0, 16.0, 7.0, 15.0, 22.0, 17.0, 28.0, 32.0, 34.0, 38.0, 37.0, 52.0, 46.0, 50.0, 45.0, 57.0, 49.0, 42.0, 51.0, 36.0, 47.0, 44.0, 28.0, 25.0, 19.0, 21.0, 16.0, 16.0, 14.0, 12.0, 7.0, 10.0, 9.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-66.31913757324219, -64.38018798828125, -62.44123840332031, -60.502288818359375, -58.56333923339844, -56.6243896484375, -54.68544006347656, -52.746490478515625, -50.80754089355469, -48.86859130859375, -46.92964172363281, -44.990692138671875, -43.05174255371094, -41.11279296875, -39.17384338378906, -37.234893798828125, -35.29594802856445, -33.356998443603516, -31.418048858642578, -29.47909927368164, -27.540149688720703, -25.601200103759766, -23.66225242614746, -21.723302841186523, -19.784353256225586, -17.84540367126465, -15.906454086303711, -13.96750545501709, -12.028555870056152, -10.089606285095215, -8.150657653808594, -6.211708068847656, -4.272762298583984, -2.333812952041626, -0.3948636054992676, 1.5440855026245117, 3.483035087585449, 5.421984672546387, 7.360933303833008, 9.299882888793945, 11.238832473754883, 13.17778205871582, 15.116731643676758, 17.055679321289062, 18.99462890625, 20.933578491210938, 22.872528076171875, 24.811477661132812, 26.75042724609375, 28.689376831054688, 30.628326416015625, 32.56727600097656, 34.5062255859375, 36.44517517089844, 38.384124755859375, 40.32307434082031, 42.26202392578125, 44.20097351074219, 46.139923095703125, 48.07887268066406, 50.017822265625, 51.95677185058594, 53.895721435546875, 55.83467102050781, 57.773616790771484]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 4.0, 6.0, 9.0, 12.0, 14.0, 21.0, 17.0, 27.0, 39.0, 43.0, 64.0, 87.0, 122.0, 142.0, 248.0, 375.0, 648.0, 1261.0, 2689.0, 6780.0, 22266.0, 128284.0, 3675742.0, 303522.0, 35211.0, 9738.0, 3599.0, 1588.0, 710.0, 418.0, 190.0, 132.0, 91.0, 46.0, 42.0, 21.0, 22.0, 8.0, 8.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.203125, -22.533447265625, -21.86376953125, -21.194091796875, -20.5244140625, -19.854736328125, -19.18505859375, -18.515380859375, -17.845703125, -17.176025390625, -16.50634765625, -15.836669921875, -15.1669921875, -14.497314453125, -13.82763671875, -13.157958984375, -12.48828125, -11.818603515625, -11.14892578125, -10.479248046875, -9.8095703125, -9.139892578125, -8.47021484375, -7.800537109375, -7.130859375, -6.461181640625, -5.79150390625, -5.121826171875, -4.4521484375, -3.782470703125, -3.11279296875, -2.443115234375, -1.7734375, -1.103759765625, -0.43408203125, 0.235595703125, 0.9052734375, 1.574951171875, 2.24462890625, 2.914306640625, 3.583984375, 4.253662109375, 4.92333984375, 5.593017578125, 6.2626953125, 6.932373046875, 7.60205078125, 8.271728515625, 8.94140625, 9.611083984375, 10.28076171875, 10.950439453125, 11.6201171875, 12.289794921875, 12.95947265625, 13.629150390625, 14.298828125, 14.968505859375, 15.63818359375, 16.307861328125, 16.9775390625, 17.647216796875, 18.31689453125, 18.986572265625, 19.65625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 11.0, 14.0, 13.0, 12.0, 23.0, 24.0, 38.0, 35.0, 38.0, 57.0, 56.0, 62.0, 67.0, 82.0, 67.0, 67.0, 48.0, 60.0, 38.0, 48.0, 38.0, 19.0, 17.0, 13.0, 14.0, 12.0, 8.0, 6.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.92877197265625, -2.8360595703125, -2.74334716796875, -2.650634765625, -2.55792236328125, -2.4652099609375, -2.37249755859375, -2.27978515625, -2.18707275390625, -2.0943603515625, -2.00164794921875, -1.908935546875, -1.81622314453125, -1.7235107421875, -1.63079833984375, -1.5380859375, -1.44537353515625, -1.3526611328125, -1.25994873046875, -1.167236328125, -1.07452392578125, -0.9818115234375, -0.88909912109375, -0.79638671875, -0.70367431640625, -0.6109619140625, -0.51824951171875, -0.425537109375, -0.33282470703125, -0.2401123046875, -0.14739990234375, -0.0546875, 0.03802490234375, 0.1307373046875, 0.22344970703125, 0.316162109375, 0.40887451171875, 0.5015869140625, 0.59429931640625, 0.68701171875, 0.77972412109375, 0.8724365234375, 0.96514892578125, 1.057861328125, 1.15057373046875, 1.2432861328125, 1.33599853515625, 1.4287109375, 1.52142333984375, 1.6141357421875, 1.70684814453125, 1.799560546875, 1.89227294921875, 1.9849853515625, 2.07769775390625, 2.17041015625, 2.26312255859375, 2.3558349609375, 2.44854736328125, 2.541259765625, 2.63397216796875, 2.7266845703125, 2.81939697265625, 2.912109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 10.0, 17.0, 21.0, 26.0, 51.0, 79.0, 151.0, 260.0, 544.0, 1201.0, 4048.0, 51707.0, 4067581.0, 62413.0, 4071.0, 1151.0, 444.0, 207.0, 118.0, 71.0, 43.0, 25.0, 12.0, 14.0, 3.0, 9.0, 0.0, 4.0, 2.0], "bins": [-83.5625, -81.80419921875, -80.0458984375, -78.28759765625, -76.529296875, -74.77099609375, -73.0126953125, -71.25439453125, -69.49609375, -67.73779296875, -65.9794921875, -64.22119140625, -62.462890625, -60.70458984375, -58.9462890625, -57.18798828125, -55.4296875, -53.67138671875, -51.9130859375, -50.15478515625, -48.396484375, -46.63818359375, -44.8798828125, -43.12158203125, -41.36328125, -39.60498046875, -37.8466796875, -36.08837890625, -34.330078125, -32.57177734375, -30.8134765625, -29.05517578125, -27.296875, -25.53857421875, -23.7802734375, -22.02197265625, -20.263671875, -18.50537109375, -16.7470703125, -14.98876953125, -13.23046875, -11.47216796875, -9.7138671875, -7.95556640625, -6.197265625, -4.43896484375, -2.6806640625, -0.92236328125, 0.8359375, 2.59423828125, 4.3525390625, 6.11083984375, 7.869140625, 9.62744140625, 11.3857421875, 13.14404296875, 14.90234375, 16.66064453125, 18.4189453125, 20.17724609375, 21.935546875, 23.69384765625, 25.4521484375, 27.21044921875, 28.96875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 8.0, 16.0, 28.0, 51.0, 137.0, 396.0, 1584.0, 1302.0, 307.0, 122.0, 50.0, 32.0, 17.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.515625, -20.11285400390625, -19.7100830078125, -19.30731201171875, -18.904541015625, -18.50177001953125, -18.0989990234375, -17.69622802734375, -17.29345703125, -16.89068603515625, -16.4879150390625, -16.08514404296875, -15.682373046875, -15.27960205078125, -14.8768310546875, -14.47406005859375, -14.0712890625, -13.66851806640625, -13.2657470703125, -12.86297607421875, -12.460205078125, -12.05743408203125, -11.6546630859375, -11.25189208984375, -10.84912109375, -10.44635009765625, -10.0435791015625, -9.64080810546875, -9.238037109375, -8.83526611328125, -8.4324951171875, -8.02972412109375, -7.626953125, -7.22418212890625, -6.8214111328125, -6.41864013671875, -6.015869140625, -5.61309814453125, -5.2103271484375, -4.80755615234375, -4.40478515625, -4.00201416015625, -3.5992431640625, -3.19647216796875, -2.793701171875, -2.39093017578125, -1.9881591796875, -1.58538818359375, -1.1826171875, -0.77984619140625, -0.3770751953125, 0.02569580078125, 0.428466796875, 0.83123779296875, 1.2340087890625, 1.63677978515625, 2.03955078125, 2.44232177734375, 2.8450927734375, 3.24786376953125, 3.650634765625, 4.05340576171875, 4.4561767578125, 4.85894775390625, 5.26171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 43.0, 210.0, 443.0, 235.0, 48.0, 10.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.90866088867188, -76.64916229248047, -71.38965606689453, -66.13015747070312, -60.87065505981445, -55.61115264892578, -50.351654052734375, -45.0921516418457, -39.83264923095703, -34.57314682006836, -29.31364631652832, -24.05414581298828, -18.79464340209961, -13.535140991210938, -8.275640487670898, -3.0161399841308594, 2.2433624267578125, 7.502863883972168, 12.762365341186523, 18.021865844726562, 23.281368255615234, 28.540870666503906, 33.80036926269531, 39.059871673583984, 44.319374084472656, 49.57887649536133, 54.83837890625, 60.097877502441406, 65.35737609863281, 70.61688232421875, 75.87638092041016, 81.13587951660156, 86.3953857421875, 91.6548843383789, 96.91439056396484, 102.17388916015625, 107.43339538574219, 112.6928939819336, 117.952392578125, 123.21189880371094, 128.47140502929688, 133.7309112548828, 138.9904022216797, 144.24990844726562, 149.50941467285156, 154.7689208984375, 160.02841186523438, 165.2879180908203, 170.5474090576172, 175.80691528320312, 181.06640625, 186.32591247558594, 191.58541870117188, 196.84490966796875, 202.1044158935547, 207.36392211914062, 212.6234130859375, 217.88291931152344, 223.1424102783203, 228.40191650390625, 233.6614227294922, 238.92092895507812, 244.180419921875, 249.43992614746094, 254.69943237304688]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 15.0, 27.0, 39.0, 78.0, 79.0, 94.0, 85.0, 86.0, 84.0, 108.0, 65.0, 64.0, 50.0, 36.0, 24.0, 21.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.94160079956055, -53.329349517822266, -51.71709442138672, -50.10484313964844, -48.49258804321289, -46.88033676147461, -45.26808166503906, -43.65583038330078, -42.0435791015625, -40.43132781982422, -38.81907272338867, -37.20682144165039, -35.594566345214844, -33.98231506347656, -32.37006378173828, -30.757808685302734, -29.14555549621582, -27.533302307128906, -25.921049118041992, -24.308795928955078, -22.696544647216797, -21.084291458129883, -19.47203826904297, -17.859786987304688, -16.24753189086914, -14.635278701782227, -13.023026466369629, -11.410773277282715, -9.798521041870117, -8.186267852783203, -6.574014663696289, -4.961762428283691, -3.3495101928710938, -1.7372573614120483, -0.12500452995300293, 1.487248420715332, 3.099501132965088, 4.711753845214844, 6.324007034301758, 7.9362592697143555, 9.54851245880127, 11.160765647888184, 12.773017883300781, 14.385271072387695, 15.99752426147461, 17.60977554321289, 19.222030639648438, 20.83428192138672, 22.446535110473633, 24.058788299560547, 25.67104148864746, 27.283294677734375, 28.895545959472656, 30.50779914855957, 32.120052337646484, 33.732303619384766, 35.34455871582031, 36.956809997558594, 38.56906509399414, 40.18131637573242, 41.79357147216797, 43.40582275390625, 45.01807403564453, 46.63032913208008, 48.24258041381836]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 12.0, 5.0, 15.0, 18.0, 24.0, 26.0, 44.0, 44.0, 87.0, 100.0, 146.0, 232.0, 365.0, 570.0, 998.0, 1831.0, 3952.0, 10338.0, 35349.0, 142456.0, 449018.0, 297128.0, 73669.0, 19455.0, 6495.0, 2731.0, 1294.0, 751.0, 431.0, 306.0, 212.0, 117.0, 91.0, 54.0, 46.0, 40.0, 25.0, 22.0, 23.0, 8.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.328125, -15.8446044921875, -15.361083984375, -14.8775634765625, -14.39404296875, -13.9105224609375, -13.427001953125, -12.9434814453125, -12.4599609375, -11.9764404296875, -11.492919921875, -11.0093994140625, -10.52587890625, -10.0423583984375, -9.558837890625, -9.0753173828125, -8.591796875, -8.1082763671875, -7.624755859375, -7.1412353515625, -6.65771484375, -6.1741943359375, -5.690673828125, -5.2071533203125, -4.7236328125, -4.2401123046875, -3.756591796875, -3.2730712890625, -2.78955078125, -2.3060302734375, -1.822509765625, -1.3389892578125, -0.85546875, -0.3719482421875, 0.111572265625, 0.5950927734375, 1.07861328125, 1.5621337890625, 2.045654296875, 2.5291748046875, 3.0126953125, 3.4962158203125, 3.979736328125, 4.4632568359375, 4.94677734375, 5.4302978515625, 5.913818359375, 6.3973388671875, 6.880859375, 7.3643798828125, 7.847900390625, 8.3314208984375, 8.81494140625, 9.2984619140625, 9.781982421875, 10.2655029296875, 10.7490234375, 11.2325439453125, 11.716064453125, 12.1995849609375, 12.68310546875, 13.1666259765625, 13.650146484375, 14.1336669921875, 14.6171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 12.0, 16.0, 16.0, 23.0, 26.0, 53.0, 58.0, 77.0, 104.0, 113.0, 102.0, 93.0, 74.0, 63.0, 57.0, 43.0, 22.0, 19.0, 10.0, 6.0, 1.0, 0.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9296875, -4.7889404296875, -4.648193359375, -4.5074462890625, -4.36669921875, -4.2259521484375, -4.085205078125, -3.9444580078125, -3.8037109375, -3.6629638671875, -3.522216796875, -3.3814697265625, -3.24072265625, -3.0999755859375, -2.959228515625, -2.8184814453125, -2.677734375, -2.5369873046875, -2.396240234375, -2.2554931640625, -2.11474609375, -1.9739990234375, -1.833251953125, -1.6925048828125, -1.5517578125, -1.4110107421875, -1.270263671875, -1.1295166015625, -0.98876953125, -0.8480224609375, -0.707275390625, -0.5665283203125, -0.42578125, -0.2850341796875, -0.144287109375, -0.0035400390625, 0.13720703125, 0.2779541015625, 0.418701171875, 0.5594482421875, 0.7001953125, 0.8409423828125, 0.981689453125, 1.1224365234375, 1.26318359375, 1.4039306640625, 1.544677734375, 1.6854248046875, 1.826171875, 1.9669189453125, 2.107666015625, 2.2484130859375, 2.38916015625, 2.5299072265625, 2.670654296875, 2.8114013671875, 2.9521484375, 3.0928955078125, 3.233642578125, 3.3743896484375, 3.51513671875, 3.6558837890625, 3.796630859375, 3.9373779296875, 4.078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 12.0, 11.0, 20.0, 43.0, 44.0, 62.0, 130.0, 235.0, 429.0, 1005.0, 2800.0, 9882.0, 44276.0, 203357.0, 507439.0, 215596.0, 47549.0, 10729.0, 2871.0, 1023.0, 432.0, 246.0, 144.0, 69.0, 37.0, 36.0, 17.0, 15.0, 8.0, 9.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.140625, -10.7041015625, -10.267578125, -9.8310546875, -9.39453125, -8.9580078125, -8.521484375, -8.0849609375, -7.6484375, -7.2119140625, -6.775390625, -6.3388671875, -5.90234375, -5.4658203125, -5.029296875, -4.5927734375, -4.15625, -3.7197265625, -3.283203125, -2.8466796875, -2.41015625, -1.9736328125, -1.537109375, -1.1005859375, -0.6640625, -0.2275390625, 0.208984375, 0.6455078125, 1.08203125, 1.5185546875, 1.955078125, 2.3916015625, 2.828125, 3.2646484375, 3.701171875, 4.1376953125, 4.57421875, 5.0107421875, 5.447265625, 5.8837890625, 6.3203125, 6.7568359375, 7.193359375, 7.6298828125, 8.06640625, 8.5029296875, 8.939453125, 9.3759765625, 9.8125, 10.2490234375, 10.685546875, 11.1220703125, 11.55859375, 11.9951171875, 12.431640625, 12.8681640625, 13.3046875, 13.7412109375, 14.177734375, 14.6142578125, 15.05078125, 15.4873046875, 15.923828125, 16.3603515625, 16.796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 9.0, 5.0, 6.0, 9.0, 9.0, 16.0, 16.0, 11.0, 23.0, 23.0, 25.0, 22.0, 30.0, 34.0, 45.0, 41.0, 41.0, 55.0, 45.0, 43.0, 37.0, 45.0, 40.0, 41.0, 42.0, 44.0, 39.0, 40.0, 26.0, 26.0, 27.0, 18.0, 20.0, 7.0, 9.0, 12.0, 5.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.443603515625, -9.12939453125, -8.815185546875, -8.5009765625, -8.186767578125, -7.87255859375, -7.558349609375, -7.244140625, -6.929931640625, -6.61572265625, -6.301513671875, -5.9873046875, -5.673095703125, -5.35888671875, -5.044677734375, -4.73046875, -4.416259765625, -4.10205078125, -3.787841796875, -3.4736328125, -3.159423828125, -2.84521484375, -2.531005859375, -2.216796875, -1.902587890625, -1.58837890625, -1.274169921875, -0.9599609375, -0.645751953125, -0.33154296875, -0.017333984375, 0.296875, 0.611083984375, 0.92529296875, 1.239501953125, 1.5537109375, 1.867919921875, 2.18212890625, 2.496337890625, 2.810546875, 3.124755859375, 3.43896484375, 3.753173828125, 4.0673828125, 4.381591796875, 4.69580078125, 5.010009765625, 5.32421875, 5.638427734375, 5.95263671875, 6.266845703125, 6.5810546875, 6.895263671875, 7.20947265625, 7.523681640625, 7.837890625, 8.152099609375, 8.46630859375, 8.780517578125, 9.0947265625, 9.408935546875, 9.72314453125, 10.037353515625, 10.3515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 2.0, 4.0, 8.0, 22.0, 48.0, 72.0, 171.0, 377.0, 1068.0, 3311.0, 14149.0, 80415.0, 585067.0, 311690.0, 40511.0, 8211.0, 2162.0, 725.0, 258.0, 137.0, 64.0, 30.0, 14.0, 10.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.453125, -12.13232421875, -11.8115234375, -11.49072265625, -11.169921875, -10.84912109375, -10.5283203125, -10.20751953125, -9.88671875, -9.56591796875, -9.2451171875, -8.92431640625, -8.603515625, -8.28271484375, -7.9619140625, -7.64111328125, -7.3203125, -6.99951171875, -6.6787109375, -6.35791015625, -6.037109375, -5.71630859375, -5.3955078125, -5.07470703125, -4.75390625, -4.43310546875, -4.1123046875, -3.79150390625, -3.470703125, -3.14990234375, -2.8291015625, -2.50830078125, -2.1875, -1.86669921875, -1.5458984375, -1.22509765625, -0.904296875, -0.58349609375, -0.2626953125, 0.05810546875, 0.37890625, 0.69970703125, 1.0205078125, 1.34130859375, 1.662109375, 1.98291015625, 2.3037109375, 2.62451171875, 2.9453125, 3.26611328125, 3.5869140625, 3.90771484375, 4.228515625, 4.54931640625, 4.8701171875, 5.19091796875, 5.51171875, 5.83251953125, 6.1533203125, 6.47412109375, 6.794921875, 7.11572265625, 7.4365234375, 7.75732421875, 8.078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 2.0, 9.0, 5.0, 9.0, 6.0, 14.0, 14.0, 26.0, 34.0, 40.0, 42.0, 109.0, 157.0, 144.0, 112.0, 70.0, 46.0, 34.0, 24.0, 25.0, 9.0, 12.0, 7.0, 8.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015668869018554688, -0.0015235096216201782, -0.0014801323413848877, -0.0014367550611495972, -0.0013933777809143066, -0.0013500005006790161, -0.0013066232204437256, -0.001263245940208435, -0.0012198686599731445, -0.001176491379737854, -0.0011331140995025635, -0.001089736819267273, -0.0010463595390319824, -0.001002982258796692, -0.0009596049785614014, -0.0009162276983261108, -0.0008728504180908203, -0.0008294731378555298, -0.0007860958576202393, -0.0007427185773849487, -0.0006993412971496582, -0.0006559640169143677, -0.0006125867366790771, -0.0005692094564437866, -0.0005258321762084961, -0.00048245489597320557, -0.00043907761573791504, -0.0003957003355026245, -0.000352323055267334, -0.00030894577503204346, -0.00026556849479675293, -0.0002221912145614624, -0.00017881393432617188, -0.00013543665409088135, -9.205937385559082e-05, -4.868209362030029e-05, -5.304813385009766e-06, 3.807246685028076e-05, 8.144974708557129e-05, 0.00012482702732086182, 0.00016820430755615234, 0.00021158158779144287, 0.0002549588680267334, 0.0002983361482620239, 0.00034171342849731445, 0.000385090708732605, 0.0004284679889678955, 0.00047184526920318604, 0.0005152225494384766, 0.0005585998296737671, 0.0006019771099090576, 0.0006453543901443481, 0.0006887316703796387, 0.0007321089506149292, 0.0007754862308502197, 0.0008188635110855103, 0.0008622407913208008, 0.0009056180715560913, 0.0009489953517913818, 0.0009923726320266724, 0.0010357499122619629, 0.0010791271924972534, 0.001122504472732544, 0.0011658817529678345, 0.001209259033203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 15.0, 17.0, 20.0, 33.0, 42.0, 63.0, 122.0, 209.0, 374.0, 758.0, 1497.0, 3504.0, 9351.0, 28071.0, 104424.0, 455035.0, 335412.0, 75278.0, 21540.0, 7265.0, 2959.0, 1235.0, 579.0, 272.0, 179.0, 100.0, 50.0, 47.0, 20.0, 17.0, 10.0, 12.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.5625, -6.33526611328125, -6.1080322265625, -5.88079833984375, -5.653564453125, -5.42633056640625, -5.1990966796875, -4.97186279296875, -4.74462890625, -4.51739501953125, -4.2901611328125, -4.06292724609375, -3.835693359375, -3.60845947265625, -3.3812255859375, -3.15399169921875, -2.9267578125, -2.69952392578125, -2.4722900390625, -2.24505615234375, -2.017822265625, -1.79058837890625, -1.5633544921875, -1.33612060546875, -1.10888671875, -0.88165283203125, -0.6544189453125, -0.42718505859375, -0.199951171875, 0.02728271484375, 0.2545166015625, 0.48175048828125, 0.708984375, 0.93621826171875, 1.1634521484375, 1.39068603515625, 1.617919921875, 1.84515380859375, 2.0723876953125, 2.29962158203125, 2.52685546875, 2.75408935546875, 2.9813232421875, 3.20855712890625, 3.435791015625, 3.66302490234375, 3.8902587890625, 4.11749267578125, 4.3447265625, 4.57196044921875, 4.7991943359375, 5.02642822265625, 5.253662109375, 5.48089599609375, 5.7081298828125, 5.93536376953125, 6.16259765625, 6.38983154296875, 6.6170654296875, 6.84429931640625, 7.071533203125, 7.29876708984375, 7.5260009765625, 7.75323486328125, 7.98046875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 10.0, 13.0, 8.0, 16.0, 23.0, 17.0, 35.0, 31.0, 46.0, 60.0, 71.0, 95.0, 95.0, 95.0, 87.0, 54.0, 47.0, 44.0, 34.0, 27.0, 20.0, 13.0, 13.0, 10.0, 6.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3828125, -6.20013427734375, -6.0174560546875, -5.83477783203125, -5.652099609375, -5.46942138671875, -5.2867431640625, -5.10406494140625, -4.92138671875, -4.73870849609375, -4.5560302734375, -4.37335205078125, -4.190673828125, -4.00799560546875, -3.8253173828125, -3.64263916015625, -3.4599609375, -3.27728271484375, -3.0946044921875, -2.91192626953125, -2.729248046875, -2.54656982421875, -2.3638916015625, -2.18121337890625, -1.99853515625, -1.81585693359375, -1.6331787109375, -1.45050048828125, -1.267822265625, -1.08514404296875, -0.9024658203125, -0.71978759765625, -0.537109375, -0.35443115234375, -0.1717529296875, 0.01092529296875, 0.193603515625, 0.37628173828125, 0.5589599609375, 0.74163818359375, 0.92431640625, 1.10699462890625, 1.2896728515625, 1.47235107421875, 1.655029296875, 1.83770751953125, 2.0203857421875, 2.20306396484375, 2.3857421875, 2.56842041015625, 2.7510986328125, 2.93377685546875, 3.116455078125, 3.29913330078125, 3.4818115234375, 3.66448974609375, 3.84716796875, 4.02984619140625, 4.2125244140625, 4.39520263671875, 4.577880859375, 4.76055908203125, 4.9432373046875, 5.12591552734375, 5.30859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 9.0, 11.0, 27.0, 50.0, 114.0, 149.0, 215.0, 193.0, 121.0, 66.0, 32.0, 13.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.51082229614258, -43.41568374633789, -39.32054901123047, -35.22541046142578, -31.130271911621094, -27.035133361816406, -22.93999671936035, -18.844860076904297, -14.74972152709961, -10.654583930969238, -6.559446334838867, -2.464308738708496, 1.630828857421875, 5.7259674072265625, 9.821104049682617, 13.916240692138672, 18.01137924194336, 22.106517791748047, 26.2016544342041, 30.296791076660156, 34.391929626464844, 38.48706817626953, 42.58220672607422, 46.67734146118164, 50.77248001098633, 54.867618560791016, 58.96275329589844, 63.057891845703125, 67.15303039550781, 71.2481689453125, 75.34330749511719, 79.43844604492188, 83.5335693359375, 87.62870788574219, 91.72384643554688, 95.81898498535156, 99.91412353515625, 104.00926208496094, 108.1043930053711, 112.19953155517578, 116.29467010498047, 120.38980865478516, 124.48494720458984, 128.580078125, 132.6752166748047, 136.77035522460938, 140.86549377441406, 144.96063232421875, 149.05577087402344, 153.15090942382812, 157.2460479736328, 161.3411865234375, 165.4363250732422, 169.53146362304688, 173.62660217285156, 177.72174072265625, 181.81686401367188, 185.91200256347656, 190.00714111328125, 194.10227966308594, 198.19741821289062, 202.2925567626953, 206.3876953125, 210.48281860351562, 214.57797241210938]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 5.0, 15.0, 11.0, 17.0, 16.0, 22.0, 19.0, 26.0, 28.0, 24.0, 42.0, 37.0, 37.0, 48.0, 44.0, 50.0, 45.0, 52.0, 47.0, 36.0, 43.0, 50.0, 34.0, 33.0, 36.0, 22.0, 34.0, 25.0, 17.0, 12.0, 14.0, 10.0, 14.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-60.47914505004883, -58.56175994873047, -56.644371032714844, -54.72698211669922, -52.80959701538086, -50.8922119140625, -48.974822998046875, -47.05743408203125, -45.14004898071289, -43.22266387939453, -41.305274963378906, -39.38788604736328, -37.47050094604492, -35.55311584472656, -33.63572692871094, -31.718339920043945, -29.800952911376953, -27.88356590270996, -25.96617889404297, -24.048791885375977, -22.131404876708984, -20.214017868041992, -18.296630859375, -16.379243850708008, -14.461856842041016, -12.544469833374023, -10.627082824707031, -8.709695816040039, -6.792308807373047, -4.874921798706055, -2.9575347900390625, -1.0401477813720703, 0.8772392272949219, 2.794626235961914, 4.712013244628906, 6.629400253295898, 8.54678726196289, 10.464174270629883, 12.381561279296875, 14.298948287963867, 16.21633529663086, 18.13372230529785, 20.051109313964844, 21.968496322631836, 23.885883331298828, 25.80327033996582, 27.720657348632812, 29.638044357299805, 31.555431365966797, 33.472816467285156, 35.39020538330078, 37.307594299316406, 39.224979400634766, 41.142364501953125, 43.05975341796875, 44.977142333984375, 46.894527435302734, 48.811912536621094, 50.72930145263672, 52.646690368652344, 54.5640754699707, 56.48146057128906, 58.39884948730469, 60.31623840332031, 62.23362350463867]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 8.0, 9.0, 8.0, 13.0, 17.0, 23.0, 38.0, 44.0, 59.0, 88.0, 151.0, 240.0, 486.0, 1195.0, 3148.0, 12557.0, 127580.0, 3990754.0, 46275.0, 7669.0, 2256.0, 792.0, 368.0, 190.0, 100.0, 67.0, 34.0, 27.0, 22.0, 17.0, 12.0, 9.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.84375, -24.8623046875, -23.880859375, -22.8994140625, -21.91796875, -20.9365234375, -19.955078125, -18.9736328125, -17.9921875, -17.0107421875, -16.029296875, -15.0478515625, -14.06640625, -13.0849609375, -12.103515625, -11.1220703125, -10.140625, -9.1591796875, -8.177734375, -7.1962890625, -6.21484375, -5.2333984375, -4.251953125, -3.2705078125, -2.2890625, -1.3076171875, -0.326171875, 0.6552734375, 1.63671875, 2.6181640625, 3.599609375, 4.5810546875, 5.5625, 6.5439453125, 7.525390625, 8.5068359375, 9.48828125, 10.4697265625, 11.451171875, 12.4326171875, 13.4140625, 14.3955078125, 15.376953125, 16.3583984375, 17.33984375, 18.3212890625, 19.302734375, 20.2841796875, 21.265625, 22.2470703125, 23.228515625, 24.2099609375, 25.19140625, 26.1728515625, 27.154296875, 28.1357421875, 29.1171875, 30.0986328125, 31.080078125, 32.0615234375, 33.04296875, 34.0244140625, 35.005859375, 35.9873046875, 36.96875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 10.0, 12.0, 16.0, 25.0, 34.0, 40.0, 56.0, 64.0, 83.0, 69.0, 79.0, 82.0, 73.0, 88.0, 62.0, 51.0, 53.0, 27.0, 19.0, 13.0, 9.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.349609375, -3.224456787109375, -3.09930419921875, -2.974151611328125, -2.8489990234375, -2.723846435546875, -2.59869384765625, -2.473541259765625, -2.348388671875, -2.223236083984375, -2.09808349609375, -1.972930908203125, -1.8477783203125, -1.722625732421875, -1.59747314453125, -1.472320556640625, -1.34716796875, -1.222015380859375, -1.09686279296875, -0.971710205078125, -0.8465576171875, -0.721405029296875, -0.59625244140625, -0.471099853515625, -0.345947265625, -0.220794677734375, -0.09564208984375, 0.029510498046875, 0.1546630859375, 0.279815673828125, 0.40496826171875, 0.530120849609375, 0.6552734375, 0.780426025390625, 0.90557861328125, 1.030731201171875, 1.1558837890625, 1.281036376953125, 1.40618896484375, 1.531341552734375, 1.656494140625, 1.781646728515625, 1.90679931640625, 2.031951904296875, 2.1571044921875, 2.282257080078125, 2.40740966796875, 2.532562255859375, 2.65771484375, 2.782867431640625, 2.90802001953125, 3.033172607421875, 3.1583251953125, 3.283477783203125, 3.40863037109375, 3.533782958984375, 3.658935546875, 3.784088134765625, 3.90924072265625, 4.034393310546875, 4.1595458984375, 4.284698486328125, 4.40985107421875, 4.535003662109375, 4.66015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 14.0, 28.0, 34.0, 58.0, 93.0, 159.0, 297.0, 569.0, 1244.0, 3063.0, 8400.0, 29320.0, 174179.0, 3619857.0, 301014.0, 38700.0, 10596.0, 3605.0, 1483.0, 696.0, 348.0, 191.0, 116.0, 68.0, 48.0, 25.0, 15.0, 14.0, 11.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.515625, -14.008056640625, -13.50048828125, -12.992919921875, -12.4853515625, -11.977783203125, -11.47021484375, -10.962646484375, -10.455078125, -9.947509765625, -9.43994140625, -8.932373046875, -8.4248046875, -7.917236328125, -7.40966796875, -6.902099609375, -6.39453125, -5.886962890625, -5.37939453125, -4.871826171875, -4.3642578125, -3.856689453125, -3.34912109375, -2.841552734375, -2.333984375, -1.826416015625, -1.31884765625, -0.811279296875, -0.3037109375, 0.203857421875, 0.71142578125, 1.218994140625, 1.7265625, 2.234130859375, 2.74169921875, 3.249267578125, 3.7568359375, 4.264404296875, 4.77197265625, 5.279541015625, 5.787109375, 6.294677734375, 6.80224609375, 7.309814453125, 7.8173828125, 8.324951171875, 8.83251953125, 9.340087890625, 9.84765625, 10.355224609375, 10.86279296875, 11.370361328125, 11.8779296875, 12.385498046875, 12.89306640625, 13.400634765625, 13.908203125, 14.415771484375, 14.92333984375, 15.430908203125, 15.9384765625, 16.446044921875, 16.95361328125, 17.461181640625, 17.96875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 9.0, 10.0, 18.0, 19.0, 15.0, 31.0, 45.0, 38.0, 61.0, 111.0, 186.0, 363.0, 883.0, 1237.0, 431.0, 211.0, 128.0, 73.0, 51.0, 36.0, 23.0, 14.0, 10.0, 8.0, 8.0, 10.0, 4.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.345703125, -3.226837158203125, -3.10797119140625, -2.989105224609375, -2.8702392578125, -2.751373291015625, -2.63250732421875, -2.513641357421875, -2.394775390625, -2.275909423828125, -2.15704345703125, -2.038177490234375, -1.9193115234375, -1.800445556640625, -1.68157958984375, -1.562713623046875, -1.44384765625, -1.324981689453125, -1.20611572265625, -1.087249755859375, -0.9683837890625, -0.849517822265625, -0.73065185546875, -0.611785888671875, -0.492919921875, -0.374053955078125, -0.25518798828125, -0.136322021484375, -0.0174560546875, 0.101409912109375, 0.22027587890625, 0.339141845703125, 0.4580078125, 0.576873779296875, 0.69573974609375, 0.814605712890625, 0.9334716796875, 1.052337646484375, 1.17120361328125, 1.290069580078125, 1.408935546875, 1.527801513671875, 1.64666748046875, 1.765533447265625, 1.8843994140625, 2.003265380859375, 2.12213134765625, 2.240997314453125, 2.35986328125, 2.478729248046875, 2.59759521484375, 2.716461181640625, 2.8353271484375, 2.954193115234375, 3.07305908203125, 3.191925048828125, 3.310791015625, 3.429656982421875, 3.54852294921875, 3.667388916015625, 3.7862548828125, 3.905120849609375, 4.02398681640625, 4.142852783203125, 4.26171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 5.0, 12.0, 32.0, 42.0, 80.0, 113.0, 158.0, 151.0, 154.0, 113.0, 56.0, 29.0, 30.0, 13.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.488037109375, -33.311302185058594, -32.13457107543945, -30.957836151123047, -29.78110122680664, -28.604368209838867, -27.427635192871094, -26.250900268554688, -25.074167251586914, -23.89743423461914, -22.720699310302734, -21.54396629333496, -20.367233276367188, -19.19049835205078, -18.013765335083008, -16.837032318115234, -15.660297393798828, -14.483563423156738, -13.306829452514648, -12.130096435546875, -10.953362464904785, -9.776628494262695, -8.599895477294922, -7.423161506652832, -6.246427536010742, -5.069693565368652, -3.8929600715637207, -2.71622633934021, -1.5394926071166992, -0.3627586364746094, 0.8139748573303223, 1.990708351135254, 3.1674423217773438, 4.344176292419434, 5.520909786224365, 6.697643280029297, 7.874377250671387, 9.051111221313477, 10.22784423828125, 11.40457820892334, 12.58131217956543, 13.75804615020752, 14.93478012084961, 16.111513137817383, 17.288246154785156, 18.464981079101562, 19.641714096069336, 20.81844711303711, 21.995182037353516, 23.17191505432129, 24.348649978637695, 25.52538299560547, 26.702117919921875, 27.87885093688965, 29.055583953857422, 30.232318878173828, 31.4090518951416, 32.585784912109375, 33.76251983642578, 34.93925476074219, 36.11598587036133, 37.292720794677734, 38.46945571899414, 39.64618682861328, 40.82292175292969]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 9.0, 7.0, 4.0, 12.0, 12.0, 15.0, 20.0, 17.0, 17.0, 27.0, 25.0, 30.0, 37.0, 37.0, 29.0, 32.0, 39.0, 36.0, 24.0, 48.0, 39.0, 43.0, 50.0, 43.0, 55.0, 39.0, 34.0, 39.0, 20.0, 20.0, 20.0, 24.0, 15.0, 17.0, 8.0, 12.0, 8.0, 7.0, 6.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.179865837097168, -14.753652572631836, -14.327439308166504, -13.901226043701172, -13.475011825561523, -13.048799514770508, -12.62258529663086, -12.196372032165527, -11.770158767700195, -11.343945503234863, -10.917732238769531, -10.4915189743042, -10.065305709838867, -9.639091491699219, -9.212878227233887, -8.786664962768555, -8.360451698303223, -7.934238433837891, -7.508025169372559, -7.081811428070068, -6.655598163604736, -6.229384899139404, -5.803171157836914, -5.376957893371582, -4.95074462890625, -4.524531364440918, -4.098318099975586, -3.6721043586730957, -3.2458910942077637, -2.8196778297424316, -2.3934643268585205, -1.9672508239746094, -1.541036605834961, -1.1148232221603394, -0.6886098384857178, -0.2623964548110962, 0.1638169288635254, 0.5900301933288574, 1.0162436962127686, 1.4424571990966797, 1.8686704635620117, 2.2948837280273438, 2.721097230911255, 3.147310733795166, 3.573523998260498, 3.99973726272583, 4.42595100402832, 4.852164268493652, 5.278377532958984, 5.704590797424316, 6.130804061889648, 6.557017803192139, 6.983231067657471, 7.409444332122803, 7.835658073425293, 8.261871337890625, 8.688084602355957, 9.114297866821289, 9.540511131286621, 9.966724395751953, 10.392938613891602, 10.819150924682617, 11.245365142822266, 11.671578407287598, 12.09779167175293]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 12.0, 12.0, 14.0, 18.0, 17.0, 32.0, 62.0, 100.0, 161.0, 259.0, 569.0, 1288.0, 3066.0, 10585.0, 53753.0, 361881.0, 509613.0, 84609.0, 15371.0, 4138.0, 1484.0, 659.0, 349.0, 167.0, 110.0, 74.0, 48.0, 31.0, 19.0, 13.0, 15.0, 4.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.615478515625, -17.90283203125, -17.190185546875, -16.4775390625, -15.764892578125, -15.05224609375, -14.339599609375, -13.626953125, -12.914306640625, -12.20166015625, -11.489013671875, -10.7763671875, -10.063720703125, -9.35107421875, -8.638427734375, -7.92578125, -7.213134765625, -6.50048828125, -5.787841796875, -5.0751953125, -4.362548828125, -3.64990234375, -2.937255859375, -2.224609375, -1.511962890625, -0.79931640625, -0.086669921875, 0.6259765625, 1.338623046875, 2.05126953125, 2.763916015625, 3.4765625, 4.189208984375, 4.90185546875, 5.614501953125, 6.3271484375, 7.039794921875, 7.75244140625, 8.465087890625, 9.177734375, 9.890380859375, 10.60302734375, 11.315673828125, 12.0283203125, 12.740966796875, 13.45361328125, 14.166259765625, 14.87890625, 15.591552734375, 16.30419921875, 17.016845703125, 17.7294921875, 18.442138671875, 19.15478515625, 19.867431640625, 20.580078125, 21.292724609375, 22.00537109375, 22.718017578125, 23.4306640625, 24.143310546875, 24.85595703125, 25.568603515625, 26.28125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 6.0, 5.0, 14.0, 21.0, 23.0, 33.0, 46.0, 59.0, 71.0, 83.0, 114.0, 86.0, 97.0, 90.0, 76.0, 53.0, 48.0, 22.0, 15.0, 13.0, 7.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.61041259765625, -4.4669189453125, -4.32342529296875, -4.179931640625, -4.03643798828125, -3.8929443359375, -3.74945068359375, -3.60595703125, -3.46246337890625, -3.3189697265625, -3.17547607421875, -3.031982421875, -2.88848876953125, -2.7449951171875, -2.60150146484375, -2.4580078125, -2.31451416015625, -2.1710205078125, -2.02752685546875, -1.884033203125, -1.74053955078125, -1.5970458984375, -1.45355224609375, -1.31005859375, -1.16656494140625, -1.0230712890625, -0.87957763671875, -0.736083984375, -0.59259033203125, -0.4490966796875, -0.30560302734375, -0.162109375, -0.01861572265625, 0.1248779296875, 0.26837158203125, 0.411865234375, 0.55535888671875, 0.6988525390625, 0.84234619140625, 0.98583984375, 1.12933349609375, 1.2728271484375, 1.41632080078125, 1.559814453125, 1.70330810546875, 1.8468017578125, 1.99029541015625, 2.1337890625, 2.27728271484375, 2.4207763671875, 2.56427001953125, 2.707763671875, 2.85125732421875, 2.9947509765625, 3.13824462890625, 3.28173828125, 3.42523193359375, 3.5687255859375, 3.71221923828125, 3.855712890625, 3.99920654296875, 4.1427001953125, 4.28619384765625, 4.4296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 12.0, 17.0, 23.0, 39.0, 42.0, 45.0, 57.0, 96.0, 159.0, 218.0, 341.0, 577.0, 1151.0, 2538.0, 7040.0, 24858.0, 96218.0, 330007.0, 399907.0, 134704.0, 34396.0, 9565.0, 3288.0, 1375.0, 692.0, 388.0, 243.0, 158.0, 101.0, 78.0, 53.0, 37.0, 33.0, 28.0, 17.0, 10.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.2666015625, -10.892578125, -10.5185546875, -10.14453125, -9.7705078125, -9.396484375, -9.0224609375, -8.6484375, -8.2744140625, -7.900390625, -7.5263671875, -7.15234375, -6.7783203125, -6.404296875, -6.0302734375, -5.65625, -5.2822265625, -4.908203125, -4.5341796875, -4.16015625, -3.7861328125, -3.412109375, -3.0380859375, -2.6640625, -2.2900390625, -1.916015625, -1.5419921875, -1.16796875, -0.7939453125, -0.419921875, -0.0458984375, 0.328125, 0.7021484375, 1.076171875, 1.4501953125, 1.82421875, 2.1982421875, 2.572265625, 2.9462890625, 3.3203125, 3.6943359375, 4.068359375, 4.4423828125, 4.81640625, 5.1904296875, 5.564453125, 5.9384765625, 6.3125, 6.6865234375, 7.060546875, 7.4345703125, 7.80859375, 8.1826171875, 8.556640625, 8.9306640625, 9.3046875, 9.6787109375, 10.052734375, 10.4267578125, 10.80078125, 11.1748046875, 11.548828125, 11.9228515625, 12.296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 10.0, 17.0, 9.0, 22.0, 26.0, 32.0, 28.0, 26.0, 32.0, 38.0, 33.0, 34.0, 44.0, 37.0, 50.0, 39.0, 44.0, 47.0, 46.0, 39.0, 39.0, 33.0, 31.0, 29.0, 26.0, 20.0, 21.0, 23.0, 19.0, 21.0, 13.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.25, -9.9447021484375, -9.639404296875, -9.3341064453125, -9.02880859375, -8.7235107421875, -8.418212890625, -8.1129150390625, -7.8076171875, -7.5023193359375, -7.197021484375, -6.8917236328125, -6.58642578125, -6.2811279296875, -5.975830078125, -5.6705322265625, -5.365234375, -5.0599365234375, -4.754638671875, -4.4493408203125, -4.14404296875, -3.8387451171875, -3.533447265625, -3.2281494140625, -2.9228515625, -2.6175537109375, -2.312255859375, -2.0069580078125, -1.70166015625, -1.3963623046875, -1.091064453125, -0.7857666015625, -0.48046875, -0.1751708984375, 0.130126953125, 0.4354248046875, 0.74072265625, 1.0460205078125, 1.351318359375, 1.6566162109375, 1.9619140625, 2.2672119140625, 2.572509765625, 2.8778076171875, 3.18310546875, 3.4884033203125, 3.793701171875, 4.0989990234375, 4.404296875, 4.7095947265625, 5.014892578125, 5.3201904296875, 5.62548828125, 5.9307861328125, 6.236083984375, 6.5413818359375, 6.8466796875, 7.1519775390625, 7.457275390625, 7.7625732421875, 8.06787109375, 8.3731689453125, 8.678466796875, 8.9837646484375, 9.2890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 5.0, 12.0, 17.0, 21.0, 40.0, 62.0, 86.0, 134.0, 255.0, 478.0, 841.0, 1546.0, 3385.0, 7363.0, 17405.0, 46455.0, 153734.0, 445150.0, 256217.0, 71102.0, 24857.0, 10302.0, 4512.0, 2121.0, 1036.0, 576.0, 308.0, 209.0, 108.0, 73.0, 46.0, 26.0, 12.0, 11.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.63446044921875, -5.4447021484375, -5.25494384765625, -5.065185546875, -4.87542724609375, -4.6856689453125, -4.49591064453125, -4.30615234375, -4.11639404296875, -3.9266357421875, -3.73687744140625, -3.547119140625, -3.35736083984375, -3.1676025390625, -2.97784423828125, -2.7880859375, -2.59832763671875, -2.4085693359375, -2.21881103515625, -2.029052734375, -1.83929443359375, -1.6495361328125, -1.45977783203125, -1.27001953125, -1.08026123046875, -0.8905029296875, -0.70074462890625, -0.510986328125, -0.32122802734375, -0.1314697265625, 0.05828857421875, 0.248046875, 0.43780517578125, 0.6275634765625, 0.81732177734375, 1.007080078125, 1.19683837890625, 1.3865966796875, 1.57635498046875, 1.76611328125, 1.95587158203125, 2.1456298828125, 2.33538818359375, 2.525146484375, 2.71490478515625, 2.9046630859375, 3.09442138671875, 3.2841796875, 3.47393798828125, 3.6636962890625, 3.85345458984375, 4.043212890625, 4.23297119140625, 4.4227294921875, 4.61248779296875, 4.80224609375, 4.99200439453125, 5.1817626953125, 5.37152099609375, 5.561279296875, 5.75103759765625, 5.9407958984375, 6.13055419921875, 6.3203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 7.0, 15.0, 14.0, 15.0, 27.0, 43.0, 29.0, 52.0, 71.0, 101.0, 146.0, 121.0, 93.0, 83.0, 50.0, 29.0, 14.0, 24.0, 15.0, 7.0, 5.0, 5.0, 5.0, 4.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011701583862304688, -0.0011246204376220703, -0.0010790824890136719, -0.0010335445404052734, -0.000988006591796875, -0.0009424686431884766, -0.0008969306945800781, -0.0008513927459716797, -0.0008058547973632812, -0.0007603168487548828, -0.0007147789001464844, -0.0006692409515380859, -0.0006237030029296875, -0.0005781650543212891, -0.0005326271057128906, -0.0004870891571044922, -0.00044155120849609375, -0.0003960132598876953, -0.0003504753112792969, -0.00030493736267089844, -0.0002593994140625, -0.00021386146545410156, -0.00016832351684570312, -0.0001227855682373047, -7.724761962890625e-05, -3.170967102050781e-05, 1.3828277587890625e-05, 5.936622619628906e-05, 0.0001049041748046875, 0.00015044212341308594, 0.00019598007202148438, 0.0002415180206298828, 0.00028705596923828125, 0.0003325939178466797, 0.0003781318664550781, 0.00042366981506347656, 0.000469207763671875, 0.0005147457122802734, 0.0005602836608886719, 0.0006058216094970703, 0.0006513595581054688, 0.0006968975067138672, 0.0007424354553222656, 0.0007879734039306641, 0.0008335113525390625, 0.0008790493011474609, 0.0009245872497558594, 0.0009701251983642578, 0.0010156631469726562, 0.0010612010955810547, 0.0011067390441894531, 0.0011522769927978516, 0.00119781494140625, 0.0012433528900146484, 0.0012888908386230469, 0.0013344287872314453, 0.0013799667358398438, 0.0014255046844482422, 0.0014710426330566406, 0.001516580581665039, 0.0015621185302734375, 0.001607656478881836, 0.0016531944274902344, 0.0016987323760986328, 0.0017442703247070312]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 9.0, 14.0, 19.0, 13.0, 25.0, 44.0, 83.0, 132.0, 239.0, 440.0, 914.0, 1975.0, 5627.0, 19134.0, 87900.0, 586963.0, 283151.0, 44286.0, 11114.0, 3634.0, 1410.0, 645.0, 335.0, 190.0, 70.0, 71.0, 33.0, 22.0, 11.0, 14.0, 5.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.506103515625, -8.17626953125, -7.846435546875, -7.5166015625, -7.186767578125, -6.85693359375, -6.527099609375, -6.197265625, -5.867431640625, -5.53759765625, -5.207763671875, -4.8779296875, -4.548095703125, -4.21826171875, -3.888427734375, -3.55859375, -3.228759765625, -2.89892578125, -2.569091796875, -2.2392578125, -1.909423828125, -1.57958984375, -1.249755859375, -0.919921875, -0.590087890625, -0.26025390625, 0.069580078125, 0.3994140625, 0.729248046875, 1.05908203125, 1.388916015625, 1.71875, 2.048583984375, 2.37841796875, 2.708251953125, 3.0380859375, 3.367919921875, 3.69775390625, 4.027587890625, 4.357421875, 4.687255859375, 5.01708984375, 5.346923828125, 5.6767578125, 6.006591796875, 6.33642578125, 6.666259765625, 6.99609375, 7.325927734375, 7.65576171875, 7.985595703125, 8.3154296875, 8.645263671875, 8.97509765625, 9.304931640625, 9.634765625, 9.964599609375, 10.29443359375, 10.624267578125, 10.9541015625, 11.283935546875, 11.61376953125, 11.943603515625, 12.2734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 4.0, 7.0, 17.0, 19.0, 29.0, 34.0, 36.0, 66.0, 104.0, 125.0, 135.0, 116.0, 87.0, 52.0, 49.0, 28.0, 20.0, 13.0, 11.0, 9.0, 7.0, 3.0, 8.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.65411376953125, -8.3941650390625, -8.13421630859375, -7.874267578125, -7.61431884765625, -7.3543701171875, -7.09442138671875, -6.83447265625, -6.57452392578125, -6.3145751953125, -6.05462646484375, -5.794677734375, -5.53472900390625, -5.2747802734375, -5.01483154296875, -4.7548828125, -4.49493408203125, -4.2349853515625, -3.97503662109375, -3.715087890625, -3.45513916015625, -3.1951904296875, -2.93524169921875, -2.67529296875, -2.41534423828125, -2.1553955078125, -1.89544677734375, -1.635498046875, -1.37554931640625, -1.1156005859375, -0.85565185546875, -0.595703125, -0.33575439453125, -0.0758056640625, 0.18414306640625, 0.444091796875, 0.70404052734375, 0.9639892578125, 1.22393798828125, 1.48388671875, 1.74383544921875, 2.0037841796875, 2.26373291015625, 2.523681640625, 2.78363037109375, 3.0435791015625, 3.30352783203125, 3.5634765625, 3.82342529296875, 4.0833740234375, 4.34332275390625, 4.603271484375, 4.86322021484375, 5.1231689453125, 5.38311767578125, 5.64306640625, 5.90301513671875, 6.1629638671875, 6.42291259765625, 6.682861328125, 6.94281005859375, 7.2027587890625, 7.46270751953125, 7.72265625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 18.0, 84.0, 162.0, 277.0, 253.0, 125.0, 49.0, 22.0, 9.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.2959976196289, -99.06365203857422, -92.83130645751953, -86.59896850585938, -80.36662292480469, -74.13427734375, -67.90193176269531, -61.669586181640625, -55.43724060058594, -49.20489501953125, -42.97254943847656, -36.74020767211914, -30.507862091064453, -24.275516510009766, -18.043174743652344, -11.810829162597656, -5.578483581542969, 0.6538610458374023, 6.886205673217773, 13.118549346923828, 19.350894927978516, 25.583240509033203, 31.815582275390625, 38.04792785644531, 44.2802734375, 50.51261901855469, 56.744964599609375, 62.9773063659668, 69.20965576171875, 75.44200134277344, 81.6743392944336, 87.90668487548828, 94.1390380859375, 100.37138366699219, 106.60372924804688, 112.83607482910156, 119.06842041015625, 125.30076599121094, 131.53311157226562, 137.76544189453125, 143.997802734375, 150.2301483154297, 156.46249389648438, 162.69483947753906, 168.92718505859375, 175.15953063964844, 181.39187622070312, 187.62420654296875, 193.85655212402344, 200.08889770507812, 206.3212432861328, 212.5535888671875, 218.7859344482422, 225.01828002929688, 231.2506103515625, 237.48297119140625, 243.71530151367188, 249.94764709472656, 256.17999267578125, 262.4123229980469, 268.6446838378906, 274.87701416015625, 281.109375, 287.3417053222656, 293.5740661621094]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 7.0, 4.0, 8.0, 7.0, 10.0, 12.0, 15.0, 14.0, 20.0, 24.0, 27.0, 28.0, 35.0, 37.0, 45.0, 30.0, 44.0, 48.0, 56.0, 41.0, 56.0, 54.0, 43.0, 43.0, 41.0, 27.0, 35.0, 35.0, 21.0, 22.0, 22.0, 17.0, 18.0, 5.0, 10.0, 5.0, 11.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.64113235473633, -59.731319427490234, -57.82150650024414, -55.91168975830078, -54.00187683105469, -52.092063903808594, -50.1822509765625, -48.272438049316406, -46.36262512207031, -44.45281219482422, -42.542999267578125, -40.63318634033203, -38.72336959838867, -36.81355667114258, -34.903743743896484, -32.99393081665039, -31.08411407470703, -29.174301147460938, -27.26448631286621, -25.354673385620117, -23.44485855102539, -21.535045623779297, -19.625232696533203, -17.71541976928711, -15.805604934692383, -13.895791053771973, -11.985977172851562, -10.076164245605469, -8.166350364685059, -6.256536483764648, -4.346723556518555, -2.4369096755981445, -0.527099609375, 1.382714033126831, 3.292527675628662, 5.202341079711914, 7.112154960632324, 9.021968841552734, 10.931781768798828, 12.841595649719238, 14.751409530639648, 16.661222457885742, 18.57103729248047, 20.480850219726562, 22.390663146972656, 24.300477981567383, 26.210290908813477, 28.120105743408203, 30.029918670654297, 31.93973159790039, 33.849544525146484, 35.759361267089844, 37.66917419433594, 39.57898712158203, 41.488800048828125, 43.39861297607422, 45.30842590332031, 47.218238830566406, 49.1280517578125, 51.037864685058594, 52.94768142700195, 54.85749435424805, 56.76730728149414, 58.677120208740234, 60.586936950683594]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 4.0, 8.0, 6.0, 11.0, 14.0, 14.0, 30.0, 40.0, 57.0, 62.0, 100.0, 185.0, 291.0, 731.0, 1951.0, 9190.0, 144859.0, 4001618.0, 29260.0, 4092.0, 1015.0, 370.0, 161.0, 73.0, 49.0, 23.0, 28.0, 7.0, 9.0, 6.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.3125, -51.80078125, -50.2890625, -48.77734375, -47.265625, -45.75390625, -44.2421875, -42.73046875, -41.21875, -39.70703125, -38.1953125, -36.68359375, -35.171875, -33.66015625, -32.1484375, -30.63671875, -29.125, -27.61328125, -26.1015625, -24.58984375, -23.078125, -21.56640625, -20.0546875, -18.54296875, -17.03125, -15.51953125, -14.0078125, -12.49609375, -10.984375, -9.47265625, -7.9609375, -6.44921875, -4.9375, -3.42578125, -1.9140625, -0.40234375, 1.109375, 2.62109375, 4.1328125, 5.64453125, 7.15625, 8.66796875, 10.1796875, 11.69140625, 13.203125, 14.71484375, 16.2265625, 17.73828125, 19.25, 20.76171875, 22.2734375, 23.78515625, 25.296875, 26.80859375, 28.3203125, 29.83203125, 31.34375, 32.85546875, 34.3671875, 35.87890625, 37.390625, 38.90234375, 40.4140625, 41.92578125, 43.4375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 11.0, 17.0, 16.0, 18.0, 33.0, 43.0, 67.0, 81.0, 70.0, 100.0, 100.0, 104.0, 85.0, 85.0, 52.0, 27.0, 32.0, 21.0, 17.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.45709228515625, -4.3048095703125, -4.15252685546875, -4.000244140625, -3.84796142578125, -3.6956787109375, -3.54339599609375, -3.39111328125, -3.23883056640625, -3.0865478515625, -2.93426513671875, -2.781982421875, -2.62969970703125, -2.4774169921875, -2.32513427734375, -2.1728515625, -2.02056884765625, -1.8682861328125, -1.71600341796875, -1.563720703125, -1.41143798828125, -1.2591552734375, -1.10687255859375, -0.95458984375, -0.80230712890625, -0.6500244140625, -0.49774169921875, -0.345458984375, -0.19317626953125, -0.0408935546875, 0.11138916015625, 0.263671875, 0.41595458984375, 0.5682373046875, 0.72052001953125, 0.872802734375, 1.02508544921875, 1.1773681640625, 1.32965087890625, 1.48193359375, 1.63421630859375, 1.7864990234375, 1.93878173828125, 2.091064453125, 2.24334716796875, 2.3956298828125, 2.54791259765625, 2.7001953125, 2.85247802734375, 3.0047607421875, 3.15704345703125, 3.309326171875, 3.46160888671875, 3.6138916015625, 3.76617431640625, 3.91845703125, 4.07073974609375, 4.2230224609375, 4.37530517578125, 4.527587890625, 4.67987060546875, 4.8321533203125, 4.98443603515625, 5.13671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 7.0, 10.0, 11.0, 17.0, 33.0, 56.0, 102.0, 171.0, 307.0, 687.0, 1341.0, 3230.0, 8703.0, 29657.0, 185380.0, 3655641.0, 258028.0, 34653.0, 9886.0, 3508.0, 1490.0, 636.0, 299.0, 173.0, 113.0, 52.0, 22.0, 26.0, 13.0, 10.0, 4.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.22265625, -19.6015625, -18.98046875, -18.359375, -17.73828125, -17.1171875, -16.49609375, -15.875, -15.25390625, -14.6328125, -14.01171875, -13.390625, -12.76953125, -12.1484375, -11.52734375, -10.90625, -10.28515625, -9.6640625, -9.04296875, -8.421875, -7.80078125, -7.1796875, -6.55859375, -5.9375, -5.31640625, -4.6953125, -4.07421875, -3.453125, -2.83203125, -2.2109375, -1.58984375, -0.96875, -0.34765625, 0.2734375, 0.89453125, 1.515625, 2.13671875, 2.7578125, 3.37890625, 4.0, 4.62109375, 5.2421875, 5.86328125, 6.484375, 7.10546875, 7.7265625, 8.34765625, 8.96875, 9.58984375, 10.2109375, 10.83203125, 11.453125, 12.07421875, 12.6953125, 13.31640625, 13.9375, 14.55859375, 15.1796875, 15.80078125, 16.421875, 17.04296875, 17.6640625, 18.28515625, 18.90625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 8.0, 6.0, 19.0, 11.0, 16.0, 23.0, 26.0, 29.0, 48.0, 71.0, 112.0, 165.0, 325.0, 770.0, 1258.0, 520.0, 249.0, 127.0, 63.0, 46.0, 29.0, 25.0, 28.0, 15.0, 13.0, 9.0, 8.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.875, -5.70843505859375, -5.5418701171875, -5.37530517578125, -5.208740234375, -5.04217529296875, -4.8756103515625, -4.70904541015625, -4.54248046875, -4.37591552734375, -4.2093505859375, -4.04278564453125, -3.876220703125, -3.70965576171875, -3.5430908203125, -3.37652587890625, -3.2099609375, -3.04339599609375, -2.8768310546875, -2.71026611328125, -2.543701171875, -2.37713623046875, -2.2105712890625, -2.04400634765625, -1.87744140625, -1.71087646484375, -1.5443115234375, -1.37774658203125, -1.211181640625, -1.04461669921875, -0.8780517578125, -0.71148681640625, -0.544921875, -0.37835693359375, -0.2117919921875, -0.04522705078125, 0.121337890625, 0.28790283203125, 0.4544677734375, 0.62103271484375, 0.78759765625, 0.95416259765625, 1.1207275390625, 1.28729248046875, 1.453857421875, 1.62042236328125, 1.7869873046875, 1.95355224609375, 2.1201171875, 2.28668212890625, 2.4532470703125, 2.61981201171875, 2.786376953125, 2.95294189453125, 3.1195068359375, 3.28607177734375, 3.45263671875, 3.61920166015625, 3.7857666015625, 3.95233154296875, 4.118896484375, 4.28546142578125, 4.4520263671875, 4.61859130859375, 4.78515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 12.0, 57.0, 198.0, 342.0, 249.0, 96.0, 29.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-195.0822296142578, -191.45753479003906, -187.83285522460938, -184.20816040039062, -180.58346557617188, -176.95877075195312, -173.33407592773438, -169.7093963623047, -166.08470153808594, -162.4600067138672, -158.8353271484375, -155.21063232421875, -151.5859375, -147.96124267578125, -144.3365478515625, -140.7118682861328, -137.08717346191406, -133.4624786376953, -129.83779907226562, -126.21310424804688, -122.58840942382812, -118.96371459960938, -115.33902740478516, -111.71434020996094, -108.08964538574219, -104.46495056152344, -100.84026336669922, -97.215576171875, -93.59088134765625, -89.9661865234375, -86.34149932861328, -82.71681213378906, -79.09212493896484, -75.46743774414062, -71.84274291992188, -68.21804809570312, -64.5933609008789, -60.96866989135742, -57.34397888183594, -53.71928787231445, -50.09459686279297, -46.469905853271484, -42.84521484375, -39.220523834228516, -35.59583282470703, -31.971141815185547, -28.346450805664062, -24.721759796142578, -21.097068786621094, -17.47237777709961, -13.847686767578125, -10.22299575805664, -6.598304748535156, -2.973613739013672, 0.6510772705078125, 4.275768280029297, 7.900459289550781, 11.525150299072266, 15.14984130859375, 18.774532318115234, 22.39922332763672, 26.023914337158203, 29.648605346679688, 33.27329635620117, 36.897987365722656]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 2.0, 9.0, 10.0, 10.0, 12.0, 14.0, 34.0, 31.0, 22.0, 43.0, 43.0, 34.0, 45.0, 53.0, 42.0, 51.0, 42.0, 53.0, 51.0, 44.0, 58.0, 33.0, 52.0, 28.0, 23.0, 29.0, 21.0, 22.0, 27.0, 13.0, 12.0, 10.0, 8.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.670917510986328, -20.9078311920166, -20.144746780395508, -19.38166046142578, -18.618576049804688, -17.85548973083496, -17.092403411865234, -16.32931900024414, -15.566232681274414, -14.803147315979004, -14.040061950683594, -13.276975631713867, -12.513890266418457, -11.750804901123047, -10.98771858215332, -10.22463321685791, -9.4615478515625, -8.69846248626709, -7.9353766441345215, -7.172290802001953, -6.409205436706543, -5.646120071411133, -4.8830342292785645, -4.119948387145996, -3.356863021850586, -2.5937774181365967, -1.8306918144226074, -1.0676062107086182, -0.3045206069946289, 0.45856499671936035, 1.2216506004333496, 1.984736442565918, 2.747821807861328, 3.5109074115753174, 4.273993015289307, 5.037078857421875, 5.800164222717285, 6.563249588012695, 7.326335430145264, 8.089421272277832, 8.852506637573242, 9.615592002868652, 10.378677368164062, 11.141763687133789, 11.9048490524292, 12.66793441772461, 13.431020736694336, 14.194106101989746, 14.957191467285156, 15.720276832580566, 16.483362197875977, 17.246448516845703, 18.009532928466797, 18.772619247436523, 19.53570556640625, 20.298789978027344, 21.06187629699707, 21.824962615966797, 22.58804702758789, 23.351133346557617, 24.114219665527344, 24.877304077148438, 25.640390396118164, 26.40347671508789, 27.166561126708984]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 13.0, 19.0, 22.0, 34.0, 32.0, 53.0, 91.0, 142.0, 233.0, 481.0, 951.0, 2289.0, 6852.0, 26121.0, 140616.0, 640266.0, 185362.0, 31831.0, 8235.0, 2766.0, 985.0, 468.0, 248.0, 151.0, 92.0, 66.0, 34.0, 24.0, 26.0, 20.0, 6.0, 3.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.351318359375, -18.71826171875, -18.085205078125, -17.4521484375, -16.819091796875, -16.18603515625, -15.552978515625, -14.919921875, -14.286865234375, -13.65380859375, -13.020751953125, -12.3876953125, -11.754638671875, -11.12158203125, -10.488525390625, -9.85546875, -9.222412109375, -8.58935546875, -7.956298828125, -7.3232421875, -6.690185546875, -6.05712890625, -5.424072265625, -4.791015625, -4.157958984375, -3.52490234375, -2.891845703125, -2.2587890625, -1.625732421875, -0.99267578125, -0.359619140625, 0.2734375, 0.906494140625, 1.53955078125, 2.172607421875, 2.8056640625, 3.438720703125, 4.07177734375, 4.704833984375, 5.337890625, 5.970947265625, 6.60400390625, 7.237060546875, 7.8701171875, 8.503173828125, 9.13623046875, 9.769287109375, 10.40234375, 11.035400390625, 11.66845703125, 12.301513671875, 12.9345703125, 13.567626953125, 14.20068359375, 14.833740234375, 15.466796875, 16.099853515625, 16.73291015625, 17.365966796875, 17.9990234375, 18.632080078125, 19.26513671875, 19.898193359375, 20.53125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 10.0, 11.0, 14.0, 25.0, 28.0, 46.0, 53.0, 80.0, 101.0, 111.0, 102.0, 99.0, 91.0, 82.0, 49.0, 33.0, 22.0, 23.0, 8.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4609375, -5.29595947265625, -5.1309814453125, -4.96600341796875, -4.801025390625, -4.63604736328125, -4.4710693359375, -4.30609130859375, -4.14111328125, -3.97613525390625, -3.8111572265625, -3.64617919921875, -3.481201171875, -3.31622314453125, -3.1512451171875, -2.98626708984375, -2.8212890625, -2.65631103515625, -2.4913330078125, -2.32635498046875, -2.161376953125, -1.99639892578125, -1.8314208984375, -1.66644287109375, -1.50146484375, -1.33648681640625, -1.1715087890625, -1.00653076171875, -0.841552734375, -0.67657470703125, -0.5115966796875, -0.34661865234375, -0.181640625, -0.01666259765625, 0.1483154296875, 0.31329345703125, 0.478271484375, 0.64324951171875, 0.8082275390625, 0.97320556640625, 1.13818359375, 1.30316162109375, 1.4681396484375, 1.63311767578125, 1.798095703125, 1.96307373046875, 2.1280517578125, 2.29302978515625, 2.4580078125, 2.62298583984375, 2.7879638671875, 2.95294189453125, 3.117919921875, 3.28289794921875, 3.4478759765625, 3.61285400390625, 3.77783203125, 3.94281005859375, 4.1077880859375, 4.27276611328125, 4.437744140625, 4.60272216796875, 4.7677001953125, 4.93267822265625, 5.09765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 18.0, 17.0, 30.0, 41.0, 60.0, 97.0, 205.0, 433.0, 1013.0, 3495.0, 17659.0, 143821.0, 703502.0, 153752.0, 18777.0, 3680.0, 1040.0, 438.0, 195.0, 105.0, 54.0, 33.0, 26.0, 13.0, 11.0, 11.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.921875, -16.28369140625, -15.6455078125, -15.00732421875, -14.369140625, -13.73095703125, -13.0927734375, -12.45458984375, -11.81640625, -11.17822265625, -10.5400390625, -9.90185546875, -9.263671875, -8.62548828125, -7.9873046875, -7.34912109375, -6.7109375, -6.07275390625, -5.4345703125, -4.79638671875, -4.158203125, -3.52001953125, -2.8818359375, -2.24365234375, -1.60546875, -0.96728515625, -0.3291015625, 0.30908203125, 0.947265625, 1.58544921875, 2.2236328125, 2.86181640625, 3.5, 4.13818359375, 4.7763671875, 5.41455078125, 6.052734375, 6.69091796875, 7.3291015625, 7.96728515625, 8.60546875, 9.24365234375, 9.8818359375, 10.52001953125, 11.158203125, 11.79638671875, 12.4345703125, 13.07275390625, 13.7109375, 14.34912109375, 14.9873046875, 15.62548828125, 16.263671875, 16.90185546875, 17.5400390625, 18.17822265625, 18.81640625, 19.45458984375, 20.0927734375, 20.73095703125, 21.369140625, 22.00732421875, 22.6455078125, 23.28369140625, 23.921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 4.0, 4.0, 7.0, 12.0, 14.0, 13.0, 9.0, 8.0, 18.0, 28.0, 22.0, 37.0, 41.0, 29.0, 55.0, 54.0, 41.0, 55.0, 49.0, 47.0, 41.0, 47.0, 45.0, 55.0, 58.0, 34.0, 36.0, 20.0, 17.0, 20.0, 13.0, 15.0, 14.0, 11.0, 5.0, 10.0, 4.0, 1.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.215576171875, -10.84521484375, -10.474853515625, -10.1044921875, -9.734130859375, -9.36376953125, -8.993408203125, -8.623046875, -8.252685546875, -7.88232421875, -7.511962890625, -7.1416015625, -6.771240234375, -6.40087890625, -6.030517578125, -5.66015625, -5.289794921875, -4.91943359375, -4.549072265625, -4.1787109375, -3.808349609375, -3.43798828125, -3.067626953125, -2.697265625, -2.326904296875, -1.95654296875, -1.586181640625, -1.2158203125, -0.845458984375, -0.47509765625, -0.104736328125, 0.265625, 0.635986328125, 1.00634765625, 1.376708984375, 1.7470703125, 2.117431640625, 2.48779296875, 2.858154296875, 3.228515625, 3.598876953125, 3.96923828125, 4.339599609375, 4.7099609375, 5.080322265625, 5.45068359375, 5.821044921875, 6.19140625, 6.561767578125, 6.93212890625, 7.302490234375, 7.6728515625, 8.043212890625, 8.41357421875, 8.783935546875, 9.154296875, 9.524658203125, 9.89501953125, 10.265380859375, 10.6357421875, 11.006103515625, 11.37646484375, 11.746826171875, 12.1171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 13.0, 30.0, 47.0, 105.0, 225.0, 482.0, 1397.0, 4684.0, 20669.0, 159413.0, 761525.0, 81609.0, 13318.0, 3340.0, 1016.0, 360.0, 155.0, 74.0, 46.0, 19.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.348388671875, -13.00927734375, -12.670166015625, -12.3310546875, -11.991943359375, -11.65283203125, -11.313720703125, -10.974609375, -10.635498046875, -10.29638671875, -9.957275390625, -9.6181640625, -9.279052734375, -8.93994140625, -8.600830078125, -8.26171875, -7.922607421875, -7.58349609375, -7.244384765625, -6.9052734375, -6.566162109375, -6.22705078125, -5.887939453125, -5.548828125, -5.209716796875, -4.87060546875, -4.531494140625, -4.1923828125, -3.853271484375, -3.51416015625, -3.175048828125, -2.8359375, -2.496826171875, -2.15771484375, -1.818603515625, -1.4794921875, -1.140380859375, -0.80126953125, -0.462158203125, -0.123046875, 0.216064453125, 0.55517578125, 0.894287109375, 1.2333984375, 1.572509765625, 1.91162109375, 2.250732421875, 2.58984375, 2.928955078125, 3.26806640625, 3.607177734375, 3.9462890625, 4.285400390625, 4.62451171875, 4.963623046875, 5.302734375, 5.641845703125, 5.98095703125, 6.320068359375, 6.6591796875, 6.998291015625, 7.33740234375, 7.676513671875, 8.015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 3.0, 7.0, 9.0, 12.0, 8.0, 17.0, 33.0, 50.0, 92.0, 207.0, 243.0, 125.0, 65.0, 35.0, 18.0, 14.0, 15.0, 8.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00214385986328125, -0.002083003520965576, -0.0020221471786499023, -0.0019612908363342285, -0.0019004344940185547, -0.0018395781517028809, -0.001778721809387207, -0.0017178654670715332, -0.0016570091247558594, -0.0015961527824401855, -0.0015352964401245117, -0.0014744400978088379, -0.001413583755493164, -0.0013527274131774902, -0.0012918710708618164, -0.0012310147285461426, -0.0011701583862304688, -0.001109302043914795, -0.001048445701599121, -0.0009875893592834473, -0.0009267330169677734, -0.0008658766746520996, -0.0008050203323364258, -0.000744163990020752, -0.0006833076477050781, -0.0006224513053894043, -0.0005615949630737305, -0.0005007386207580566, -0.0004398822784423828, -0.000379025936126709, -0.00031816959381103516, -0.00025731325149536133, -0.0001964569091796875, -0.00013560056686401367, -7.474422454833984e-05, -1.3887882232666016e-05, 4.696846008300781e-05, 0.00010782480239868164, 0.00016868114471435547, 0.0002295374870300293, 0.0002903938293457031, 0.00035125017166137695, 0.0004121065139770508, 0.0004729628562927246, 0.0005338191986083984, 0.0005946755409240723, 0.0006555318832397461, 0.0007163882255554199, 0.0007772445678710938, 0.0008381009101867676, 0.0008989572525024414, 0.0009598135948181152, 0.001020669937133789, 0.0010815262794494629, 0.0011423826217651367, 0.0012032389640808105, 0.0012640953063964844, 0.0013249516487121582, 0.001385807991027832, 0.0014466643333435059, 0.0015075206756591797, 0.0015683770179748535, 0.0016292333602905273, 0.0016900897026062012, 0.001750946044921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 7.0, 8.0, 11.0, 14.0, 27.0, 28.0, 45.0, 74.0, 138.0, 245.0, 446.0, 1140.0, 2693.0, 7920.0, 25196.0, 103417.0, 704934.0, 154465.0, 32021.0, 9880.0, 3329.0, 1261.0, 584.0, 286.0, 127.0, 89.0, 55.0, 40.0, 14.0, 14.0, 12.0, 11.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7109375, -8.4437255859375, -8.176513671875, -7.9093017578125, -7.64208984375, -7.3748779296875, -7.107666015625, -6.8404541015625, -6.5732421875, -6.3060302734375, -6.038818359375, -5.7716064453125, -5.50439453125, -5.2371826171875, -4.969970703125, -4.7027587890625, -4.435546875, -4.1683349609375, -3.901123046875, -3.6339111328125, -3.36669921875, -3.0994873046875, -2.832275390625, -2.5650634765625, -2.2978515625, -2.0306396484375, -1.763427734375, -1.4962158203125, -1.22900390625, -0.9617919921875, -0.694580078125, -0.4273681640625, -0.16015625, 0.1070556640625, 0.374267578125, 0.6414794921875, 0.90869140625, 1.1759033203125, 1.443115234375, 1.7103271484375, 1.9775390625, 2.2447509765625, 2.511962890625, 2.7791748046875, 3.04638671875, 3.3135986328125, 3.580810546875, 3.8480224609375, 4.115234375, 4.3824462890625, 4.649658203125, 4.9168701171875, 5.18408203125, 5.4512939453125, 5.718505859375, 5.9857177734375, 6.2529296875, 6.5201416015625, 6.787353515625, 7.0545654296875, 7.32177734375, 7.5889892578125, 7.856201171875, 8.1234130859375, 8.390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 3.0, 6.0, 8.0, 15.0, 22.0, 23.0, 31.0, 63.0, 107.0, 143.0, 175.0, 128.0, 88.0, 61.0, 35.0, 24.0, 10.0, 12.0, 11.0, 4.0, 8.0, 2.0, 7.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.1671142578125, -6.931884765625, -6.6966552734375, -6.46142578125, -6.2261962890625, -5.990966796875, -5.7557373046875, -5.5205078125, -5.2852783203125, -5.050048828125, -4.8148193359375, -4.57958984375, -4.3443603515625, -4.109130859375, -3.8739013671875, -3.638671875, -3.4034423828125, -3.168212890625, -2.9329833984375, -2.69775390625, -2.4625244140625, -2.227294921875, -1.9920654296875, -1.7568359375, -1.5216064453125, -1.286376953125, -1.0511474609375, -0.81591796875, -0.5806884765625, -0.345458984375, -0.1102294921875, 0.125, 0.3602294921875, 0.595458984375, 0.8306884765625, 1.06591796875, 1.3011474609375, 1.536376953125, 1.7716064453125, 2.0068359375, 2.2420654296875, 2.477294921875, 2.7125244140625, 2.94775390625, 3.1829833984375, 3.418212890625, 3.6534423828125, 3.888671875, 4.1239013671875, 4.359130859375, 4.5943603515625, 4.82958984375, 5.0648193359375, 5.300048828125, 5.5352783203125, 5.7705078125, 6.0057373046875, 6.240966796875, 6.4761962890625, 6.71142578125, 6.9466552734375, 7.181884765625, 7.4171142578125, 7.65234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 19.0, 17.0, 29.0, 73.0, 96.0, 144.0, 147.0, 129.0, 137.0, 90.0, 52.0, 28.0, 10.0, 11.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-95.45228576660156, -92.02389526367188, -88.59550476074219, -85.1671142578125, -81.73873138427734, -78.31034088134766, -74.88195037841797, -71.45355987548828, -68.02517700195312, -64.59678649902344, -61.168399810791016, -57.74000930786133, -54.311622619628906, -50.88323211669922, -47.45484161376953, -44.026451110839844, -40.598060607910156, -37.16967010498047, -33.74128341674805, -30.31289291381836, -26.884504318237305, -23.45611572265625, -20.027725219726562, -16.599336624145508, -13.170948028564453, -9.742559432983398, -6.314169883728027, -2.8857803344726562, 0.5426082611083984, 3.970996856689453, 7.399387359619141, 10.827775955200195, 14.25616455078125, 17.684553146362305, 21.11294174194336, 24.541332244873047, 27.9697208404541, 31.398109436035156, 34.826499938964844, 38.25489044189453, 41.68327713012695, 45.11166763305664, 48.54005432128906, 51.96844482421875, 55.39683532714844, 58.82522201538086, 62.25361251831055, 65.68199920654297, 69.11038970947266, 72.53878021240234, 75.96717071533203, 79.39555358886719, 82.82394409179688, 86.25233459472656, 89.68072509765625, 93.10911560058594, 96.53750610351562, 99.96589660644531, 103.394287109375, 106.82267761230469, 110.25106048583984, 113.67945098876953, 117.10784149169922, 120.5362319946289, 123.96461486816406]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 7.0, 12.0, 12.0, 11.0, 8.0, 11.0, 22.0, 24.0, 23.0, 26.0, 33.0, 33.0, 37.0, 36.0, 54.0, 44.0, 49.0, 46.0, 38.0, 40.0, 46.0, 37.0, 32.0, 36.0, 38.0, 35.0, 25.0, 32.0, 27.0, 16.0, 9.0, 13.0, 16.0, 9.0, 12.0, 10.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0], "bins": [-66.17778015136719, -64.39293670654297, -62.60809326171875, -60.82324981689453, -59.03840637207031, -57.253562927246094, -55.468719482421875, -53.683876037597656, -51.89903259277344, -50.11418914794922, -48.329345703125, -46.54450225830078, -44.75965881347656, -42.974815368652344, -41.189971923828125, -39.405128479003906, -37.62028503417969, -35.83544158935547, -34.05059814453125, -32.26575469970703, -30.480911254882812, -28.696067810058594, -26.911224365234375, -25.126380920410156, -23.341537475585938, -21.55669403076172, -19.7718505859375, -17.98700714111328, -16.202163696289062, -14.417320251464844, -12.632476806640625, -10.847633361816406, -9.062793731689453, -7.277950286865234, -5.493106842041016, -3.708263397216797, -1.9234199523925781, -0.13857650756835938, 1.6462669372558594, 3.431110382080078, 5.215953826904297, 7.000797271728516, 8.785640716552734, 10.570484161376953, 12.355327606201172, 14.14017105102539, 15.92501449584961, 17.709857940673828, 19.494701385498047, 21.279544830322266, 23.064388275146484, 24.849231719970703, 26.634075164794922, 28.41891860961914, 30.20376205444336, 31.988605499267578, 33.7734489440918, 35.558292388916016, 37.343135833740234, 39.12797927856445, 40.91282272338867, 42.69766616821289, 44.48250961303711, 46.26735305786133, 48.05219650268555]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 8.0, 7.0, 6.0, 16.0, 16.0, 22.0, 31.0, 73.0, 113.0, 234.0, 563.0, 1840.0, 10884.0, 1135923.0, 3029488.0, 12081.0, 1988.0, 548.0, 191.0, 109.0, 66.0, 24.0, 17.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.625, -57.9697265625, -56.314453125, -54.6591796875, -53.00390625, -51.3486328125, -49.693359375, -48.0380859375, -46.3828125, -44.7275390625, -43.072265625, -41.4169921875, -39.76171875, -38.1064453125, -36.451171875, -34.7958984375, -33.140625, -31.4853515625, -29.830078125, -28.1748046875, -26.51953125, -24.8642578125, -23.208984375, -21.5537109375, -19.8984375, -18.2431640625, -16.587890625, -14.9326171875, -13.27734375, -11.6220703125, -9.966796875, -8.3115234375, -6.65625, -5.0009765625, -3.345703125, -1.6904296875, -0.03515625, 1.6201171875, 3.275390625, 4.9306640625, 6.5859375, 8.2412109375, 9.896484375, 11.5517578125, 13.20703125, 14.8623046875, 16.517578125, 18.1728515625, 19.828125, 21.4833984375, 23.138671875, 24.7939453125, 26.44921875, 28.1044921875, 29.759765625, 31.4150390625, 33.0703125, 34.7255859375, 36.380859375, 38.0361328125, 39.69140625, 41.3466796875, 43.001953125, 44.6572265625, 46.3125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 7.0, 6.0, 13.0, 18.0, 19.0, 40.0, 47.0, 59.0, 72.0, 78.0, 71.0, 91.0, 74.0, 84.0, 66.0, 57.0, 49.0, 42.0, 30.0, 21.0, 22.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.807373046875, -3.66552734375, -3.523681640625, -3.3818359375, -3.239990234375, -3.09814453125, -2.956298828125, -2.814453125, -2.672607421875, -2.53076171875, -2.388916015625, -2.2470703125, -2.105224609375, -1.96337890625, -1.821533203125, -1.6796875, -1.537841796875, -1.39599609375, -1.254150390625, -1.1123046875, -0.970458984375, -0.82861328125, -0.686767578125, -0.544921875, -0.403076171875, -0.26123046875, -0.119384765625, 0.0224609375, 0.164306640625, 0.30615234375, 0.447998046875, 0.58984375, 0.731689453125, 0.87353515625, 1.015380859375, 1.1572265625, 1.299072265625, 1.44091796875, 1.582763671875, 1.724609375, 1.866455078125, 2.00830078125, 2.150146484375, 2.2919921875, 2.433837890625, 2.57568359375, 2.717529296875, 2.859375, 3.001220703125, 3.14306640625, 3.284912109375, 3.4267578125, 3.568603515625, 3.71044921875, 3.852294921875, 3.994140625, 4.135986328125, 4.27783203125, 4.419677734375, 4.5615234375, 4.703369140625, 4.84521484375, 4.987060546875, 5.12890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 9.0, 19.0, 38.0, 66.0, 134.0, 244.0, 722.0, 2228.0, 9519.0, 72417.0, 3926300.0, 163070.0, 14908.0, 3048.0, 935.0, 316.0, 151.0, 58.0, 39.0, 21.0, 9.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.59375, -43.547607421875, -42.50146484375, -41.455322265625, -40.4091796875, -39.363037109375, -38.31689453125, -37.270751953125, -36.224609375, -35.178466796875, -34.13232421875, -33.086181640625, -32.0400390625, -30.993896484375, -29.94775390625, -28.901611328125, -27.85546875, -26.809326171875, -25.76318359375, -24.717041015625, -23.6708984375, -22.624755859375, -21.57861328125, -20.532470703125, -19.486328125, -18.440185546875, -17.39404296875, -16.347900390625, -15.3017578125, -14.255615234375, -13.20947265625, -12.163330078125, -11.1171875, -10.071044921875, -9.02490234375, -7.978759765625, -6.9326171875, -5.886474609375, -4.84033203125, -3.794189453125, -2.748046875, -1.701904296875, -0.65576171875, 0.390380859375, 1.4365234375, 2.482666015625, 3.52880859375, 4.574951171875, 5.62109375, 6.667236328125, 7.71337890625, 8.759521484375, 9.8056640625, 10.851806640625, 11.89794921875, 12.944091796875, 13.990234375, 15.036376953125, 16.08251953125, 17.128662109375, 18.1748046875, 19.220947265625, 20.26708984375, 21.313232421875, 22.359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 10.0, 18.0, 24.0, 15.0, 37.0, 66.0, 106.0, 267.0, 913.0, 1720.0, 437.0, 165.0, 92.0, 56.0, 26.0, 25.0, 22.0, 19.0, 5.0, 8.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.3515625, -9.1298828125, -8.908203125, -8.6865234375, -8.46484375, -8.2431640625, -8.021484375, -7.7998046875, -7.578125, -7.3564453125, -7.134765625, -6.9130859375, -6.69140625, -6.4697265625, -6.248046875, -6.0263671875, -5.8046875, -5.5830078125, -5.361328125, -5.1396484375, -4.91796875, -4.6962890625, -4.474609375, -4.2529296875, -4.03125, -3.8095703125, -3.587890625, -3.3662109375, -3.14453125, -2.9228515625, -2.701171875, -2.4794921875, -2.2578125, -2.0361328125, -1.814453125, -1.5927734375, -1.37109375, -1.1494140625, -0.927734375, -0.7060546875, -0.484375, -0.2626953125, -0.041015625, 0.1806640625, 0.40234375, 0.6240234375, 0.845703125, 1.0673828125, 1.2890625, 1.5107421875, 1.732421875, 1.9541015625, 2.17578125, 2.3974609375, 2.619140625, 2.8408203125, 3.0625, 3.2841796875, 3.505859375, 3.7275390625, 3.94921875, 4.1708984375, 4.392578125, 4.6142578125, 4.8359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 24.0, 46.0, 102.0, 183.0, 257.0, 194.0, 111.0, 48.0, 24.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.7572021484375, -53.34828567504883, -50.93936538696289, -48.53044891357422, -46.12153244018555, -43.712615966796875, -41.30369567871094, -38.894779205322266, -36.485862731933594, -34.07694625854492, -31.668027877807617, -29.259109497070312, -26.85019302368164, -24.441274642944336, -22.03235626220703, -19.62343978881836, -17.214519500732422, -14.805602073669434, -12.396684646606445, -9.98776626586914, -7.578848838806152, -5.169931411743164, -2.7610130310058594, -0.3520965576171875, 2.056821823120117, 4.4657392501831055, 6.874657154083252, 9.283575057983398, 11.692492485046387, 14.101409912109375, 16.51032829284668, 18.91924476623535, 21.328163146972656, 23.73708152770996, 26.145998001098633, 28.554916381835938, 30.96383285522461, 33.37274932861328, 35.78166961669922, 38.19058609008789, 40.59950256347656, 43.008419036865234, 45.41733932495117, 47.826255798339844, 50.235172271728516, 52.64408874511719, 55.053009033203125, 57.4619255065918, 59.870845794677734, 62.279762268066406, 64.68868255615234, 67.09759521484375, 69.50651550292969, 71.91543579101562, 74.32435607910156, 76.73326873779297, 79.1421890258789, 81.55110931396484, 83.96002197265625, 86.36894226074219, 88.77786254882812, 91.18677520751953, 93.59569549560547, 96.00460815429688, 98.41352844238281]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 7.0, 9.0, 10.0, 9.0, 17.0, 27.0, 33.0, 32.0, 38.0, 34.0, 36.0, 55.0, 42.0, 46.0, 44.0, 41.0, 55.0, 49.0, 38.0, 40.0, 51.0, 42.0, 47.0, 28.0, 30.0, 26.0, 32.0, 16.0, 19.0, 11.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.991661071777344, -25.238811492919922, -24.485963821411133, -23.73311424255371, -22.980266571044922, -22.2274169921875, -21.474567413330078, -20.72171974182129, -19.968870162963867, -19.216020584106445, -18.463172912597656, -17.710323333740234, -16.957475662231445, -16.204626083374023, -15.451777458190918, -14.698928833007812, -13.946080207824707, -13.193231582641602, -12.440382957458496, -11.68753433227539, -10.934684753417969, -10.181836128234863, -9.428987503051758, -8.676137924194336, -7.923289775848389, -7.170441150665283, -6.4175920486450195, -5.664743423461914, -4.911894798278809, -4.159045696258545, -3.4061970710754395, -2.653347969055176, -1.9004993438720703, -1.1476504802703857, -0.3948017358779907, 0.3580470085144043, 1.1108958721160889, 1.8637447357177734, 2.616593360900879, 3.3694424629211426, 4.122291088104248, 4.8751397132873535, 5.627988815307617, 6.380837440490723, 7.133686065673828, 7.886535167694092, 8.639383316040039, 9.392232894897461, 10.145081520080566, 10.897930145263672, 11.650778770446777, 12.403627395629883, 13.156476974487305, 13.90932559967041, 14.662174224853516, 15.415023803710938, 16.167871475219727, 16.92072105407715, 17.673568725585938, 18.42641830444336, 19.17926597595215, 19.93211555480957, 20.68496322631836, 21.43781280517578, 22.190662384033203]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 0.0, 1.0, 4.0, 1.0, 9.0, 13.0, 15.0, 21.0, 31.0, 46.0, 94.0, 163.0, 278.0, 462.0, 956.0, 2205.0, 6003.0, 18568.0, 66088.0, 282279.0, 485859.0, 133863.0, 34722.0, 10366.0, 3565.0, 1464.0, 608.0, 351.0, 208.0, 119.0, 69.0, 48.0, 18.0, 25.0, 13.0, 15.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.24462890625, -10.7392578125, -10.23388671875, -9.728515625, -9.22314453125, -8.7177734375, -8.21240234375, -7.70703125, -7.20166015625, -6.6962890625, -6.19091796875, -5.685546875, -5.18017578125, -4.6748046875, -4.16943359375, -3.6640625, -3.15869140625, -2.6533203125, -2.14794921875, -1.642578125, -1.13720703125, -0.6318359375, -0.12646484375, 0.37890625, 0.88427734375, 1.3896484375, 1.89501953125, 2.400390625, 2.90576171875, 3.4111328125, 3.91650390625, 4.421875, 4.92724609375, 5.4326171875, 5.93798828125, 6.443359375, 6.94873046875, 7.4541015625, 7.95947265625, 8.46484375, 8.97021484375, 9.4755859375, 9.98095703125, 10.486328125, 10.99169921875, 11.4970703125, 12.00244140625, 12.5078125, 13.01318359375, 13.5185546875, 14.02392578125, 14.529296875, 15.03466796875, 15.5400390625, 16.04541015625, 16.55078125, 17.05615234375, 17.5615234375, 18.06689453125, 18.572265625, 19.07763671875, 19.5830078125, 20.08837890625, 20.59375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 15.0, 13.0, 15.0, 32.0, 33.0, 54.0, 55.0, 72.0, 84.0, 66.0, 85.0, 84.0, 61.0, 65.0, 59.0, 59.0, 40.0, 26.0, 23.0, 16.0, 17.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6484375, -4.50189208984375, -4.3553466796875, -4.20880126953125, -4.062255859375, -3.91571044921875, -3.7691650390625, -3.62261962890625, -3.47607421875, -3.32952880859375, -3.1829833984375, -3.03643798828125, -2.889892578125, -2.74334716796875, -2.5968017578125, -2.45025634765625, -2.3037109375, -2.15716552734375, -2.0106201171875, -1.86407470703125, -1.717529296875, -1.57098388671875, -1.4244384765625, -1.27789306640625, -1.13134765625, -0.98480224609375, -0.8382568359375, -0.69171142578125, -0.545166015625, -0.39862060546875, -0.2520751953125, -0.10552978515625, 0.041015625, 0.18756103515625, 0.3341064453125, 0.48065185546875, 0.627197265625, 0.77374267578125, 0.9202880859375, 1.06683349609375, 1.21337890625, 1.35992431640625, 1.5064697265625, 1.65301513671875, 1.799560546875, 1.94610595703125, 2.0926513671875, 2.23919677734375, 2.3857421875, 2.53228759765625, 2.6788330078125, 2.82537841796875, 2.971923828125, 3.11846923828125, 3.2650146484375, 3.41156005859375, 3.55810546875, 3.70465087890625, 3.8511962890625, 3.99774169921875, 4.144287109375, 4.29083251953125, 4.4373779296875, 4.58392333984375, 4.73046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 2.0, 6.0, 4.0, 6.0, 11.0, 18.0, 38.0, 42.0, 66.0, 160.0, 291.0, 735.0, 2155.0, 7722.0, 37144.0, 220886.0, 607693.0, 138647.0, 24506.0, 5634.0, 1660.0, 572.0, 246.0, 118.0, 65.0, 35.0, 19.0, 17.0, 7.0, 11.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.671875, -17.108642578125, -16.54541015625, -15.982177734375, -15.4189453125, -14.855712890625, -14.29248046875, -13.729248046875, -13.166015625, -12.602783203125, -12.03955078125, -11.476318359375, -10.9130859375, -10.349853515625, -9.78662109375, -9.223388671875, -8.66015625, -8.096923828125, -7.53369140625, -6.970458984375, -6.4072265625, -5.843994140625, -5.28076171875, -4.717529296875, -4.154296875, -3.591064453125, -3.02783203125, -2.464599609375, -1.9013671875, -1.338134765625, -0.77490234375, -0.211669921875, 0.3515625, 0.914794921875, 1.47802734375, 2.041259765625, 2.6044921875, 3.167724609375, 3.73095703125, 4.294189453125, 4.857421875, 5.420654296875, 5.98388671875, 6.547119140625, 7.1103515625, 7.673583984375, 8.23681640625, 8.800048828125, 9.36328125, 9.926513671875, 10.48974609375, 11.052978515625, 11.6162109375, 12.179443359375, 12.74267578125, 13.305908203125, 13.869140625, 14.432373046875, 14.99560546875, 15.558837890625, 16.1220703125, 16.685302734375, 17.24853515625, 17.811767578125, 18.375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 12.0, 15.0, 19.0, 17.0, 25.0, 30.0, 33.0, 39.0, 36.0, 32.0, 44.0, 48.0, 49.0, 51.0, 60.0, 51.0, 37.0, 38.0, 58.0, 53.0, 47.0, 34.0, 30.0, 22.0, 21.0, 14.0, 22.0, 10.0, 15.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.609375, -11.18701171875, -10.7646484375, -10.34228515625, -9.919921875, -9.49755859375, -9.0751953125, -8.65283203125, -8.23046875, -7.80810546875, -7.3857421875, -6.96337890625, -6.541015625, -6.11865234375, -5.6962890625, -5.27392578125, -4.8515625, -4.42919921875, -4.0068359375, -3.58447265625, -3.162109375, -2.73974609375, -2.3173828125, -1.89501953125, -1.47265625, -1.05029296875, -0.6279296875, -0.20556640625, 0.216796875, 0.63916015625, 1.0615234375, 1.48388671875, 1.90625, 2.32861328125, 2.7509765625, 3.17333984375, 3.595703125, 4.01806640625, 4.4404296875, 4.86279296875, 5.28515625, 5.70751953125, 6.1298828125, 6.55224609375, 6.974609375, 7.39697265625, 7.8193359375, 8.24169921875, 8.6640625, 9.08642578125, 9.5087890625, 9.93115234375, 10.353515625, 10.77587890625, 11.1982421875, 11.62060546875, 12.04296875, 12.46533203125, 12.8876953125, 13.31005859375, 13.732421875, 14.15478515625, 14.5771484375, 14.99951171875, 15.421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 11.0, 12.0, 19.0, 28.0, 53.0, 54.0, 102.0, 137.0, 212.0, 402.0, 878.0, 2234.0, 10209.0, 116679.0, 870219.0, 38852.0, 5378.0, 1552.0, 663.0, 329.0, 191.0, 99.0, 77.0, 44.0, 23.0, 28.0, 13.0, 13.0, 5.0, 9.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.921875, -23.28076171875, -22.6396484375, -21.99853515625, -21.357421875, -20.71630859375, -20.0751953125, -19.43408203125, -18.79296875, -18.15185546875, -17.5107421875, -16.86962890625, -16.228515625, -15.58740234375, -14.9462890625, -14.30517578125, -13.6640625, -13.02294921875, -12.3818359375, -11.74072265625, -11.099609375, -10.45849609375, -9.8173828125, -9.17626953125, -8.53515625, -7.89404296875, -7.2529296875, -6.61181640625, -5.970703125, -5.32958984375, -4.6884765625, -4.04736328125, -3.40625, -2.76513671875, -2.1240234375, -1.48291015625, -0.841796875, -0.20068359375, 0.4404296875, 1.08154296875, 1.72265625, 2.36376953125, 3.0048828125, 3.64599609375, 4.287109375, 4.92822265625, 5.5693359375, 6.21044921875, 6.8515625, 7.49267578125, 8.1337890625, 8.77490234375, 9.416015625, 10.05712890625, 10.6982421875, 11.33935546875, 11.98046875, 12.62158203125, 13.2626953125, 13.90380859375, 14.544921875, 15.18603515625, 15.8271484375, 16.46826171875, 17.109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 9.0, 5.0, 19.0, 15.0, 34.0, 42.0, 39.0, 85.0, 224.0, 206.0, 117.0, 66.0, 35.0, 28.0, 22.0, 12.0, 10.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.002765655517578125, -0.002699941396713257, -0.0026342272758483887, -0.0025685131549835205, -0.0025027990341186523, -0.002437084913253784, -0.002371370792388916, -0.002305656671524048, -0.0022399425506591797, -0.0021742284297943115, -0.0021085143089294434, -0.002042800188064575, -0.001977086067199707, -0.0019113719463348389, -0.0018456578254699707, -0.0017799437046051025, -0.0017142295837402344, -0.0016485154628753662, -0.001582801342010498, -0.0015170872211456299, -0.0014513731002807617, -0.0013856589794158936, -0.0013199448585510254, -0.0012542307376861572, -0.001188516616821289, -0.001122802495956421, -0.0010570883750915527, -0.0009913742542266846, -0.0009256601333618164, -0.0008599460124969482, -0.0007942318916320801, -0.0007285177707672119, -0.0006628036499023438, -0.0005970895290374756, -0.0005313754081726074, -0.00046566128730773926, -0.0003999471664428711, -0.00033423304557800293, -0.00026851892471313477, -0.0002028048038482666, -0.00013709068298339844, -7.137656211853027e-05, -5.662441253662109e-06, 6.0051679611206055e-05, 0.00012576580047607422, 0.00019147992134094238, 0.00025719404220581055, 0.0003229081630706787, 0.0003886222839355469, 0.00045433640480041504, 0.0005200505256652832, 0.0005857646465301514, 0.0006514787673950195, 0.0007171928882598877, 0.0007829070091247559, 0.000848621129989624, 0.0009143352508544922, 0.0009800493717193604, 0.0010457634925842285, 0.0011114776134490967, 0.0011771917343139648, 0.001242905855178833, 0.0013086199760437012, 0.0013743340969085693, 0.0014400482177734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 9.0, 17.0, 18.0, 28.0, 57.0, 122.0, 282.0, 1091.0, 6676.0, 126394.0, 893892.0, 17107.0, 2007.0, 497.0, 179.0, 80.0, 43.0, 20.0, 15.0, 8.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-43.0625, -42.109619140625, -41.15673828125, -40.203857421875, -39.2509765625, -38.298095703125, -37.34521484375, -36.392333984375, -35.439453125, -34.486572265625, -33.53369140625, -32.580810546875, -31.6279296875, -30.675048828125, -29.72216796875, -28.769287109375, -27.81640625, -26.863525390625, -25.91064453125, -24.957763671875, -24.0048828125, -23.052001953125, -22.09912109375, -21.146240234375, -20.193359375, -19.240478515625, -18.28759765625, -17.334716796875, -16.3818359375, -15.428955078125, -14.47607421875, -13.523193359375, -12.5703125, -11.617431640625, -10.66455078125, -9.711669921875, -8.7587890625, -7.805908203125, -6.85302734375, -5.900146484375, -4.947265625, -3.994384765625, -3.04150390625, -2.088623046875, -1.1357421875, -0.182861328125, 0.77001953125, 1.722900390625, 2.67578125, 3.628662109375, 4.58154296875, 5.534423828125, 6.4873046875, 7.440185546875, 8.39306640625, 9.345947265625, 10.298828125, 11.251708984375, 12.20458984375, 13.157470703125, 14.1103515625, 15.063232421875, 16.01611328125, 16.968994140625, 17.921875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 20.0, 23.0, 34.0, 83.0, 196.0, 314.0, 144.0, 64.0, 40.0, 21.0, 23.0, 2.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.21875, -18.7305908203125, -18.242431640625, -17.7542724609375, -17.26611328125, -16.7779541015625, -16.289794921875, -15.8016357421875, -15.3134765625, -14.8253173828125, -14.337158203125, -13.8489990234375, -13.36083984375, -12.8726806640625, -12.384521484375, -11.8963623046875, -11.408203125, -10.9200439453125, -10.431884765625, -9.9437255859375, -9.45556640625, -8.9674072265625, -8.479248046875, -7.9910888671875, -7.5029296875, -7.0147705078125, -6.526611328125, -6.0384521484375, -5.55029296875, -5.0621337890625, -4.573974609375, -4.0858154296875, -3.59765625, -3.1094970703125, -2.621337890625, -2.1331787109375, -1.64501953125, -1.1568603515625, -0.668701171875, -0.1805419921875, 0.3076171875, 0.7957763671875, 1.283935546875, 1.7720947265625, 2.26025390625, 2.7484130859375, 3.236572265625, 3.7247314453125, 4.212890625, 4.7010498046875, 5.189208984375, 5.6773681640625, 6.16552734375, 6.6536865234375, 7.141845703125, 7.6300048828125, 8.1181640625, 8.6063232421875, 9.094482421875, 9.5826416015625, 10.07080078125, 10.5589599609375, 11.047119140625, 11.5352783203125, 12.0234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 37.0, 62.0, 118.0, 227.0, 262.0, 179.0, 71.0, 30.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.67164611816406, -156.66128540039062, -149.6509246826172, -142.64056396484375, -135.63021850585938, -128.61984252929688, -121.6094970703125, -114.59913635253906, -107.58877563476562, -100.57841491699219, -93.56805419921875, -86.55770111083984, -79.5473403930664, -72.53697967529297, -65.52662658691406, -58.516265869140625, -51.50590515136719, -44.49554443359375, -37.48518753051758, -30.474828720092773, -23.46446990966797, -16.45410919189453, -9.44375228881836, -2.4333953857421875, 4.57696533203125, 11.587324142456055, 18.59768295288086, 25.608041763305664, 32.61840057373047, 39.628761291503906, 46.63911819458008, 53.64947509765625, 60.659820556640625, 67.67018127441406, 74.6805419921875, 81.6908950805664, 88.70125579833984, 95.71161651611328, 102.72196960449219, 109.73233032226562, 116.74269104003906, 123.7530517578125, 130.76341247558594, 137.77377319335938, 144.78411865234375, 151.79449462890625, 158.80484008789062, 165.81520080566406, 172.8255615234375, 179.83592224121094, 186.84628295898438, 193.8566436767578, 200.86700439453125, 207.87734985351562, 214.88771057128906, 221.8980712890625, 228.90843200683594, 235.91879272460938, 242.9291534423828, 249.93951416015625, 256.9498596191406, 263.9602355957031, 270.9705810546875, 277.98095703125, 284.9913024902344]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 9.0, 9.0, 14.0, 22.0, 18.0, 12.0, 18.0, 24.0, 30.0, 26.0, 30.0, 34.0, 39.0, 39.0, 44.0, 48.0, 52.0, 38.0, 46.0, 36.0, 39.0, 41.0, 31.0, 39.0, 29.0, 25.0, 25.0, 21.0, 19.0, 26.0, 27.0, 16.0, 12.0, 12.0, 3.0, 5.0, 5.0, 7.0, 4.0, 3.0, 3.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-52.840850830078125, -51.15983963012695, -49.478824615478516, -47.797813415527344, -46.116798400878906, -44.435787200927734, -42.7547721862793, -41.073760986328125, -39.39274597167969, -37.711734771728516, -36.03071975708008, -34.349708557128906, -32.66869354248047, -30.987682342529297, -29.30666732788086, -27.625656127929688, -25.944643020629883, -24.263629913330078, -22.582616806030273, -20.90160369873047, -19.220590591430664, -17.53957748413086, -15.858565330505371, -14.177552223205566, -12.496539115905762, -10.815526008605957, -9.134512901306152, -7.453500270843506, -5.772487163543701, -4.091474533081055, -2.41046142578125, -0.7294483184814453, 0.9515647888183594, 2.632577896118164, 4.313591003417969, 5.994603633880615, 7.67561674118042, 9.356629371643066, 11.037642478942871, 12.718655586242676, 14.39966869354248, 16.08068084716797, 17.761693954467773, 19.442707061767578, 21.123720169067383, 22.804733276367188, 24.485746383666992, 26.166759490966797, 27.8477725982666, 29.528785705566406, 31.20979881286621, 32.890811920166016, 34.57182312011719, 36.252838134765625, 37.9338493347168, 39.614864349365234, 41.295875549316406, 42.97688674926758, 44.657901763916016, 46.33891296386719, 48.019927978515625, 49.7009391784668, 51.381954193115234, 53.062965393066406, 54.743980407714844]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 3.0, 7.0, 12.0, 9.0, 13.0, 19.0, 41.0, 67.0, 65.0, 112.0, 220.0, 354.0, 674.0, 1412.0, 3272.0, 9423.0, 39588.0, 3373648.0, 719151.0, 31855.0, 8368.0, 3075.0, 1273.0, 696.0, 345.0, 194.0, 136.0, 69.0, 54.0, 32.0, 17.0, 8.0, 17.0, 6.0, 9.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-41.53125, -40.464599609375, -39.39794921875, -38.331298828125, -37.2646484375, -36.197998046875, -35.13134765625, -34.064697265625, -32.998046875, -31.931396484375, -30.86474609375, -29.798095703125, -28.7314453125, -27.664794921875, -26.59814453125, -25.531494140625, -24.46484375, -23.398193359375, -22.33154296875, -21.264892578125, -20.1982421875, -19.131591796875, -18.06494140625, -16.998291015625, -15.931640625, -14.864990234375, -13.79833984375, -12.731689453125, -11.6650390625, -10.598388671875, -9.53173828125, -8.465087890625, -7.3984375, -6.331787109375, -5.26513671875, -4.198486328125, -3.1318359375, -2.065185546875, -0.99853515625, 0.068115234375, 1.134765625, 2.201416015625, 3.26806640625, 4.334716796875, 5.4013671875, 6.468017578125, 7.53466796875, 8.601318359375, 9.66796875, 10.734619140625, 11.80126953125, 12.867919921875, 13.9345703125, 15.001220703125, 16.06787109375, 17.134521484375, 18.201171875, 19.267822265625, 20.33447265625, 21.401123046875, 22.4677734375, 23.534423828125, 24.60107421875, 25.667724609375, 26.734375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 25.0, 41.0, 56.0, 79.0, 78.0, 103.0, 105.0, 104.0, 93.0, 69.0, 76.0, 47.0, 43.0, 34.0, 14.0, 7.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.328125, -7.1243896484375, -6.920654296875, -6.7169189453125, -6.51318359375, -6.3094482421875, -6.105712890625, -5.9019775390625, -5.6982421875, -5.4945068359375, -5.290771484375, -5.0870361328125, -4.88330078125, -4.6795654296875, -4.475830078125, -4.2720947265625, -4.068359375, -3.8646240234375, -3.660888671875, -3.4571533203125, -3.25341796875, -3.0496826171875, -2.845947265625, -2.6422119140625, -2.4384765625, -2.2347412109375, -2.031005859375, -1.8272705078125, -1.62353515625, -1.4197998046875, -1.216064453125, -1.0123291015625, -0.80859375, -0.6048583984375, -0.401123046875, -0.1973876953125, 0.00634765625, 0.2100830078125, 0.413818359375, 0.6175537109375, 0.8212890625, 1.0250244140625, 1.228759765625, 1.4324951171875, 1.63623046875, 1.8399658203125, 2.043701171875, 2.2474365234375, 2.451171875, 2.6549072265625, 2.858642578125, 3.0623779296875, 3.26611328125, 3.4698486328125, 3.673583984375, 3.8773193359375, 4.0810546875, 4.2847900390625, 4.488525390625, 4.6922607421875, 4.89599609375, 5.0997314453125, 5.303466796875, 5.5072021484375, 5.7109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 13.0, 11.0, 29.0, 35.0, 77.0, 164.0, 297.0, 607.0, 1663.0, 7909.0, 82297.0, 4016711.0, 74208.0, 7473.0, 1629.0, 578.0, 290.0, 145.0, 60.0, 38.0, 23.0, 10.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.75, -64.1650390625, -62.580078125, -60.9951171875, -59.41015625, -57.8251953125, -56.240234375, -54.6552734375, -53.0703125, -51.4853515625, -49.900390625, -48.3154296875, -46.73046875, -45.1455078125, -43.560546875, -41.9755859375, -40.390625, -38.8056640625, -37.220703125, -35.6357421875, -34.05078125, -32.4658203125, -30.880859375, -29.2958984375, -27.7109375, -26.1259765625, -24.541015625, -22.9560546875, -21.37109375, -19.7861328125, -18.201171875, -16.6162109375, -15.03125, -13.4462890625, -11.861328125, -10.2763671875, -8.69140625, -7.1064453125, -5.521484375, -3.9365234375, -2.3515625, -0.7666015625, 0.818359375, 2.4033203125, 3.98828125, 5.5732421875, 7.158203125, 8.7431640625, 10.328125, 11.9130859375, 13.498046875, 15.0830078125, 16.66796875, 18.2529296875, 19.837890625, 21.4228515625, 23.0078125, 24.5927734375, 26.177734375, 27.7626953125, 29.34765625, 30.9326171875, 32.517578125, 34.1025390625, 35.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 9.0, 13.0, 17.0, 30.0, 30.0, 58.0, 145.0, 479.0, 2597.0, 412.0, 124.0, 63.0, 32.0, 15.0, 19.0, 7.0, 11.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.109375, -15.7296142578125, -15.349853515625, -14.9700927734375, -14.59033203125, -14.2105712890625, -13.830810546875, -13.4510498046875, -13.0712890625, -12.6915283203125, -12.311767578125, -11.9320068359375, -11.55224609375, -11.1724853515625, -10.792724609375, -10.4129638671875, -10.033203125, -9.6534423828125, -9.273681640625, -8.8939208984375, -8.51416015625, -8.1343994140625, -7.754638671875, -7.3748779296875, -6.9951171875, -6.6153564453125, -6.235595703125, -5.8558349609375, -5.47607421875, -5.0963134765625, -4.716552734375, -4.3367919921875, -3.95703125, -3.5772705078125, -3.197509765625, -2.8177490234375, -2.43798828125, -2.0582275390625, -1.678466796875, -1.2987060546875, -0.9189453125, -0.5391845703125, -0.159423828125, 0.2203369140625, 0.60009765625, 0.9798583984375, 1.359619140625, 1.7393798828125, 2.119140625, 2.4989013671875, 2.878662109375, 3.2584228515625, 3.63818359375, 4.0179443359375, 4.397705078125, 4.7774658203125, 5.1572265625, 5.5369873046875, 5.916748046875, 6.2965087890625, 6.67626953125, 7.0560302734375, 7.435791015625, 7.8155517578125, 8.1953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 7.0, 7.0, 23.0, 19.0, 49.0, 75.0, 125.0, 174.0, 170.0, 135.0, 90.0, 56.0, 30.0, 16.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.50460052490234, -65.521728515625, -63.538856506347656, -61.55598449707031, -59.5731086730957, -57.59023666381836, -55.607364654541016, -53.62449264526367, -51.64162063598633, -49.658748626708984, -47.67587661743164, -45.69300079345703, -43.71012878417969, -41.727256774902344, -39.744384765625, -37.761512756347656, -35.77864074707031, -33.79576873779297, -31.812894821166992, -29.83002281188965, -27.847150802612305, -25.864276885986328, -23.881404876708984, -21.89853286743164, -19.91565704345703, -17.932785034179688, -15.949912071228027, -13.967039108276367, -11.984167098999023, -10.001294136047363, -8.018421173095703, -6.035549163818359, -4.052677154541016, -2.0698046684265137, -0.08693194389343262, 1.8959407806396484, 3.8788132667541504, 5.861685752868652, 7.8445587158203125, 9.827430725097656, 11.810303688049316, 13.793176651000977, 15.77604866027832, 17.758922576904297, 19.74179458618164, 21.724666595458984, 23.707538604736328, 25.690410614013672, 27.67328453063965, 29.656156539916992, 31.63903045654297, 33.62190246582031, 35.604774475097656, 37.587646484375, 39.570518493652344, 41.55339050292969, 43.5362663269043, 45.51913833618164, 47.502010345458984, 49.484886169433594, 51.46775817871094, 53.45063018798828, 55.433502197265625, 57.41637420654297, 59.39924621582031]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 8.0, 12.0, 13.0, 14.0, 25.0, 23.0, 28.0, 28.0, 38.0, 51.0, 36.0, 42.0, 43.0, 50.0, 55.0, 55.0, 55.0, 52.0, 49.0, 38.0, 37.0, 28.0, 36.0, 24.0, 30.0, 21.0, 18.0, 21.0, 14.0, 6.0, 9.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.11056137084961, -31.223161697387695, -30.33576202392578, -29.448360443115234, -28.56096076965332, -27.673561096191406, -26.786161422729492, -25.898761749267578, -25.011362075805664, -24.12396240234375, -23.236562728881836, -22.349163055419922, -21.461761474609375, -20.57436180114746, -19.686962127685547, -18.799562454223633, -17.91216278076172, -17.024763107299805, -16.13736343383789, -15.24996280670166, -14.362563133239746, -13.475162506103516, -12.587762832641602, -11.700363159179688, -10.81296157836914, -9.925561904907227, -9.038161277770996, -8.150761604309082, -7.263361930847168, -6.375961780548096, -5.488561630249023, -4.601161956787109, -3.7137622833251953, -2.826362371444702, -1.9389623403549194, -1.0515623092651367, -0.16416239738464355, 0.7232375144958496, 1.6106376647949219, 2.498037338256836, 3.385437488555908, 4.2728376388549805, 5.1602373123168945, 6.047637462615967, 6.935037612915039, 7.822437286376953, 8.709836959838867, 9.597236633300781, 10.484637260437012, 11.372036933898926, 12.259437561035156, 13.14683723449707, 14.034236907958984, 14.921636581420898, 15.809037208557129, 16.69643783569336, 17.583837509155273, 18.471237182617188, 19.3586368560791, 20.246036529541016, 21.133438110351562, 22.020837783813477, 22.90823745727539, 23.795637130737305, 24.68303680419922]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 9.0, 12.0, 12.0, 17.0, 25.0, 37.0, 44.0, 93.0, 157.0, 231.0, 476.0, 805.0, 1836.0, 4356.0, 12676.0, 41471.0, 155843.0, 485498.0, 250641.0, 64398.0, 18677.0, 6359.0, 2489.0, 1076.0, 554.0, 295.0, 170.0, 91.0, 58.0, 53.0, 31.0, 15.0, 10.0, 12.0, 6.0, 3.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.4375, -19.792236328125, -19.14697265625, -18.501708984375, -17.8564453125, -17.211181640625, -16.56591796875, -15.920654296875, -15.275390625, -14.630126953125, -13.98486328125, -13.339599609375, -12.6943359375, -12.049072265625, -11.40380859375, -10.758544921875, -10.11328125, -9.468017578125, -8.82275390625, -8.177490234375, -7.5322265625, -6.886962890625, -6.24169921875, -5.596435546875, -4.951171875, -4.305908203125, -3.66064453125, -3.015380859375, -2.3701171875, -1.724853515625, -1.07958984375, -0.434326171875, 0.2109375, 0.856201171875, 1.50146484375, 2.146728515625, 2.7919921875, 3.437255859375, 4.08251953125, 4.727783203125, 5.373046875, 6.018310546875, 6.66357421875, 7.308837890625, 7.9541015625, 8.599365234375, 9.24462890625, 9.889892578125, 10.53515625, 11.180419921875, 11.82568359375, 12.470947265625, 13.1162109375, 13.761474609375, 14.40673828125, 15.052001953125, 15.697265625, 16.342529296875, 16.98779296875, 17.633056640625, 18.2783203125, 18.923583984375, 19.56884765625, 20.214111328125, 20.859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 13.0, 8.0, 24.0, 18.0, 28.0, 27.0, 41.0, 39.0, 47.0, 66.0, 70.0, 80.0, 74.0, 83.0, 53.0, 62.0, 54.0, 47.0, 39.0, 33.0, 23.0, 20.0, 11.0, 13.0, 12.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90234375, -4.7408447265625, -4.579345703125, -4.4178466796875, -4.25634765625, -4.0948486328125, -3.933349609375, -3.7718505859375, -3.6103515625, -3.4488525390625, -3.287353515625, -3.1258544921875, -2.96435546875, -2.8028564453125, -2.641357421875, -2.4798583984375, -2.318359375, -2.1568603515625, -1.995361328125, -1.8338623046875, -1.67236328125, -1.5108642578125, -1.349365234375, -1.1878662109375, -1.0263671875, -0.8648681640625, -0.703369140625, -0.5418701171875, -0.38037109375, -0.2188720703125, -0.057373046875, 0.1041259765625, 0.265625, 0.4271240234375, 0.588623046875, 0.7501220703125, 0.91162109375, 1.0731201171875, 1.234619140625, 1.3961181640625, 1.5576171875, 1.7191162109375, 1.880615234375, 2.0421142578125, 2.20361328125, 2.3651123046875, 2.526611328125, 2.6881103515625, 2.849609375, 3.0111083984375, 3.172607421875, 3.3341064453125, 3.49560546875, 3.6571044921875, 3.818603515625, 3.9801025390625, 4.1416015625, 4.3031005859375, 4.464599609375, 4.6260986328125, 4.78759765625, 4.9490966796875, 5.110595703125, 5.2720947265625, 5.43359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 15.0, 24.0, 28.0, 46.0, 77.0, 103.0, 162.0, 287.0, 547.0, 1284.0, 4486.0, 26410.0, 281310.0, 655671.0, 65503.0, 8841.0, 2091.0, 719.0, 367.0, 173.0, 134.0, 79.0, 56.0, 46.0, 30.0, 15.0, 7.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.34375, -30.33935546875, -29.3349609375, -28.33056640625, -27.326171875, -26.32177734375, -25.3173828125, -24.31298828125, -23.30859375, -22.30419921875, -21.2998046875, -20.29541015625, -19.291015625, -18.28662109375, -17.2822265625, -16.27783203125, -15.2734375, -14.26904296875, -13.2646484375, -12.26025390625, -11.255859375, -10.25146484375, -9.2470703125, -8.24267578125, -7.23828125, -6.23388671875, -5.2294921875, -4.22509765625, -3.220703125, -2.21630859375, -1.2119140625, -0.20751953125, 0.796875, 1.80126953125, 2.8056640625, 3.81005859375, 4.814453125, 5.81884765625, 6.8232421875, 7.82763671875, 8.83203125, 9.83642578125, 10.8408203125, 11.84521484375, 12.849609375, 13.85400390625, 14.8583984375, 15.86279296875, 16.8671875, 17.87158203125, 18.8759765625, 19.88037109375, 20.884765625, 21.88916015625, 22.8935546875, 23.89794921875, 24.90234375, 25.90673828125, 26.9111328125, 27.91552734375, 28.919921875, 29.92431640625, 30.9287109375, 31.93310546875, 32.9375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 6.0, 11.0, 6.0, 9.0, 16.0, 21.0, 17.0, 28.0, 33.0, 35.0, 29.0, 45.0, 53.0, 56.0, 38.0, 59.0, 57.0, 53.0, 49.0, 47.0, 42.0, 49.0, 45.0, 35.0, 17.0, 24.0, 17.0, 21.0, 10.0, 14.0, 10.0, 10.0, 5.0, 5.0, 6.0, 3.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.842529296875, -18.18505859375, -17.527587890625, -16.8701171875, -16.212646484375, -15.55517578125, -14.897705078125, -14.240234375, -13.582763671875, -12.92529296875, -12.267822265625, -11.6103515625, -10.952880859375, -10.29541015625, -9.637939453125, -8.98046875, -8.322998046875, -7.66552734375, -7.008056640625, -6.3505859375, -5.693115234375, -5.03564453125, -4.378173828125, -3.720703125, -3.063232421875, -2.40576171875, -1.748291015625, -1.0908203125, -0.433349609375, 0.22412109375, 0.881591796875, 1.5390625, 2.196533203125, 2.85400390625, 3.511474609375, 4.1689453125, 4.826416015625, 5.48388671875, 6.141357421875, 6.798828125, 7.456298828125, 8.11376953125, 8.771240234375, 9.4287109375, 10.086181640625, 10.74365234375, 11.401123046875, 12.05859375, 12.716064453125, 13.37353515625, 14.031005859375, 14.6884765625, 15.345947265625, 16.00341796875, 16.660888671875, 17.318359375, 17.975830078125, 18.63330078125, 19.290771484375, 19.9482421875, 20.605712890625, 21.26318359375, 21.920654296875, 22.578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 10.0, 11.0, 19.0, 18.0, 27.0, 46.0, 59.0, 103.0, 150.0, 237.0, 377.0, 675.0, 1146.0, 2430.0, 5623.0, 16325.0, 78042.0, 746649.0, 157618.0, 24650.0, 7635.0, 3172.0, 1478.0, 835.0, 424.0, 256.0, 186.0, 117.0, 74.0, 49.0, 24.0, 32.0, 14.0, 9.0, 6.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.390625, -18.796875, -18.203125, -17.609375, -17.015625, -16.421875, -15.828125, -15.234375, -14.640625, -14.046875, -13.453125, -12.859375, -12.265625, -11.671875, -11.078125, -10.484375, -9.890625, -9.296875, -8.703125, -8.109375, -7.515625, -6.921875, -6.328125, -5.734375, -5.140625, -4.546875, -3.953125, -3.359375, -2.765625, -2.171875, -1.578125, -0.984375, -0.390625, 0.203125, 0.796875, 1.390625, 1.984375, 2.578125, 3.171875, 3.765625, 4.359375, 4.953125, 5.546875, 6.140625, 6.734375, 7.328125, 7.921875, 8.515625, 9.109375, 9.703125, 10.296875, 10.890625, 11.484375, 12.078125, 12.671875, 13.265625, 13.859375, 14.453125, 15.046875, 15.640625, 16.234375, 16.828125, 17.421875, 18.015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 10.0, 21.0, 19.0, 39.0, 68.0, 121.0, 347.0, 174.0, 83.0, 37.0, 20.0, 17.0, 4.0, 5.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0052947998046875, -0.005122542381286621, -0.004950284957885742, -0.004778027534484863, -0.004605770111083984, -0.0044335126876831055, -0.0042612552642822266, -0.004088997840881348, -0.003916740417480469, -0.00374448299407959, -0.003572225570678711, -0.003399968147277832, -0.003227710723876953, -0.0030554533004760742, -0.0028831958770751953, -0.0027109384536743164, -0.0025386810302734375, -0.0023664236068725586, -0.0021941661834716797, -0.0020219087600708008, -0.0018496513366699219, -0.001677393913269043, -0.001505136489868164, -0.0013328790664672852, -0.0011606216430664062, -0.0009883642196655273, -0.0008161067962646484, -0.0006438493728637695, -0.0004715919494628906, -0.0002993345260620117, -0.0001270771026611328, 4.5180320739746094e-05, 0.000217437744140625, 0.0003896951675415039, 0.0005619525909423828, 0.0007342100143432617, 0.0009064674377441406, 0.0010787248611450195, 0.0012509822845458984, 0.0014232397079467773, 0.0015954971313476562, 0.0017677545547485352, 0.001940011978149414, 0.002112269401550293, 0.002284526824951172, 0.0024567842483520508, 0.0026290416717529297, 0.0028012990951538086, 0.0029735565185546875, 0.0031458139419555664, 0.0033180713653564453, 0.0034903287887573242, 0.003662586212158203, 0.003834843635559082, 0.004007101058959961, 0.00417935848236084, 0.004351615905761719, 0.004523873329162598, 0.0046961307525634766, 0.0048683881759643555, 0.005040645599365234, 0.005212903022766113, 0.005385160446166992, 0.005557417869567871, 0.00572967529296875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 12.0, 11.0, 17.0, 25.0, 38.0, 60.0, 124.0, 215.0, 409.0, 877.0, 2291.0, 8689.0, 67458.0, 896661.0, 59562.0, 8058.0, 2276.0, 838.0, 407.0, 213.0, 130.0, 64.0, 49.0, 24.0, 9.0, 9.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -36.951171875, -35.77734375, -34.603515625, -33.4296875, -32.255859375, -31.08203125, -29.908203125, -28.734375, -27.560546875, -26.38671875, -25.212890625, -24.0390625, -22.865234375, -21.69140625, -20.517578125, -19.34375, -18.169921875, -16.99609375, -15.822265625, -14.6484375, -13.474609375, -12.30078125, -11.126953125, -9.953125, -8.779296875, -7.60546875, -6.431640625, -5.2578125, -4.083984375, -2.91015625, -1.736328125, -0.5625, 0.611328125, 1.78515625, 2.958984375, 4.1328125, 5.306640625, 6.48046875, 7.654296875, 8.828125, 10.001953125, 11.17578125, 12.349609375, 13.5234375, 14.697265625, 15.87109375, 17.044921875, 18.21875, 19.392578125, 20.56640625, 21.740234375, 22.9140625, 24.087890625, 25.26171875, 26.435546875, 27.609375, 28.783203125, 29.95703125, 31.130859375, 32.3046875, 33.478515625, 34.65234375, 35.826171875, 37.0]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 2.0, 1.0, 3.0, 9.0, 11.0, 12.0, 17.0, 9.0, 21.0, 20.0, 46.0, 80.0, 164.0, 233.0, 140.0, 78.0, 45.0, 29.0, 26.0, 9.0, 8.0, 9.0, 9.0, 4.0, 3.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.859375, -22.19287109375, -21.5263671875, -20.85986328125, -20.193359375, -19.52685546875, -18.8603515625, -18.19384765625, -17.52734375, -16.86083984375, -16.1943359375, -15.52783203125, -14.861328125, -14.19482421875, -13.5283203125, -12.86181640625, -12.1953125, -11.52880859375, -10.8623046875, -10.19580078125, -9.529296875, -8.86279296875, -8.1962890625, -7.52978515625, -6.86328125, -6.19677734375, -5.5302734375, -4.86376953125, -4.197265625, -3.53076171875, -2.8642578125, -2.19775390625, -1.53125, -0.86474609375, -0.1982421875, 0.46826171875, 1.134765625, 1.80126953125, 2.4677734375, 3.13427734375, 3.80078125, 4.46728515625, 5.1337890625, 5.80029296875, 6.466796875, 7.13330078125, 7.7998046875, 8.46630859375, 9.1328125, 9.79931640625, 10.4658203125, 11.13232421875, 11.798828125, 12.46533203125, 13.1318359375, 13.79833984375, 14.46484375, 15.13134765625, 15.7978515625, 16.46435546875, 17.130859375, 17.79736328125, 18.4638671875, 19.13037109375, 19.796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 20.0, 34.0, 51.0, 103.0, 133.0, 165.0, 165.0, 143.0, 99.0, 45.0, 14.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.7103729248047, -228.84329223632812, -220.9761962890625, -213.10911560058594, -205.24203491210938, -197.37493896484375, -189.5078582763672, -181.64077758789062, -173.773681640625, -165.90660095214844, -158.0395050048828, -150.17242431640625, -142.30532836914062, -134.43824768066406, -126.5711669921875, -118.7040786743164, -110.83699035644531, -102.96990203857422, -95.10281372070312, -87.23573303222656, -79.36864471435547, -71.50155639648438, -63.63447189331055, -55.76738739013672, -47.900299072265625, -40.03321075439453, -32.1661262512207, -24.299039840698242, -16.43195343017578, -8.564865112304688, -0.6977806091308594, 7.169303894042969, 15.036376953125, 22.90346336364746, 30.770549774169922, 38.63763427734375, 46.504722595214844, 54.37181091308594, 62.238895416259766, 70.1059799194336, 77.97306823730469, 85.84015655517578, 93.70724487304688, 101.57432556152344, 109.44141387939453, 117.30850219726562, 125.17558288574219, 133.04266357421875, 140.90975952148438, 148.77684020996094, 156.64393615722656, 164.51101684570312, 172.37811279296875, 180.2451934814453, 188.11227416992188, 195.9793701171875, 203.84645080566406, 211.71353149414062, 219.58062744140625, 227.4477081298828, 235.31478881835938, 243.181884765625, 251.04896545410156, 258.9160461425781, 266.78314208984375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 2.0, 10.0, 7.0, 8.0, 21.0, 11.0, 22.0, 30.0, 22.0, 41.0, 46.0, 43.0, 47.0, 59.0, 49.0, 60.0, 59.0, 62.0, 47.0, 50.0, 41.0, 44.0, 29.0, 35.0, 18.0, 27.0, 17.0, 21.0, 13.0, 18.0, 9.0, 12.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.8802490234375, -138.69435119628906, -134.50845336914062, -130.3225555419922, -126.13665771484375, -121.95075988769531, -117.7648696899414, -113.57897186279297, -109.39307403564453, -105.2071762084961, -101.02127838134766, -96.83538055419922, -92.64949035644531, -88.46359252929688, -84.27769470214844, -80.091796875, -75.90589904785156, -71.72000122070312, -67.53410339355469, -63.348209381103516, -59.16231155395508, -54.97641372680664, -50.79051971435547, -46.60462188720703, -42.418724060058594, -38.232826232910156, -34.04692840576172, -29.861034393310547, -25.67513656616211, -21.489238739013672, -17.303342819213867, -13.117446899414062, -8.931533813476562, -4.745636940002441, -0.5597400665283203, 3.626156806945801, 7.812053680419922, 11.99795150756836, 16.183847427368164, 20.36974334716797, 24.555641174316406, 28.741539001464844, 32.92743682861328, 37.11333084106445, 41.29922866821289, 45.48512649536133, 49.6710205078125, 53.85691833496094, 58.042816162109375, 62.22871398925781, 66.41461181640625, 70.60050964355469, 74.78640747070312, 78.97230529785156, 83.15819549560547, 87.3440933227539, 91.52999114990234, 95.71588897705078, 99.90178680419922, 104.08768463134766, 108.27357482910156, 112.45947265625, 116.64537048339844, 120.83126831054688, 125.01716613769531]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 0.0, 6.0, 8.0, 5.0, 9.0, 8.0, 15.0, 15.0, 36.0, 54.0, 99.0, 120.0, 247.0, 437.0, 809.0, 1666.0, 3920.0, 11271.0, 46863.0, 1233827.0, 2818863.0, 55056.0, 12698.0, 4404.0, 1848.0, 871.0, 485.0, 242.0, 162.0, 84.0, 58.0, 30.0, 29.0, 15.0, 7.0, 7.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.707275390625, -29.80517578125, -28.903076171875, -28.0009765625, -27.098876953125, -26.19677734375, -25.294677734375, -24.392578125, -23.490478515625, -22.58837890625, -21.686279296875, -20.7841796875, -19.882080078125, -18.97998046875, -18.077880859375, -17.17578125, -16.273681640625, -15.37158203125, -14.469482421875, -13.5673828125, -12.665283203125, -11.76318359375, -10.861083984375, -9.958984375, -9.056884765625, -8.15478515625, -7.252685546875, -6.3505859375, -5.448486328125, -4.54638671875, -3.644287109375, -2.7421875, -1.840087890625, -0.93798828125, -0.035888671875, 0.8662109375, 1.768310546875, 2.67041015625, 3.572509765625, 4.474609375, 5.376708984375, 6.27880859375, 7.180908203125, 8.0830078125, 8.985107421875, 9.88720703125, 10.789306640625, 11.69140625, 12.593505859375, 13.49560546875, 14.397705078125, 15.2998046875, 16.201904296875, 17.10400390625, 18.006103515625, 18.908203125, 19.810302734375, 20.71240234375, 21.614501953125, 22.5166015625, 23.418701171875, 24.32080078125, 25.222900390625, 26.125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 3.0, 5.0, 8.0, 11.0, 14.0, 15.0, 15.0, 26.0, 21.0, 27.0, 34.0, 29.0, 41.0, 50.0, 66.0, 51.0, 64.0, 51.0, 45.0, 48.0, 58.0, 45.0, 42.0, 43.0, 33.0, 28.0, 32.0, 17.0, 20.0, 17.0, 11.0, 11.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.90283203125, -3.7548828125, -3.60693359375, -3.458984375, -3.31103515625, -3.1630859375, -3.01513671875, -2.8671875, -2.71923828125, -2.5712890625, -2.42333984375, -2.275390625, -2.12744140625, -1.9794921875, -1.83154296875, -1.68359375, -1.53564453125, -1.3876953125, -1.23974609375, -1.091796875, -0.94384765625, -0.7958984375, -0.64794921875, -0.5, -0.35205078125, -0.2041015625, -0.05615234375, 0.091796875, 0.23974609375, 0.3876953125, 0.53564453125, 0.68359375, 0.83154296875, 0.9794921875, 1.12744140625, 1.275390625, 1.42333984375, 1.5712890625, 1.71923828125, 1.8671875, 2.01513671875, 2.1630859375, 2.31103515625, 2.458984375, 2.60693359375, 2.7548828125, 2.90283203125, 3.05078125, 3.19873046875, 3.3466796875, 3.49462890625, 3.642578125, 3.79052734375, 3.9384765625, 4.08642578125, 4.234375, 4.38232421875, 4.5302734375, 4.67822265625, 4.826171875, 4.97412109375, 5.1220703125, 5.27001953125, 5.41796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 22.0, 24.0, 50.0, 80.0, 142.0, 303.0, 625.0, 1560.0, 4400.0, 16885.0, 132740.0, 3859938.0, 152037.0, 17973.0, 4636.0, 1615.0, 665.0, 273.0, 132.0, 77.0, 38.0, 22.0, 11.0, 8.0, 10.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.6875, -44.4365234375, -43.185546875, -41.9345703125, -40.68359375, -39.4326171875, -38.181640625, -36.9306640625, -35.6796875, -34.4287109375, -33.177734375, -31.9267578125, -30.67578125, -29.4248046875, -28.173828125, -26.9228515625, -25.671875, -24.4208984375, -23.169921875, -21.9189453125, -20.66796875, -19.4169921875, -18.166015625, -16.9150390625, -15.6640625, -14.4130859375, -13.162109375, -11.9111328125, -10.66015625, -9.4091796875, -8.158203125, -6.9072265625, -5.65625, -4.4052734375, -3.154296875, -1.9033203125, -0.65234375, 0.5986328125, 1.849609375, 3.1005859375, 4.3515625, 5.6025390625, 6.853515625, 8.1044921875, 9.35546875, 10.6064453125, 11.857421875, 13.1083984375, 14.359375, 15.6103515625, 16.861328125, 18.1123046875, 19.36328125, 20.6142578125, 21.865234375, 23.1162109375, 24.3671875, 25.6181640625, 26.869140625, 28.1201171875, 29.37109375, 30.6220703125, 31.873046875, 33.1240234375, 34.375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 6.0, 10.0, 15.0, 18.0, 24.0, 37.0, 75.0, 136.0, 327.0, 1267.0, 1464.0, 323.0, 144.0, 77.0, 43.0, 27.0, 19.0, 10.0, 12.0, 7.0, 4.0, 2.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.8984375, -15.4693603515625, -15.040283203125, -14.6112060546875, -14.18212890625, -13.7530517578125, -13.323974609375, -12.8948974609375, -12.4658203125, -12.0367431640625, -11.607666015625, -11.1785888671875, -10.74951171875, -10.3204345703125, -9.891357421875, -9.4622802734375, -9.033203125, -8.6041259765625, -8.175048828125, -7.7459716796875, -7.31689453125, -6.8878173828125, -6.458740234375, -6.0296630859375, -5.6005859375, -5.1715087890625, -4.742431640625, -4.3133544921875, -3.88427734375, -3.4552001953125, -3.026123046875, -2.5970458984375, -2.16796875, -1.7388916015625, -1.309814453125, -0.8807373046875, -0.45166015625, -0.0225830078125, 0.406494140625, 0.8355712890625, 1.2646484375, 1.6937255859375, 2.122802734375, 2.5518798828125, 2.98095703125, 3.4100341796875, 3.839111328125, 4.2681884765625, 4.697265625, 5.1263427734375, 5.555419921875, 5.9844970703125, 6.41357421875, 6.8426513671875, 7.271728515625, 7.7008056640625, 8.1298828125, 8.5589599609375, 8.988037109375, 9.4171142578125, 9.84619140625, 10.2752685546875, 10.704345703125, 11.1334228515625, 11.5625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 7.0, 19.0, 48.0, 145.0, 253.0, 236.0, 163.0, 76.0, 37.0, 12.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.12347412109375, -35.10445785522461, -30.085437774658203, -25.066421508789062, -20.04740333557129, -15.028385162353516, -10.009368896484375, -4.990348815917969, 0.028667449951171875, 5.047685146331787, 10.066702842712402, 15.08572006225586, 20.104738235473633, 25.123756408691406, 30.142772674560547, 35.16179275512695, 40.180809020996094, 45.199825286865234, 50.21884536743164, 55.23786163330078, 60.25688171386719, 65.27589416503906, 70.29491424560547, 75.31393432617188, 80.33294677734375, 85.35196685791016, 90.37097930908203, 95.38999938964844, 100.40901947021484, 105.42803955078125, 110.44705200195312, 115.46607208251953, 120.48509216308594, 125.50411224365234, 130.52313232421875, 135.54214477539062, 140.5611572265625, 145.58018493652344, 150.5991973876953, 155.61822509765625, 160.63723754882812, 165.65625, 170.67527770996094, 175.6942901611328, 180.7133026123047, 185.73233032226562, 190.7513427734375, 195.77035522460938, 200.78936767578125, 205.80838012695312, 210.82740783691406, 215.84642028808594, 220.8654327392578, 225.88446044921875, 230.90347290039062, 235.9224853515625, 240.94151306152344, 245.9605255126953, 250.97955322265625, 255.99856567382812, 261.017578125, 266.0365905761719, 271.05560302734375, 276.07464599609375, 281.0936584472656]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 14.0, 13.0, 17.0, 13.0, 17.0, 25.0, 29.0, 25.0, 36.0, 38.0, 38.0, 39.0, 49.0, 57.0, 70.0, 54.0, 52.0, 37.0, 46.0, 37.0, 39.0, 37.0, 40.0, 36.0, 32.0, 20.0, 12.0, 15.0, 6.0, 15.0, 9.0, 5.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.758644104003906, -43.33696746826172, -41.91529083251953, -40.493614196777344, -39.07193374633789, -37.6502571105957, -36.228580474853516, -34.80690383911133, -33.38522720336914, -31.963550567626953, -30.541872024536133, -29.120195388793945, -27.698518753051758, -26.276840209960938, -24.85516357421875, -23.433486938476562, -22.011808395385742, -20.590131759643555, -19.168453216552734, -17.746776580810547, -16.32509994506836, -14.903422355651855, -13.481744766235352, -12.060068130493164, -10.63839054107666, -9.216712951660156, -7.795036315917969, -6.373358726501465, -4.951681613922119, -3.5300045013427734, -2.1083269119262695, -0.686650276184082, 0.7350273132324219, 2.1567044258117676, 3.5783817768096924, 5.000059127807617, 6.421736240386963, 7.843413352966309, 9.265090942382812, 10.686767578125, 12.108445167541504, 13.530122756958008, 14.951799392700195, 16.373477935791016, 17.795154571533203, 19.21683120727539, 20.638507843017578, 22.060184478759766, 23.481863021850586, 24.903539657592773, 26.325218200683594, 27.74689483642578, 29.16857147216797, 30.590248107910156, 32.011924743652344, 33.43360137939453, 34.855281829833984, 36.27695846557617, 37.69863510131836, 39.12031555175781, 40.5419921875, 41.96366882324219, 43.385345458984375, 44.80702209472656, 46.22869873046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 14.0, 15.0, 43.0, 64.0, 111.0, 166.0, 312.0, 492.0, 859.0, 1579.0, 2927.0, 5874.0, 11935.0, 25822.0, 57106.0, 124942.0, 233918.0, 268005.0, 166730.0, 79505.0, 35538.0, 16343.0, 7741.0, 3825.0, 2025.0, 1138.0, 594.0, 378.0, 197.0, 119.0, 80.0, 50.0, 33.0, 21.0, 11.0, 14.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2008056640625, -9.839111328125, -9.4774169921875, -9.11572265625, -8.7540283203125, -8.392333984375, -8.0306396484375, -7.6689453125, -7.3072509765625, -6.945556640625, -6.5838623046875, -6.22216796875, -5.8604736328125, -5.498779296875, -5.1370849609375, -4.775390625, -4.4136962890625, -4.052001953125, -3.6903076171875, -3.32861328125, -2.9669189453125, -2.605224609375, -2.2435302734375, -1.8818359375, -1.5201416015625, -1.158447265625, -0.7967529296875, -0.43505859375, -0.0733642578125, 0.288330078125, 0.6500244140625, 1.01171875, 1.3734130859375, 1.735107421875, 2.0968017578125, 2.45849609375, 2.8201904296875, 3.181884765625, 3.5435791015625, 3.9052734375, 4.2669677734375, 4.628662109375, 4.9903564453125, 5.35205078125, 5.7137451171875, 6.075439453125, 6.4371337890625, 6.798828125, 7.1605224609375, 7.522216796875, 7.8839111328125, 8.24560546875, 8.6072998046875, 8.968994140625, 9.3306884765625, 9.6923828125, 10.0540771484375, 10.415771484375, 10.7774658203125, 11.13916015625, 11.5008544921875, 11.862548828125, 12.2242431640625, 12.5859375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 8.0, 7.0, 11.0, 13.0, 14.0, 22.0, 20.0, 26.0, 29.0, 27.0, 34.0, 32.0, 40.0, 49.0, 39.0, 62.0, 61.0, 45.0, 55.0, 49.0, 47.0, 36.0, 46.0, 38.0, 36.0, 20.0, 21.0, 24.0, 17.0, 13.0, 11.0, 8.0, 8.0, 10.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.70721435546875, -4.5628662109375, -4.41851806640625, -4.274169921875, -4.12982177734375, -3.9854736328125, -3.84112548828125, -3.69677734375, -3.55242919921875, -3.4080810546875, -3.26373291015625, -3.119384765625, -2.97503662109375, -2.8306884765625, -2.68634033203125, -2.5419921875, -2.39764404296875, -2.2532958984375, -2.10894775390625, -1.964599609375, -1.82025146484375, -1.6759033203125, -1.53155517578125, -1.38720703125, -1.24285888671875, -1.0985107421875, -0.95416259765625, -0.809814453125, -0.66546630859375, -0.5211181640625, -0.37677001953125, -0.232421875, -0.08807373046875, 0.0562744140625, 0.20062255859375, 0.344970703125, 0.48931884765625, 0.6336669921875, 0.77801513671875, 0.92236328125, 1.06671142578125, 1.2110595703125, 1.35540771484375, 1.499755859375, 1.64410400390625, 1.7884521484375, 1.93280029296875, 2.0771484375, 2.22149658203125, 2.3658447265625, 2.51019287109375, 2.654541015625, 2.79888916015625, 2.9432373046875, 3.08758544921875, 3.23193359375, 3.37628173828125, 3.5206298828125, 3.66497802734375, 3.809326171875, 3.95367431640625, 4.0980224609375, 4.24237060546875, 4.38671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 6.0, 8.0, 7.0, 5.0, 13.0, 24.0, 24.0, 32.0, 71.0, 103.0, 155.0, 277.0, 456.0, 1044.0, 3263.0, 18416.0, 187609.0, 696671.0, 122744.0, 13157.0, 2587.0, 860.0, 384.0, 216.0, 148.0, 90.0, 67.0, 41.0, 30.0, 14.0, 15.0, 10.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.140625, -29.079833984375, -28.01904296875, -26.958251953125, -25.8974609375, -24.836669921875, -23.77587890625, -22.715087890625, -21.654296875, -20.593505859375, -19.53271484375, -18.471923828125, -17.4111328125, -16.350341796875, -15.28955078125, -14.228759765625, -13.16796875, -12.107177734375, -11.04638671875, -9.985595703125, -8.9248046875, -7.864013671875, -6.80322265625, -5.742431640625, -4.681640625, -3.620849609375, -2.56005859375, -1.499267578125, -0.4384765625, 0.622314453125, 1.68310546875, 2.743896484375, 3.8046875, 4.865478515625, 5.92626953125, 6.987060546875, 8.0478515625, 9.108642578125, 10.16943359375, 11.230224609375, 12.291015625, 13.351806640625, 14.41259765625, 15.473388671875, 16.5341796875, 17.594970703125, 18.65576171875, 19.716552734375, 20.77734375, 21.838134765625, 22.89892578125, 23.959716796875, 25.0205078125, 26.081298828125, 27.14208984375, 28.202880859375, 29.263671875, 30.324462890625, 31.38525390625, 32.446044921875, 33.5068359375, 34.567626953125, 35.62841796875, 36.689208984375, 37.75]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 8.0, 11.0, 13.0, 15.0, 23.0, 17.0, 26.0, 30.0, 29.0, 36.0, 45.0, 49.0, 45.0, 44.0, 47.0, 33.0, 58.0, 54.0, 41.0, 33.0, 44.0, 44.0, 35.0, 30.0, 31.0, 24.0, 22.0, 14.0, 18.0, 13.0, 11.0, 13.0, 8.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.921875, -28.095703125, -27.26953125, -26.443359375, -25.6171875, -24.791015625, -23.96484375, -23.138671875, -22.3125, -21.486328125, -20.66015625, -19.833984375, -19.0078125, -18.181640625, -17.35546875, -16.529296875, -15.703125, -14.876953125, -14.05078125, -13.224609375, -12.3984375, -11.572265625, -10.74609375, -9.919921875, -9.09375, -8.267578125, -7.44140625, -6.615234375, -5.7890625, -4.962890625, -4.13671875, -3.310546875, -2.484375, -1.658203125, -0.83203125, -0.005859375, 0.8203125, 1.646484375, 2.47265625, 3.298828125, 4.125, 4.951171875, 5.77734375, 6.603515625, 7.4296875, 8.255859375, 9.08203125, 9.908203125, 10.734375, 11.560546875, 12.38671875, 13.212890625, 14.0390625, 14.865234375, 15.69140625, 16.517578125, 17.34375, 18.169921875, 18.99609375, 19.822265625, 20.6484375, 21.474609375, 22.30078125, 23.126953125, 23.953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 11.0, 24.0, 25.0, 47.0, 51.0, 79.0, 120.0, 171.0, 241.0, 462.0, 938.0, 1821.0, 3967.0, 10048.0, 32669.0, 151021.0, 530675.0, 242995.0, 49681.0, 13654.0, 5016.0, 2189.0, 1061.0, 606.0, 323.0, 245.0, 130.0, 77.0, 63.0, 42.0, 29.0, 20.0, 13.0, 11.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.65625, -10.25634765625, -9.8564453125, -9.45654296875, -9.056640625, -8.65673828125, -8.2568359375, -7.85693359375, -7.45703125, -7.05712890625, -6.6572265625, -6.25732421875, -5.857421875, -5.45751953125, -5.0576171875, -4.65771484375, -4.2578125, -3.85791015625, -3.4580078125, -3.05810546875, -2.658203125, -2.25830078125, -1.8583984375, -1.45849609375, -1.05859375, -0.65869140625, -0.2587890625, 0.14111328125, 0.541015625, 0.94091796875, 1.3408203125, 1.74072265625, 2.140625, 2.54052734375, 2.9404296875, 3.34033203125, 3.740234375, 4.14013671875, 4.5400390625, 4.93994140625, 5.33984375, 5.73974609375, 6.1396484375, 6.53955078125, 6.939453125, 7.33935546875, 7.7392578125, 8.13916015625, 8.5390625, 8.93896484375, 9.3388671875, 9.73876953125, 10.138671875, 10.53857421875, 10.9384765625, 11.33837890625, 11.73828125, 12.13818359375, 12.5380859375, 12.93798828125, 13.337890625, 13.73779296875, 14.1376953125, 14.53759765625, 14.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 11.0, 8.0, 12.0, 11.0, 18.0, 31.0, 44.0, 42.0, 61.0, 77.0, 83.0, 96.0, 98.0, 75.0, 71.0, 64.0, 49.0, 43.0, 26.0, 21.0, 6.0, 14.0, 13.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002208709716796875, -0.002134382724761963, -0.0020600557327270508, -0.0019857287406921387, -0.0019114017486572266, -0.0018370747566223145, -0.0017627477645874023, -0.0016884207725524902, -0.0016140937805175781, -0.001539766788482666, -0.001465439796447754, -0.0013911128044128418, -0.0013167858123779297, -0.0012424588203430176, -0.0011681318283081055, -0.0010938048362731934, -0.0010194778442382812, -0.0009451508522033691, -0.000870823860168457, -0.0007964968681335449, -0.0007221698760986328, -0.0006478428840637207, -0.0005735158920288086, -0.0004991888999938965, -0.0004248619079589844, -0.00035053491592407227, -0.00027620792388916016, -0.00020188093185424805, -0.00012755393981933594, -5.322694778442383e-05, 2.110004425048828e-05, 9.542703628540039e-05, 0.0001697540283203125, 0.0002440810203552246, 0.0003184080123901367, 0.00039273500442504883, 0.00046706199645996094, 0.000541388988494873, 0.0006157159805297852, 0.0006900429725646973, 0.0007643699645996094, 0.0008386969566345215, 0.0009130239486694336, 0.0009873509407043457, 0.0010616779327392578, 0.00113600492477417, 0.001210331916809082, 0.0012846589088439941, 0.0013589859008789062, 0.0014333128929138184, 0.0015076398849487305, 0.0015819668769836426, 0.0016562938690185547, 0.0017306208610534668, 0.001804947853088379, 0.001879274845123291, 0.001953601837158203, 0.0020279288291931152, 0.0021022558212280273, 0.0021765828132629395, 0.0022509098052978516, 0.0023252367973327637, 0.0023995637893676758, 0.002473890781402588, 0.0025482177734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 15.0, 20.0, 36.0, 43.0, 95.0, 161.0, 368.0, 1153.0, 5222.0, 48510.0, 783902.0, 193852.0, 11885.0, 2156.0, 578.0, 242.0, 123.0, 74.0, 55.0, 21.0, 14.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.609375, -27.613037109375, -26.61669921875, -25.620361328125, -24.6240234375, -23.627685546875, -22.63134765625, -21.635009765625, -20.638671875, -19.642333984375, -18.64599609375, -17.649658203125, -16.6533203125, -15.656982421875, -14.66064453125, -13.664306640625, -12.66796875, -11.671630859375, -10.67529296875, -9.678955078125, -8.6826171875, -7.686279296875, -6.68994140625, -5.693603515625, -4.697265625, -3.700927734375, -2.70458984375, -1.708251953125, -0.7119140625, 0.284423828125, 1.28076171875, 2.277099609375, 3.2734375, 4.269775390625, 5.26611328125, 6.262451171875, 7.2587890625, 8.255126953125, 9.25146484375, 10.247802734375, 11.244140625, 12.240478515625, 13.23681640625, 14.233154296875, 15.2294921875, 16.225830078125, 17.22216796875, 18.218505859375, 19.21484375, 20.211181640625, 21.20751953125, 22.203857421875, 23.2001953125, 24.196533203125, 25.19287109375, 26.189208984375, 27.185546875, 28.181884765625, 29.17822265625, 30.174560546875, 31.1708984375, 32.167236328125, 33.16357421875, 34.159912109375, 35.15625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 6.0, 6.0, 6.0, 18.0, 19.0, 14.0, 30.0, 31.0, 43.0, 53.0, 41.0, 81.0, 84.0, 75.0, 105.0, 81.0, 60.0, 51.0, 36.0, 32.0, 27.0, 17.0, 18.0, 16.0, 6.0, 1.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.4453125, -12.068115234375, -11.69091796875, -11.313720703125, -10.9365234375, -10.559326171875, -10.18212890625, -9.804931640625, -9.427734375, -9.050537109375, -8.67333984375, -8.296142578125, -7.9189453125, -7.541748046875, -7.16455078125, -6.787353515625, -6.41015625, -6.032958984375, -5.65576171875, -5.278564453125, -4.9013671875, -4.524169921875, -4.14697265625, -3.769775390625, -3.392578125, -3.015380859375, -2.63818359375, -2.260986328125, -1.8837890625, -1.506591796875, -1.12939453125, -0.752197265625, -0.375, 0.002197265625, 0.37939453125, 0.756591796875, 1.1337890625, 1.510986328125, 1.88818359375, 2.265380859375, 2.642578125, 3.019775390625, 3.39697265625, 3.774169921875, 4.1513671875, 4.528564453125, 4.90576171875, 5.282958984375, 5.66015625, 6.037353515625, 6.41455078125, 6.791748046875, 7.1689453125, 7.546142578125, 7.92333984375, 8.300537109375, 8.677734375, 9.054931640625, 9.43212890625, 9.809326171875, 10.1865234375, 10.563720703125, 10.94091796875, 11.318115234375, 11.6953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 20.0, 58.0, 140.0, 218.0, 228.0, 180.0, 75.0, 43.0, 15.0, 12.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.6690979003906, -304.8736572265625, -295.0782165527344, -285.28277587890625, -275.4873352050781, -265.69189453125, -255.89646911621094, -246.1010284423828, -236.3055877685547, -226.51014709472656, -216.71470642089844, -206.9192657470703, -197.12384033203125, -187.32839965820312, -177.532958984375, -167.73751831054688, -157.94207763671875, -148.14663696289062, -138.3511962890625, -128.55575561523438, -118.76032257080078, -108.96488189697266, -99.16944885253906, -89.37400817871094, -79.57856750488281, -69.78312683105469, -59.98768997192383, -50.19225311279297, -40.396812438964844, -30.60137176513672, -20.80593490600586, -11.010498046875, -1.215057373046875, 8.580381393432617, 18.37582015991211, 28.1712589263916, 37.966697692871094, 47.76213836669922, 57.55757522583008, 67.35301208496094, 77.14845275878906, 86.94389343261719, 96.73933410644531, 106.5347671508789, 116.33020782470703, 126.12564849853516, 135.92108154296875, 145.71652221679688, 155.511962890625, 165.30740356445312, 175.10284423828125, 184.89828491210938, 194.6937255859375, 204.48916625976562, 214.2845916748047, 224.0800323486328, 233.87547302246094, 243.67091369628906, 253.4663543701172, 263.26177978515625, 273.0572204589844, 282.8526611328125, 292.6481018066406, 302.44354248046875, 312.2389831542969]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 6.0, 9.0, 3.0, 10.0, 9.0, 13.0, 14.0, 15.0, 19.0, 13.0, 22.0, 29.0, 29.0, 28.0, 30.0, 26.0, 39.0, 37.0, 34.0, 41.0, 31.0, 47.0, 39.0, 34.0, 40.0, 29.0, 32.0, 32.0, 32.0, 42.0, 37.0, 16.0, 19.0, 23.0, 22.0, 16.0, 16.0, 7.0, 11.0, 8.0, 10.0, 6.0, 7.0, 2.0, 7.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-115.05525970458984, -111.67643737792969, -108.297607421875, -104.91878509521484, -101.53996276855469, -98.16114044189453, -94.78231811523438, -91.40348815917969, -88.02466583251953, -84.64584350585938, -81.26701354980469, -77.88819122314453, -74.50936889648438, -71.13054656982422, -67.75172424316406, -64.37289428710938, -60.99407196044922, -57.61524963378906, -54.23642349243164, -50.85759735107422, -47.47877502441406, -44.099952697753906, -40.721126556396484, -37.34230041503906, -33.963478088378906, -30.584653854370117, -27.205829620361328, -23.82700538635254, -20.44818115234375, -17.06935691833496, -13.690532684326172, -10.311708450317383, -6.932891845703125, -3.554067611694336, -0.17524337768554688, 3.203580856323242, 6.582405090332031, 9.96122932434082, 13.34005355834961, 16.7188777923584, 20.097702026367188, 23.476526260375977, 26.855350494384766, 30.234174728393555, 33.612998962402344, 36.9918212890625, 40.37064743041992, 43.749473571777344, 47.1282958984375, 50.507118225097656, 53.88594436645508, 57.2647705078125, 60.643592834472656, 64.02241516113281, 67.4012451171875, 70.78006744384766, 74.15888977050781, 77.53771209716797, 80.91653442382812, 84.29536437988281, 87.67418670654297, 91.05300903320312, 94.43183898925781, 97.81066131591797, 101.18948364257812]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 10.0, 15.0, 24.0, 44.0, 61.0, 133.0, 274.0, 695.0, 2459.0, 31858.0, 4146004.0, 10202.0, 1525.0, 497.0, 215.0, 108.0, 52.0, 36.0, 26.0, 19.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.625, -89.8466796875, -87.068359375, -84.2900390625, -81.51171875, -78.7333984375, -75.955078125, -73.1767578125, -70.3984375, -67.6201171875, -64.841796875, -62.0634765625, -59.28515625, -56.5068359375, -53.728515625, -50.9501953125, -48.171875, -45.3935546875, -42.615234375, -39.8369140625, -37.05859375, -34.2802734375, -31.501953125, -28.7236328125, -25.9453125, -23.1669921875, -20.388671875, -17.6103515625, -14.83203125, -12.0537109375, -9.275390625, -6.4970703125, -3.71875, -0.9404296875, 1.837890625, 4.6162109375, 7.39453125, 10.1728515625, 12.951171875, 15.7294921875, 18.5078125, 21.2861328125, 24.064453125, 26.8427734375, 29.62109375, 32.3994140625, 35.177734375, 37.9560546875, 40.734375, 43.5126953125, 46.291015625, 49.0693359375, 51.84765625, 54.6259765625, 57.404296875, 60.1826171875, 62.9609375, 65.7392578125, 68.517578125, 71.2958984375, 74.07421875, 76.8525390625, 79.630859375, 82.4091796875, 85.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 4.0, 5.0, 12.0, 10.0, 28.0, 23.0, 27.0, 20.0, 21.0, 27.0, 27.0, 52.0, 52.0, 42.0, 43.0, 55.0, 47.0, 59.0, 38.0, 37.0, 44.0, 38.0, 38.0, 32.0, 35.0, 31.0, 23.0, 32.0, 17.0, 16.0, 15.0, 7.0, 6.0, 5.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.93212890625, -4.7666015625, -4.60107421875, -4.435546875, -4.27001953125, -4.1044921875, -3.93896484375, -3.7734375, -3.60791015625, -3.4423828125, -3.27685546875, -3.111328125, -2.94580078125, -2.7802734375, -2.61474609375, -2.44921875, -2.28369140625, -2.1181640625, -1.95263671875, -1.787109375, -1.62158203125, -1.4560546875, -1.29052734375, -1.125, -0.95947265625, -0.7939453125, -0.62841796875, -0.462890625, -0.29736328125, -0.1318359375, 0.03369140625, 0.19921875, 0.36474609375, 0.5302734375, 0.69580078125, 0.861328125, 1.02685546875, 1.1923828125, 1.35791015625, 1.5234375, 1.68896484375, 1.8544921875, 2.02001953125, 2.185546875, 2.35107421875, 2.5166015625, 2.68212890625, 2.84765625, 3.01318359375, 3.1787109375, 3.34423828125, 3.509765625, 3.67529296875, 3.8408203125, 4.00634765625, 4.171875, 4.33740234375, 4.5029296875, 4.66845703125, 4.833984375, 4.99951171875, 5.1650390625, 5.33056640625, 5.49609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 6.0, 11.0, 16.0, 27.0, 25.0, 48.0, 37.0, 75.0, 81.0, 97.0, 149.0, 196.0, 236.0, 384.0, 484.0, 720.0, 1214.0, 2233.0, 4351.0, 10921.0, 42043.0, 3687348.0, 399094.0, 26787.0, 8546.0, 3647.0, 1959.0, 1141.0, 697.0, 456.0, 325.0, 225.0, 178.0, 110.0, 100.0, 76.0, 41.0, 47.0, 21.0, 24.0, 17.0, 14.0, 17.0, 12.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0], "bins": [-26.9375, -26.117919921875, -25.29833984375, -24.478759765625, -23.6591796875, -22.839599609375, -22.02001953125, -21.200439453125, -20.380859375, -19.561279296875, -18.74169921875, -17.922119140625, -17.1025390625, -16.282958984375, -15.46337890625, -14.643798828125, -13.82421875, -13.004638671875, -12.18505859375, -11.365478515625, -10.5458984375, -9.726318359375, -8.90673828125, -8.087158203125, -7.267578125, -6.447998046875, -5.62841796875, -4.808837890625, -3.9892578125, -3.169677734375, -2.35009765625, -1.530517578125, -0.7109375, 0.108642578125, 0.92822265625, 1.747802734375, 2.5673828125, 3.386962890625, 4.20654296875, 5.026123046875, 5.845703125, 6.665283203125, 7.48486328125, 8.304443359375, 9.1240234375, 9.943603515625, 10.76318359375, 11.582763671875, 12.40234375, 13.221923828125, 14.04150390625, 14.861083984375, 15.6806640625, 16.500244140625, 17.31982421875, 18.139404296875, 18.958984375, 19.778564453125, 20.59814453125, 21.417724609375, 22.2373046875, 23.056884765625, 23.87646484375, 24.696044921875, 25.515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 10.0, 9.0, 22.0, 43.0, 122.0, 1500.0, 2106.0, 130.0, 51.0, 15.0, 19.0, 8.0, 3.0, 3.0, 4.0, 9.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.94342041015625, -7.7227783203125, -7.50213623046875, -7.281494140625, -7.06085205078125, -6.8402099609375, -6.61956787109375, -6.39892578125, -6.17828369140625, -5.9576416015625, -5.73699951171875, -5.516357421875, -5.29571533203125, -5.0750732421875, -4.85443115234375, -4.6337890625, -4.41314697265625, -4.1925048828125, -3.97186279296875, -3.751220703125, -3.53057861328125, -3.3099365234375, -3.08929443359375, -2.86865234375, -2.64801025390625, -2.4273681640625, -2.20672607421875, -1.986083984375, -1.76544189453125, -1.5447998046875, -1.32415771484375, -1.103515625, -0.88287353515625, -0.6622314453125, -0.44158935546875, -0.220947265625, -0.00030517578125, 0.2203369140625, 0.44097900390625, 0.66162109375, 0.88226318359375, 1.1029052734375, 1.32354736328125, 1.544189453125, 1.76483154296875, 1.9854736328125, 2.20611572265625, 2.4267578125, 2.64739990234375, 2.8680419921875, 3.08868408203125, 3.309326171875, 3.52996826171875, 3.7506103515625, 3.97125244140625, 4.19189453125, 4.41253662109375, 4.6331787109375, 4.85382080078125, 5.074462890625, 5.29510498046875, 5.5157470703125, 5.73638916015625, 5.95703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 10.0, 19.0, 51.0, 106.0, 169.0, 201.0, 191.0, 118.0, 67.0, 37.0, 16.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.04270935058594, -50.791961669921875, -49.54121398925781, -48.290462493896484, -47.03971481323242, -45.78896713256836, -44.5382194519043, -43.28746795654297, -42.036720275878906, -40.785972595214844, -39.53522491455078, -38.28447341918945, -37.03372573852539, -35.78297805786133, -34.532230377197266, -33.28147888183594, -32.030731201171875, -30.779983520507812, -29.529233932495117, -28.278486251831055, -27.02773666381836, -25.776988983154297, -24.526241302490234, -23.27549171447754, -22.02474594116211, -20.773998260498047, -19.52324867248535, -18.27250099182129, -17.021751403808594, -15.771003723144531, -14.520255088806152, -13.269506454467773, -12.018754959106445, -10.768006324768066, -9.517257690429688, -8.266510009765625, -7.015760898590088, -5.765012264251709, -4.514264106750488, -3.2635154724121094, -2.0127668380737305, -0.7620183229446411, 0.48873019218444824, 1.739478588104248, 2.990227222442627, 4.240975856781006, 5.491724014282227, 6.7424726486206055, 7.993221282958984, 9.243969917297363, 10.494718551635742, 11.745466232299805, 12.9962158203125, 14.246963500976562, 15.497712135314941, 16.74846076965332, 17.999210357666016, 19.249958038330078, 20.500707626342773, 21.751455307006836, 23.00220489501953, 24.252952575683594, 25.503700256347656, 26.75444984436035, 28.005197525024414]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 3.0, 6.0, 12.0, 5.0, 15.0, 20.0, 16.0, 22.0, 17.0, 17.0, 26.0, 15.0, 31.0, 34.0, 38.0, 28.0, 34.0, 31.0, 38.0, 38.0, 46.0, 44.0, 47.0, 37.0, 35.0, 35.0, 26.0, 38.0, 27.0, 17.0, 25.0, 31.0, 34.0, 24.0, 8.0, 13.0, 16.0, 15.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.579087257385254, -10.251937866210938, -9.924788475036621, -9.597639083862305, -9.270489692687988, -8.943340301513672, -8.616190910339355, -8.289041519165039, -7.961892604827881, -7.6347432136535645, -7.307593822479248, -6.980444431304932, -6.653295516967773, -6.326146125793457, -5.998996734619141, -5.671847343444824, -5.344697952270508, -5.017548561096191, -4.690399169921875, -4.363249778747559, -4.036100387573242, -3.708951234817505, -3.3818020820617676, -3.054652690887451, -2.7275032997131348, -2.4003539085388184, -2.073204517364502, -1.7460553646087646, -1.4189059734344482, -1.0917565822601318, -0.764607310295105, -0.4374580383300781, -0.11030769348144531, 0.21684163808822632, 0.543990969657898, 0.8711403012275696, 1.1982896327972412, 1.5254390239715576, 1.8525882959365845, 2.1797375679016113, 2.5068869590759277, 2.834036350250244, 3.1611857414245605, 3.488334894180298, 3.8154842853546143, 4.142633438110352, 4.469782829284668, 4.796932220458984, 5.124081611633301, 5.451231002807617, 5.778380393981934, 6.10552978515625, 6.432679176330566, 6.759828567504883, 7.086977481842041, 7.414126873016357, 7.741276264190674, 8.068425178527832, 8.395574569702148, 8.722723960876465, 9.049873352050781, 9.377022743225098, 9.704172134399414, 10.03132152557373, 10.358470916748047]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 7.0, 11.0, 13.0, 16.0, 18.0, 36.0, 74.0, 92.0, 143.0, 222.0, 395.0, 655.0, 1242.0, 2133.0, 3922.0, 7653.0, 14354.0, 28558.0, 56546.0, 109120.0, 187260.0, 233706.0, 183607.0, 106152.0, 54677.0, 27822.0, 14109.0, 7201.0, 4015.0, 2063.0, 1155.0, 593.0, 394.0, 199.0, 124.0, 83.0, 56.0, 37.0, 27.0, 18.0, 18.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2607421875, -8.935546875, -8.6103515625, -8.28515625, -7.9599609375, -7.634765625, -7.3095703125, -6.984375, -6.6591796875, -6.333984375, -6.0087890625, -5.68359375, -5.3583984375, -5.033203125, -4.7080078125, -4.3828125, -4.0576171875, -3.732421875, -3.4072265625, -3.08203125, -2.7568359375, -2.431640625, -2.1064453125, -1.78125, -1.4560546875, -1.130859375, -0.8056640625, -0.48046875, -0.1552734375, 0.169921875, 0.4951171875, 0.8203125, 1.1455078125, 1.470703125, 1.7958984375, 2.12109375, 2.4462890625, 2.771484375, 3.0966796875, 3.421875, 3.7470703125, 4.072265625, 4.3974609375, 4.72265625, 5.0478515625, 5.373046875, 5.6982421875, 6.0234375, 6.3486328125, 6.673828125, 6.9990234375, 7.32421875, 7.6494140625, 7.974609375, 8.2998046875, 8.625, 8.9501953125, 9.275390625, 9.6005859375, 9.92578125, 10.2509765625, 10.576171875, 10.9013671875, 11.2265625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 7.0, 16.0, 16.0, 15.0, 21.0, 24.0, 23.0, 33.0, 29.0, 29.0, 45.0, 45.0, 44.0, 48.0, 52.0, 40.0, 53.0, 42.0, 44.0, 34.0, 46.0, 43.0, 35.0, 28.0, 29.0, 25.0, 29.0, 13.0, 15.0, 11.0, 11.0, 8.0, 6.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41796875, -5.2421875, -5.06640625, -4.890625, -4.71484375, -4.5390625, -4.36328125, -4.1875, -4.01171875, -3.8359375, -3.66015625, -3.484375, -3.30859375, -3.1328125, -2.95703125, -2.78125, -2.60546875, -2.4296875, -2.25390625, -2.078125, -1.90234375, -1.7265625, -1.55078125, -1.375, -1.19921875, -1.0234375, -0.84765625, -0.671875, -0.49609375, -0.3203125, -0.14453125, 0.03125, 0.20703125, 0.3828125, 0.55859375, 0.734375, 0.91015625, 1.0859375, 1.26171875, 1.4375, 1.61328125, 1.7890625, 1.96484375, 2.140625, 2.31640625, 2.4921875, 2.66796875, 2.84375, 3.01953125, 3.1953125, 3.37109375, 3.546875, 3.72265625, 3.8984375, 4.07421875, 4.25, 4.42578125, 4.6015625, 4.77734375, 4.953125, 5.12890625, 5.3046875, 5.48046875, 5.65625, 5.83203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 2.0, 10.0, 5.0, 4.0, 17.0, 15.0, 14.0, 20.0, 40.0, 59.0, 74.0, 99.0, 144.0, 194.0, 286.0, 413.0, 688.0, 1390.0, 3278.0, 10574.0, 43762.0, 221674.0, 548174.0, 168803.0, 34223.0, 8580.0, 2855.0, 1232.0, 619.0, 380.0, 235.0, 170.0, 116.0, 98.0, 68.0, 52.0, 33.0, 40.0, 19.0, 19.0, 12.0, 9.0, 12.0, 8.0, 4.0, 6.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-21.078125, -20.4072265625, -19.736328125, -19.0654296875, -18.39453125, -17.7236328125, -17.052734375, -16.3818359375, -15.7109375, -15.0400390625, -14.369140625, -13.6982421875, -13.02734375, -12.3564453125, -11.685546875, -11.0146484375, -10.34375, -9.6728515625, -9.001953125, -8.3310546875, -7.66015625, -6.9892578125, -6.318359375, -5.6474609375, -4.9765625, -4.3056640625, -3.634765625, -2.9638671875, -2.29296875, -1.6220703125, -0.951171875, -0.2802734375, 0.390625, 1.0615234375, 1.732421875, 2.4033203125, 3.07421875, 3.7451171875, 4.416015625, 5.0869140625, 5.7578125, 6.4287109375, 7.099609375, 7.7705078125, 8.44140625, 9.1123046875, 9.783203125, 10.4541015625, 11.125, 11.7958984375, 12.466796875, 13.1376953125, 13.80859375, 14.4794921875, 15.150390625, 15.8212890625, 16.4921875, 17.1630859375, 17.833984375, 18.5048828125, 19.17578125, 19.8466796875, 20.517578125, 21.1884765625, 21.859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 1.0, 4.0, 9.0, 8.0, 12.0, 12.0, 12.0, 19.0, 28.0, 21.0, 23.0, 31.0, 32.0, 21.0, 42.0, 35.0, 43.0, 45.0, 32.0, 42.0, 53.0, 42.0, 33.0, 42.0, 42.0, 47.0, 30.0, 34.0, 26.0, 25.0, 19.0, 21.0, 13.0, 20.0, 12.0, 13.0, 16.0, 10.0, 4.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.59375, -26.818603515625, -26.04345703125, -25.268310546875, -24.4931640625, -23.718017578125, -22.94287109375, -22.167724609375, -21.392578125, -20.617431640625, -19.84228515625, -19.067138671875, -18.2919921875, -17.516845703125, -16.74169921875, -15.966552734375, -15.19140625, -14.416259765625, -13.64111328125, -12.865966796875, -12.0908203125, -11.315673828125, -10.54052734375, -9.765380859375, -8.990234375, -8.215087890625, -7.43994140625, -6.664794921875, -5.8896484375, -5.114501953125, -4.33935546875, -3.564208984375, -2.7890625, -2.013916015625, -1.23876953125, -0.463623046875, 0.3115234375, 1.086669921875, 1.86181640625, 2.636962890625, 3.412109375, 4.187255859375, 4.96240234375, 5.737548828125, 6.5126953125, 7.287841796875, 8.06298828125, 8.838134765625, 9.61328125, 10.388427734375, 11.16357421875, 11.938720703125, 12.7138671875, 13.489013671875, 14.26416015625, 15.039306640625, 15.814453125, 16.589599609375, 17.36474609375, 18.139892578125, 18.9150390625, 19.690185546875, 20.46533203125, 21.240478515625, 22.015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 7.0, 8.0, 6.0, 11.0, 15.0, 18.0, 32.0, 45.0, 65.0, 91.0, 165.0, 253.0, 398.0, 680.0, 1301.0, 2474.0, 5652.0, 16066.0, 59726.0, 283070.0, 501843.0, 129656.0, 29915.0, 9364.0, 3662.0, 1798.0, 852.0, 504.0, 296.0, 202.0, 129.0, 92.0, 48.0, 34.0, 19.0, 17.0, 11.0, 12.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.1640625, -9.8673095703125, -9.570556640625, -9.2738037109375, -8.97705078125, -8.6802978515625, -8.383544921875, -8.0867919921875, -7.7900390625, -7.4932861328125, -7.196533203125, -6.8997802734375, -6.60302734375, -6.3062744140625, -6.009521484375, -5.7127685546875, -5.416015625, -5.1192626953125, -4.822509765625, -4.5257568359375, -4.22900390625, -3.9322509765625, -3.635498046875, -3.3387451171875, -3.0419921875, -2.7452392578125, -2.448486328125, -2.1517333984375, -1.85498046875, -1.5582275390625, -1.261474609375, -0.9647216796875, -0.66796875, -0.3712158203125, -0.074462890625, 0.2222900390625, 0.51904296875, 0.8157958984375, 1.112548828125, 1.4093017578125, 1.7060546875, 2.0028076171875, 2.299560546875, 2.5963134765625, 2.89306640625, 3.1898193359375, 3.486572265625, 3.7833251953125, 4.080078125, 4.3768310546875, 4.673583984375, 4.9703369140625, 5.26708984375, 5.5638427734375, 5.860595703125, 6.1573486328125, 6.4541015625, 6.7508544921875, 7.047607421875, 7.3443603515625, 7.64111328125, 7.9378662109375, 8.234619140625, 8.5313720703125, 8.828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 10.0, 28.0, 34.0, 68.0, 73.0, 98.0, 129.0, 135.0, 116.0, 100.0, 59.0, 53.0, 19.0, 16.0, 13.0, 8.0, 5.0, 7.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002246856689453125, -0.002157449722290039, -0.002068042755126953, -0.001978635787963867, -0.0018892288208007812, -0.0017998218536376953, -0.0017104148864746094, -0.0016210079193115234, -0.0015316009521484375, -0.0014421939849853516, -0.0013527870178222656, -0.0012633800506591797, -0.0011739730834960938, -0.0010845661163330078, -0.0009951591491699219, -0.0009057521820068359, -0.00081634521484375, -0.0007269382476806641, -0.0006375312805175781, -0.0005481243133544922, -0.00045871734619140625, -0.0003693103790283203, -0.0002799034118652344, -0.00019049644470214844, -0.0001010894775390625, -1.1682510375976562e-05, 7.772445678710938e-05, 0.0001671314239501953, 0.00025653839111328125, 0.0003459453582763672, 0.0004353523254394531, 0.0005247592926025391, 0.000614166259765625, 0.0007035732269287109, 0.0007929801940917969, 0.0008823871612548828, 0.0009717941284179688, 0.0010612010955810547, 0.0011506080627441406, 0.0012400150299072266, 0.0013294219970703125, 0.0014188289642333984, 0.0015082359313964844, 0.0015976428985595703, 0.0016870498657226562, 0.0017764568328857422, 0.0018658638000488281, 0.001955270767211914, 0.002044677734375, 0.002134084701538086, 0.002223491668701172, 0.002312898635864258, 0.0024023056030273438, 0.0024917125701904297, 0.0025811195373535156, 0.0026705265045166016, 0.0027599334716796875, 0.0028493404388427734, 0.0029387474060058594, 0.0030281543731689453, 0.0031175613403320312, 0.003206968307495117, 0.003296375274658203, 0.003385782241821289, 0.003475189208984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 4.0, 2.0, 7.0, 9.0, 11.0, 15.0, 29.0, 26.0, 56.0, 87.0, 128.0, 268.0, 556.0, 1381.0, 4383.0, 22641.0, 274300.0, 670402.0, 61790.0, 8431.0, 2269.0, 876.0, 390.0, 194.0, 113.0, 85.0, 39.0, 24.0, 9.0, 14.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.51708984375, -16.9560546875, -16.39501953125, -15.833984375, -15.27294921875, -14.7119140625, -14.15087890625, -13.58984375, -13.02880859375, -12.4677734375, -11.90673828125, -11.345703125, -10.78466796875, -10.2236328125, -9.66259765625, -9.1015625, -8.54052734375, -7.9794921875, -7.41845703125, -6.857421875, -6.29638671875, -5.7353515625, -5.17431640625, -4.61328125, -4.05224609375, -3.4912109375, -2.93017578125, -2.369140625, -1.80810546875, -1.2470703125, -0.68603515625, -0.125, 0.43603515625, 0.9970703125, 1.55810546875, 2.119140625, 2.68017578125, 3.2412109375, 3.80224609375, 4.36328125, 4.92431640625, 5.4853515625, 6.04638671875, 6.607421875, 7.16845703125, 7.7294921875, 8.29052734375, 8.8515625, 9.41259765625, 9.9736328125, 10.53466796875, 11.095703125, 11.65673828125, 12.2177734375, 12.77880859375, 13.33984375, 13.90087890625, 14.4619140625, 15.02294921875, 15.583984375, 16.14501953125, 16.7060546875, 17.26708984375, 17.828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 14.0, 15.0, 32.0, 24.0, 43.0, 61.0, 66.0, 66.0, 84.0, 95.0, 78.0, 73.0, 75.0, 53.0, 46.0, 33.0, 29.0, 21.0, 22.0, 19.0, 6.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.36279296875, -11.9833984375, -11.60400390625, -11.224609375, -10.84521484375, -10.4658203125, -10.08642578125, -9.70703125, -9.32763671875, -8.9482421875, -8.56884765625, -8.189453125, -7.81005859375, -7.4306640625, -7.05126953125, -6.671875, -6.29248046875, -5.9130859375, -5.53369140625, -5.154296875, -4.77490234375, -4.3955078125, -4.01611328125, -3.63671875, -3.25732421875, -2.8779296875, -2.49853515625, -2.119140625, -1.73974609375, -1.3603515625, -0.98095703125, -0.6015625, -0.22216796875, 0.1572265625, 0.53662109375, 0.916015625, 1.29541015625, 1.6748046875, 2.05419921875, 2.43359375, 2.81298828125, 3.1923828125, 3.57177734375, 3.951171875, 4.33056640625, 4.7099609375, 5.08935546875, 5.46875, 5.84814453125, 6.2275390625, 6.60693359375, 6.986328125, 7.36572265625, 7.7451171875, 8.12451171875, 8.50390625, 8.88330078125, 9.2626953125, 9.64208984375, 10.021484375, 10.40087890625, 10.7802734375, 11.15966796875, 11.5390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [7.0, 4.0, 10.0, 25.0, 50.0, 82.0, 148.0, 203.0, 180.0, 146.0, 82.0, 49.0, 10.0, 9.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.85733795166016, -56.6220703125, -48.386802673339844, -40.15153884887695, -31.916271209716797, -23.68100357055664, -15.44573974609375, -7.210472106933594, 1.0247955322265625, 9.260062217712402, 17.495328903198242, 25.730594635009766, 33.96586227416992, 42.20112991333008, 50.43639373779297, 58.671661376953125, 66.90692901611328, 75.14219665527344, 83.3774642944336, 91.61273193359375, 99.84799194335938, 108.08326721191406, 116.31852722167969, 124.55379486083984, 132.7890625, 141.02432250976562, 149.2595977783203, 157.49485778808594, 165.73013305664062, 173.96539306640625, 182.20065307617188, 190.43592834472656, 198.67120361328125, 206.90646362304688, 215.14173889160156, 223.3769989013672, 231.61227416992188, 239.8475341796875, 248.08279418945312, 256.31805419921875, 264.5533447265625, 272.7886047363281, 281.02386474609375, 289.2591552734375, 297.4944152832031, 305.72967529296875, 313.9649353027344, 322.2001953125, 330.43548583984375, 338.6707458496094, 346.906005859375, 355.14129638671875, 363.3765563964844, 371.61181640625, 379.8470764160156, 388.08233642578125, 396.3175964355469, 404.5528564453125, 412.7881164550781, 421.0234069824219, 429.2586669921875, 437.4939270019531, 445.72918701171875, 453.9644775390625, 462.1997375488281]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 4.0, 12.0, 12.0, 7.0, 16.0, 14.0, 29.0, 20.0, 30.0, 28.0, 29.0, 26.0, 49.0, 37.0, 40.0, 62.0, 62.0, 51.0, 53.0, 49.0, 51.0, 43.0, 31.0, 34.0, 28.0, 24.0, 29.0, 17.0, 21.0, 16.0, 18.0, 9.0, 12.0, 14.0, 1.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-119.9652099609375, -115.71774291992188, -111.47027587890625, -107.22280883789062, -102.975341796875, -98.72787475585938, -94.48041534423828, -90.23294830322266, -85.98548126220703, -81.7380142211914, -77.49054718017578, -73.24308013916016, -68.99562072753906, -64.74815368652344, -60.50068664550781, -56.25321960449219, -52.00575256347656, -47.75828552246094, -43.51081848144531, -39.26335525512695, -35.01588821411133, -30.768421173095703, -26.52095603942871, -22.27349090576172, -18.026023864746094, -13.778557777404785, -9.531091690063477, -5.283625602722168, -1.0361595153808594, 3.2113075256347656, 7.458772659301758, 11.70623779296875, 15.953704833984375, 20.201171875, 24.448637008666992, 28.696102142333984, 32.94356918334961, 37.191036224365234, 41.438499450683594, 45.68596649169922, 49.933433532714844, 54.18090057373047, 58.428367614746094, 62.67583084106445, 66.92329406738281, 71.17076110839844, 75.41822814941406, 79.66569519042969, 83.91316223144531, 88.16062927246094, 92.40809631347656, 96.65556335449219, 100.90303039550781, 105.15049743652344, 109.39795684814453, 113.64542388916016, 117.89289093017578, 122.1403579711914, 126.38782501220703, 130.63528442382812, 134.88275146484375, 139.13021850585938, 143.377685546875, 147.62515258789062, 151.87261962890625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 9.0, 8.0, 22.0, 26.0, 41.0, 77.0, 111.0, 193.0, 348.0, 745.0, 1875.0, 6522.0, 69007.0, 4080368.0, 28075.0, 4264.0, 1357.0, 544.0, 279.0, 153.0, 87.0, 59.0, 37.0, 20.0, 24.0, 12.0, 11.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-49.9375, -48.668701171875, -47.39990234375, -46.131103515625, -44.8623046875, -43.593505859375, -42.32470703125, -41.055908203125, -39.787109375, -38.518310546875, -37.24951171875, -35.980712890625, -34.7119140625, -33.443115234375, -32.17431640625, -30.905517578125, -29.63671875, -28.367919921875, -27.09912109375, -25.830322265625, -24.5615234375, -23.292724609375, -22.02392578125, -20.755126953125, -19.486328125, -18.217529296875, -16.94873046875, -15.679931640625, -14.4111328125, -13.142333984375, -11.87353515625, -10.604736328125, -9.3359375, -8.067138671875, -6.79833984375, -5.529541015625, -4.2607421875, -2.991943359375, -1.72314453125, -0.454345703125, 0.814453125, 2.083251953125, 3.35205078125, 4.620849609375, 5.8896484375, 7.158447265625, 8.42724609375, 9.696044921875, 10.96484375, 12.233642578125, 13.50244140625, 14.771240234375, 16.0400390625, 17.308837890625, 18.57763671875, 19.846435546875, 21.115234375, 22.384033203125, 23.65283203125, 24.921630859375, 26.1904296875, 27.459228515625, 28.72802734375, 29.996826171875, 31.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 13.0, 16.0, 15.0, 18.0, 14.0, 27.0, 21.0, 32.0, 32.0, 36.0, 37.0, 59.0, 47.0, 47.0, 36.0, 41.0, 56.0, 47.0, 55.0, 57.0, 41.0, 41.0, 30.0, 37.0, 36.0, 20.0, 20.0, 15.0, 13.0, 6.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3671875, -6.1876220703125, -6.008056640625, -5.8284912109375, -5.64892578125, -5.4693603515625, -5.289794921875, -5.1102294921875, -4.9306640625, -4.7510986328125, -4.571533203125, -4.3919677734375, -4.21240234375, -4.0328369140625, -3.853271484375, -3.6737060546875, -3.494140625, -3.3145751953125, -3.135009765625, -2.9554443359375, -2.77587890625, -2.5963134765625, -2.416748046875, -2.2371826171875, -2.0576171875, -1.8780517578125, -1.698486328125, -1.5189208984375, -1.33935546875, -1.1597900390625, -0.980224609375, -0.8006591796875, -0.62109375, -0.4415283203125, -0.261962890625, -0.0823974609375, 0.09716796875, 0.2767333984375, 0.456298828125, 0.6358642578125, 0.8154296875, 0.9949951171875, 1.174560546875, 1.3541259765625, 1.53369140625, 1.7132568359375, 1.892822265625, 2.0723876953125, 2.251953125, 2.4315185546875, 2.611083984375, 2.7906494140625, 2.97021484375, 3.1497802734375, 3.329345703125, 3.5089111328125, 3.6884765625, 3.8680419921875, 4.047607421875, 4.2271728515625, 4.40673828125, 4.5863037109375, 4.765869140625, 4.9454345703125, 5.125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 10.0, 11.0, 9.0, 12.0, 17.0, 26.0, 30.0, 33.0, 56.0, 86.0, 82.0, 126.0, 164.0, 241.0, 352.0, 491.0, 886.0, 1587.0, 3464.0, 10685.0, 62933.0, 3924109.0, 161728.0, 17404.0, 4775.0, 1957.0, 1040.0, 644.0, 339.0, 264.0, 175.0, 131.0, 102.0, 66.0, 61.0, 45.0, 41.0, 27.0, 18.0, 15.0, 10.0, 10.0, 6.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-29.515625, -28.6640625, -27.8125, -26.9609375, -26.109375, -25.2578125, -24.40625, -23.5546875, -22.703125, -21.8515625, -21.0, -20.1484375, -19.296875, -18.4453125, -17.59375, -16.7421875, -15.890625, -15.0390625, -14.1875, -13.3359375, -12.484375, -11.6328125, -10.78125, -9.9296875, -9.078125, -8.2265625, -7.375, -6.5234375, -5.671875, -4.8203125, -3.96875, -3.1171875, -2.265625, -1.4140625, -0.5625, 0.2890625, 1.140625, 1.9921875, 2.84375, 3.6953125, 4.546875, 5.3984375, 6.25, 7.1015625, 7.953125, 8.8046875, 9.65625, 10.5078125, 11.359375, 12.2109375, 13.0625, 13.9140625, 14.765625, 15.6171875, 16.46875, 17.3203125, 18.171875, 19.0234375, 19.875, 20.7265625, 21.578125, 22.4296875, 23.28125, 24.1328125, 24.984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 16.0, 32.0, 79.0, 258.0, 3087.0, 368.0, 107.0, 39.0, 28.0, 11.0, 10.0, 2.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.435546875, -5.18359375, -4.931640625, -4.6796875, -4.427734375, -4.17578125, -3.923828125, -3.671875, -3.419921875, -3.16796875, -2.916015625, -2.6640625, -2.412109375, -2.16015625, -1.908203125, -1.65625, -1.404296875, -1.15234375, -0.900390625, -0.6484375, -0.396484375, -0.14453125, 0.107421875, 0.359375, 0.611328125, 0.86328125, 1.115234375, 1.3671875, 1.619140625, 1.87109375, 2.123046875, 2.375, 2.626953125, 2.87890625, 3.130859375, 3.3828125, 3.634765625, 3.88671875, 4.138671875, 4.390625, 4.642578125, 4.89453125, 5.146484375, 5.3984375, 5.650390625, 5.90234375, 6.154296875, 6.40625, 6.658203125, 6.91015625, 7.162109375, 7.4140625, 7.666015625, 7.91796875, 8.169921875, 8.421875, 8.673828125, 8.92578125, 9.177734375, 9.4296875, 9.681640625, 9.93359375, 10.185546875, 10.4375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 23.0, 60.0, 178.0, 282.0, 257.0, 118.0, 49.0, 21.0, 6.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.32489776611328, -32.373016357421875, -30.421138763427734, -28.46925926208496, -26.517379760742188, -24.56549835205078, -22.61362075805664, -20.661739349365234, -18.709861755371094, -16.75798225402832, -14.806102752685547, -12.854223251342773, -10.90234375, -8.95046329498291, -6.998583793640137, -5.046704292297363, -3.0948238372802734, -1.1429442167282104, 0.8089354038238525, 2.760815143585205, 4.7126946449279785, 6.66457462310791, 8.616454124450684, 10.568333625793457, 12.52021312713623, 14.472092628479004, 16.423973083496094, 18.375852584838867, 20.32773208618164, 22.279611587524414, 24.231491088867188, 26.18337059020996, 28.135250091552734, 30.087129592895508, 32.03900909423828, 33.99089050292969, 35.94276809692383, 37.894649505615234, 39.846527099609375, 41.79840850830078, 43.75028610229492, 45.70216751098633, 47.65404510498047, 49.605926513671875, 51.557804107666016, 53.50968551635742, 55.46156311035156, 57.41344451904297, 59.365325927734375, 61.31720733642578, 63.26908493041992, 65.22096252441406, 67.17284393310547, 69.12472534179688, 71.07660675048828, 73.02848052978516, 74.98036193847656, 76.93224334716797, 78.88412475585938, 80.83599853515625, 82.78787994384766, 84.73976135253906, 86.69164276123047, 88.64351654052734, 90.59539794921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 12.0, 10.0, 14.0, 21.0, 24.0, 22.0, 24.0, 23.0, 32.0, 23.0, 38.0, 40.0, 40.0, 46.0, 55.0, 50.0, 36.0, 44.0, 36.0, 32.0, 41.0, 52.0, 31.0, 28.0, 32.0, 25.0, 29.0, 26.0, 16.0, 14.0, 10.0, 13.0, 11.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.948797225952148, -12.477943420410156, -12.00709056854248, -11.536236763000488, -11.065382957458496, -10.59453010559082, -10.123676300048828, -9.652822494506836, -9.181968688964844, -8.711114883422852, -8.240262031555176, -7.769408226013184, -7.298554420471191, -6.827701091766357, -6.356847763061523, -5.885993957519531, -5.4151411056518555, -4.9442877769470215, -4.473433971405029, -4.002580642700195, -3.5317270755767822, -3.060873508453369, -2.590020179748535, -2.119166612625122, -1.648313045501709, -1.177459478378296, -0.7066060304641724, -0.23575258255004883, 0.23510098457336426, 0.7059545516967773, 1.1768078804016113, 1.6476614475250244, 2.1185150146484375, 2.5893685817718506, 3.0602221488952637, 3.5310754776000977, 4.00192928314209, 4.472782611846924, 4.943635940551758, 5.41448974609375, 5.885343074798584, 6.356196403503418, 6.82705020904541, 7.297903537750244, 7.768756866455078, 8.23961067199707, 8.710464477539062, 9.181317329406738, 9.65217113494873, 10.123024940490723, 10.593877792358398, 11.06473159790039, 11.535585403442383, 12.006439208984375, 12.47729206085205, 12.948145866394043, 13.418998718261719, 13.889852523803711, 14.360705375671387, 14.831559181213379, 15.302412986755371, 15.773265838623047, 16.24411964416504, 16.71497344970703, 17.185827255249023]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 16.0, 12.0, 25.0, 31.0, 53.0, 81.0, 130.0, 192.0, 338.0, 605.0, 1036.0, 1869.0, 3532.0, 6872.0, 13764.0, 28289.0, 59235.0, 118521.0, 200710.0, 237319.0, 179865.0, 99815.0, 48818.0, 23209.0, 11400.0, 5865.0, 3082.0, 1534.0, 956.0, 507.0, 312.0, 207.0, 132.0, 65.0, 38.0, 31.0, 25.0, 20.0, 13.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.3671875, -8.0916748046875, -7.816162109375, -7.5406494140625, -7.26513671875, -6.9896240234375, -6.714111328125, -6.4385986328125, -6.1630859375, -5.8875732421875, -5.612060546875, -5.3365478515625, -5.06103515625, -4.7855224609375, -4.510009765625, -4.2344970703125, -3.958984375, -3.6834716796875, -3.407958984375, -3.1324462890625, -2.85693359375, -2.5814208984375, -2.305908203125, -2.0303955078125, -1.7548828125, -1.4793701171875, -1.203857421875, -0.9283447265625, -0.65283203125, -0.3773193359375, -0.101806640625, 0.1737060546875, 0.44921875, 0.7247314453125, 1.000244140625, 1.2757568359375, 1.55126953125, 1.8267822265625, 2.102294921875, 2.3778076171875, 2.6533203125, 2.9288330078125, 3.204345703125, 3.4798583984375, 3.75537109375, 4.0308837890625, 4.306396484375, 4.5819091796875, 4.857421875, 5.1329345703125, 5.408447265625, 5.6839599609375, 5.95947265625, 6.2349853515625, 6.510498046875, 6.7860107421875, 7.0615234375, 7.3370361328125, 7.612548828125, 7.8880615234375, 8.16357421875, 8.4390869140625, 8.714599609375, 8.9901123046875, 9.265625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 8.0, 5.0, 6.0, 14.0, 13.0, 21.0, 25.0, 22.0, 30.0, 36.0, 43.0, 40.0, 51.0, 44.0, 57.0, 55.0, 59.0, 53.0, 50.0, 43.0, 49.0, 51.0, 35.0, 38.0, 29.0, 16.0, 24.0, 20.0, 9.0, 10.0, 8.0, 10.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.78125, -6.584228515625, -6.38720703125, -6.190185546875, -5.9931640625, -5.796142578125, -5.59912109375, -5.402099609375, -5.205078125, -5.008056640625, -4.81103515625, -4.614013671875, -4.4169921875, -4.219970703125, -4.02294921875, -3.825927734375, -3.62890625, -3.431884765625, -3.23486328125, -3.037841796875, -2.8408203125, -2.643798828125, -2.44677734375, -2.249755859375, -2.052734375, -1.855712890625, -1.65869140625, -1.461669921875, -1.2646484375, -1.067626953125, -0.87060546875, -0.673583984375, -0.4765625, -0.279541015625, -0.08251953125, 0.114501953125, 0.3115234375, 0.508544921875, 0.70556640625, 0.902587890625, 1.099609375, 1.296630859375, 1.49365234375, 1.690673828125, 1.8876953125, 2.084716796875, 2.28173828125, 2.478759765625, 2.67578125, 2.872802734375, 3.06982421875, 3.266845703125, 3.4638671875, 3.660888671875, 3.85791015625, 4.054931640625, 4.251953125, 4.448974609375, 4.64599609375, 4.843017578125, 5.0400390625, 5.237060546875, 5.43408203125, 5.631103515625, 5.828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 13.0, 11.0, 12.0, 13.0, 13.0, 18.0, 35.0, 41.0, 57.0, 68.0, 81.0, 116.0, 169.0, 238.0, 307.0, 485.0, 671.0, 1245.0, 2602.0, 6763.0, 24494.0, 115928.0, 473553.0, 328080.0, 68125.0, 15451.0, 4707.0, 2045.0, 1057.0, 642.0, 408.0, 313.0, 198.0, 157.0, 113.0, 79.0, 59.0, 45.0, 33.0, 24.0, 15.0, 19.0, 12.0, 10.0, 7.0, 4.0, 5.0, 2.0, 9.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-17.171875, -16.64892578125, -16.1259765625, -15.60302734375, -15.080078125, -14.55712890625, -14.0341796875, -13.51123046875, -12.98828125, -12.46533203125, -11.9423828125, -11.41943359375, -10.896484375, -10.37353515625, -9.8505859375, -9.32763671875, -8.8046875, -8.28173828125, -7.7587890625, -7.23583984375, -6.712890625, -6.18994140625, -5.6669921875, -5.14404296875, -4.62109375, -4.09814453125, -3.5751953125, -3.05224609375, -2.529296875, -2.00634765625, -1.4833984375, -0.96044921875, -0.4375, 0.08544921875, 0.6083984375, 1.13134765625, 1.654296875, 2.17724609375, 2.7001953125, 3.22314453125, 3.74609375, 4.26904296875, 4.7919921875, 5.31494140625, 5.837890625, 6.36083984375, 6.8837890625, 7.40673828125, 7.9296875, 8.45263671875, 8.9755859375, 9.49853515625, 10.021484375, 10.54443359375, 11.0673828125, 11.59033203125, 12.11328125, 12.63623046875, 13.1591796875, 13.68212890625, 14.205078125, 14.72802734375, 15.2509765625, 15.77392578125, 16.296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 13.0, 15.0, 18.0, 17.0, 15.0, 30.0, 28.0, 38.0, 31.0, 38.0, 36.0, 53.0, 48.0, 49.0, 62.0, 41.0, 50.0, 44.0, 43.0, 43.0, 41.0, 37.0, 41.0, 35.0, 28.0, 21.0, 11.0, 13.0, 11.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.265625, -25.43359375, -24.6015625, -23.76953125, -22.9375, -22.10546875, -21.2734375, -20.44140625, -19.609375, -18.77734375, -17.9453125, -17.11328125, -16.28125, -15.44921875, -14.6171875, -13.78515625, -12.953125, -12.12109375, -11.2890625, -10.45703125, -9.625, -8.79296875, -7.9609375, -7.12890625, -6.296875, -5.46484375, -4.6328125, -3.80078125, -2.96875, -2.13671875, -1.3046875, -0.47265625, 0.359375, 1.19140625, 2.0234375, 2.85546875, 3.6875, 4.51953125, 5.3515625, 6.18359375, 7.015625, 7.84765625, 8.6796875, 9.51171875, 10.34375, 11.17578125, 12.0078125, 12.83984375, 13.671875, 14.50390625, 15.3359375, 16.16796875, 17.0, 17.83203125, 18.6640625, 19.49609375, 20.328125, 21.16015625, 21.9921875, 22.82421875, 23.65625, 24.48828125, 25.3203125, 26.15234375, 26.984375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 1.0, 12.0, 11.0, 17.0, 11.0, 25.0, 30.0, 33.0, 42.0, 76.0, 157.0, 248.0, 482.0, 1088.0, 2846.0, 9708.0, 50884.0, 451359.0, 464040.0, 52417.0, 9844.0, 2923.0, 1134.0, 491.0, 211.0, 143.0, 104.0, 57.0, 44.0, 28.0, 19.0, 15.0, 8.0, 8.0, 12.0, 2.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.9979248046875, -10.605224609375, -10.2125244140625, -9.81982421875, -9.4271240234375, -9.034423828125, -8.6417236328125, -8.2490234375, -7.8563232421875, -7.463623046875, -7.0709228515625, -6.67822265625, -6.2855224609375, -5.892822265625, -5.5001220703125, -5.107421875, -4.7147216796875, -4.322021484375, -3.9293212890625, -3.53662109375, -3.1439208984375, -2.751220703125, -2.3585205078125, -1.9658203125, -1.5731201171875, -1.180419921875, -0.7877197265625, -0.39501953125, -0.0023193359375, 0.390380859375, 0.7830810546875, 1.17578125, 1.5684814453125, 1.961181640625, 2.3538818359375, 2.74658203125, 3.1392822265625, 3.531982421875, 3.9246826171875, 4.3173828125, 4.7100830078125, 5.102783203125, 5.4954833984375, 5.88818359375, 6.2808837890625, 6.673583984375, 7.0662841796875, 7.458984375, 7.8516845703125, 8.244384765625, 8.6370849609375, 9.02978515625, 9.4224853515625, 9.815185546875, 10.2078857421875, 10.6005859375, 10.9932861328125, 11.385986328125, 11.7786865234375, 12.17138671875, 12.5640869140625, 12.956787109375, 13.3494873046875, 13.7421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 8.0, 7.0, 9.0, 8.0, 3.0, 14.0, 20.0, 30.0, 40.0, 32.0, 61.0, 67.0, 64.0, 75.0, 96.0, 93.0, 89.0, 79.0, 44.0, 30.0, 27.0, 22.0, 22.0, 15.0, 9.0, 16.0, 6.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018682479858398438, -0.0018123835325241089, -0.001756519079208374, -0.0017006546258926392, -0.0016447901725769043, -0.0015889257192611694, -0.0015330612659454346, -0.0014771968126296997, -0.0014213323593139648, -0.00136546790599823, -0.0013096034526824951, -0.0012537389993667603, -0.0011978745460510254, -0.0011420100927352905, -0.0010861456394195557, -0.0010302811861038208, -0.0009744167327880859, -0.0009185522794723511, -0.0008626878261566162, -0.0008068233728408813, -0.0007509589195251465, -0.0006950944662094116, -0.0006392300128936768, -0.0005833655595779419, -0.000527501106262207, -0.00047163665294647217, -0.0004157721996307373, -0.00035990774631500244, -0.0003040432929992676, -0.0002481788396835327, -0.00019231438636779785, -0.000136449933052063, -8.058547973632812e-05, -2.4721026420593262e-05, 3.11434268951416e-05, 8.700788021087646e-05, 0.00014287233352661133, 0.0001987367868423462, 0.00025460124015808105, 0.0003104656934738159, 0.0003663301467895508, 0.00042219460010528564, 0.0004780590534210205, 0.0005339235067367554, 0.0005897879600524902, 0.0006456524133682251, 0.00070151686668396, 0.0007573813199996948, 0.0008132457733154297, 0.0008691102266311646, 0.0009249746799468994, 0.0009808391332626343, 0.0010367035865783691, 0.001092568039894104, 0.0011484324932098389, 0.0012042969465255737, 0.0012601613998413086, 0.0013160258531570435, 0.0013718903064727783, 0.0014277547597885132, 0.001483619213104248, 0.001539483666419983, 0.0015953481197357178, 0.0016512125730514526, 0.0017070770263671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 9.0, 14.0, 52.0, 85.0, 174.0, 448.0, 1431.0, 6982.0, 124925.0, 862803.0, 45853.0, 4080.0, 1051.0, 346.0, 152.0, 67.0, 32.0, 16.0, 12.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.453125, -24.690185546875, -23.92724609375, -23.164306640625, -22.4013671875, -21.638427734375, -20.87548828125, -20.112548828125, -19.349609375, -18.586669921875, -17.82373046875, -17.060791015625, -16.2978515625, -15.534912109375, -14.77197265625, -14.009033203125, -13.24609375, -12.483154296875, -11.72021484375, -10.957275390625, -10.1943359375, -9.431396484375, -8.66845703125, -7.905517578125, -7.142578125, -6.379638671875, -5.61669921875, -4.853759765625, -4.0908203125, -3.327880859375, -2.56494140625, -1.802001953125, -1.0390625, -0.276123046875, 0.48681640625, 1.249755859375, 2.0126953125, 2.775634765625, 3.53857421875, 4.301513671875, 5.064453125, 5.827392578125, 6.59033203125, 7.353271484375, 8.1162109375, 8.879150390625, 9.64208984375, 10.405029296875, 11.16796875, 11.930908203125, 12.69384765625, 13.456787109375, 14.2197265625, 14.982666015625, 15.74560546875, 16.508544921875, 17.271484375, 18.034423828125, 18.79736328125, 19.560302734375, 20.3232421875, 21.086181640625, 21.84912109375, 22.612060546875, 23.375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 9.0, 17.0, 29.0, 29.0, 38.0, 50.0, 58.0, 63.0, 67.0, 77.0, 71.0, 83.0, 64.0, 66.0, 67.0, 40.0, 38.0, 34.0, 23.0, 20.0, 14.0, 9.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.313720703125, -9.97900390625, -9.644287109375, -9.3095703125, -8.974853515625, -8.64013671875, -8.305419921875, -7.970703125, -7.635986328125, -7.30126953125, -6.966552734375, -6.6318359375, -6.297119140625, -5.96240234375, -5.627685546875, -5.29296875, -4.958251953125, -4.62353515625, -4.288818359375, -3.9541015625, -3.619384765625, -3.28466796875, -2.949951171875, -2.615234375, -2.280517578125, -1.94580078125, -1.611083984375, -1.2763671875, -0.941650390625, -0.60693359375, -0.272216796875, 0.0625, 0.397216796875, 0.73193359375, 1.066650390625, 1.4013671875, 1.736083984375, 2.07080078125, 2.405517578125, 2.740234375, 3.074951171875, 3.40966796875, 3.744384765625, 4.0791015625, 4.413818359375, 4.74853515625, 5.083251953125, 5.41796875, 5.752685546875, 6.08740234375, 6.422119140625, 6.7568359375, 7.091552734375, 7.42626953125, 7.760986328125, 8.095703125, 8.430419921875, 8.76513671875, 9.099853515625, 9.4345703125, 9.769287109375, 10.10400390625, 10.438720703125, 10.7734375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 17.0, 59.0, 217.0, 412.0, 203.0, 67.0, 14.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.0657958984375, -149.918701171875, -135.77159118652344, -121.62449645996094, -107.47738647460938, -93.33029174804688, -79.18318939208984, -65.03608703613281, -50.88898468017578, -36.74188232421875, -22.59478187561035, -8.447681427001953, 5.699420928955078, 19.846519470214844, 33.993621826171875, 48.140724182128906, 62.28782653808594, 76.43492889404297, 90.58203125, 104.7291259765625, 118.87623596191406, 133.02333068847656, 147.17044067382812, 161.31753540039062, 175.46463012695312, 189.61172485351562, 203.7588348388672, 217.9059295654297, 232.05303955078125, 246.20013427734375, 260.34722900390625, 274.49432373046875, 288.6414489746094, 302.7885437011719, 316.9356384277344, 331.082763671875, 345.2298583984375, 359.376953125, 373.5240478515625, 387.671142578125, 401.8182678222656, 415.9653625488281, 430.1124572753906, 444.25958251953125, 458.40667724609375, 472.55377197265625, 486.70086669921875, 500.84796142578125, 514.9950561523438, 529.1421508789062, 543.2892456054688, 557.4363403320312, 571.5834350585938, 585.7305908203125, 599.877685546875, 614.0247802734375, 628.171875, 642.3189697265625, 656.466064453125, 670.6131591796875, 684.76025390625, 698.9073486328125, 713.0545043945312, 727.2015991210938, 741.3486938476562]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 5.0, 7.0, 12.0, 14.0, 13.0, 28.0, 18.0, 25.0, 30.0, 32.0, 43.0, 35.0, 34.0, 55.0, 51.0, 49.0, 62.0, 52.0, 54.0, 48.0, 39.0, 44.0, 38.0, 30.0, 26.0, 33.0, 23.0, 19.0, 12.0, 9.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.40972137451172, -119.37999725341797, -115.35027313232422, -111.320556640625, -107.29083251953125, -103.2611083984375, -99.23138427734375, -95.20166015625, -91.17193603515625, -87.1422119140625, -83.11248779296875, -79.082763671875, -75.05304718017578, -71.02332305908203, -66.99359893798828, -62.96387481689453, -58.93415832519531, -54.90443420410156, -50.87471389770508, -46.84498977661133, -42.815269470214844, -38.785545349121094, -34.755821228027344, -30.726099014282227, -26.69637680053711, -22.666654586791992, -18.636932373046875, -14.607208251953125, -10.577486038208008, -6.547763824462891, -2.5180397033691406, 1.5116825103759766, 5.541412353515625, 9.571134567260742, 13.600857734680176, 17.63058090209961, 21.660303115844727, 25.690025329589844, 29.719749450683594, 33.749473571777344, 37.77919387817383, 41.80891799926758, 45.83863830566406, 49.86836242675781, 53.89808654785156, 57.92780685424805, 61.9575309753418, 65.98725128173828, 70.01697540283203, 74.04669952392578, 78.07642364501953, 82.10614013671875, 86.1358642578125, 90.16558837890625, 94.1953125, 98.22503662109375, 102.2547607421875, 106.28448486328125, 110.314208984375, 114.34393310546875, 118.37364959716797, 122.40337371826172, 126.43309783935547, 130.4628143310547, 134.49253845214844]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 3.0, 6.0, 9.0, 7.0, 31.0, 51.0, 79.0, 138.0, 290.0, 955.0, 7995.0, 4165280.0, 17421.0, 1271.0, 370.0, 182.0, 65.0, 47.0, 27.0, 18.0, 15.0, 10.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.8125, -79.4482421875, -77.083984375, -74.7197265625, -72.35546875, -69.9912109375, -67.626953125, -65.2626953125, -62.8984375, -60.5341796875, -58.169921875, -55.8056640625, -53.44140625, -51.0771484375, -48.712890625, -46.3486328125, -43.984375, -41.6201171875, -39.255859375, -36.8916015625, -34.52734375, -32.1630859375, -29.798828125, -27.4345703125, -25.0703125, -22.7060546875, -20.341796875, -17.9775390625, -15.61328125, -13.2490234375, -10.884765625, -8.5205078125, -6.15625, -3.7919921875, -1.427734375, 0.9365234375, 3.30078125, 5.6650390625, 8.029296875, 10.3935546875, 12.7578125, 15.1220703125, 17.486328125, 19.8505859375, 22.21484375, 24.5791015625, 26.943359375, 29.3076171875, 31.671875, 34.0361328125, 36.400390625, 38.7646484375, 41.12890625, 43.4931640625, 45.857421875, 48.2216796875, 50.5859375, 52.9501953125, 55.314453125, 57.6787109375, 60.04296875, 62.4072265625, 64.771484375, 67.1357421875, 69.5]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 12.0, 10.0, 13.0, 17.0, 14.0, 27.0, 29.0, 40.0, 44.0, 65.0, 57.0, 52.0, 69.0, 64.0, 69.0, 55.0, 49.0, 54.0, 47.0, 37.0, 35.0, 30.0, 16.0, 23.0, 14.0, 13.0, 5.0, 6.0, 7.0, 3.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.890625, -8.66607666015625, -8.4415283203125, -8.21697998046875, -7.992431640625, -7.76788330078125, -7.5433349609375, -7.31878662109375, -7.09423828125, -6.86968994140625, -6.6451416015625, -6.42059326171875, -6.196044921875, -5.97149658203125, -5.7469482421875, -5.52239990234375, -5.2978515625, -5.07330322265625, -4.8487548828125, -4.62420654296875, -4.399658203125, -4.17510986328125, -3.9505615234375, -3.72601318359375, -3.50146484375, -3.27691650390625, -3.0523681640625, -2.82781982421875, -2.603271484375, -2.37872314453125, -2.1541748046875, -1.92962646484375, -1.705078125, -1.48052978515625, -1.2559814453125, -1.03143310546875, -0.806884765625, -0.58233642578125, -0.3577880859375, -0.13323974609375, 0.09130859375, 0.31585693359375, 0.5404052734375, 0.76495361328125, 0.989501953125, 1.21405029296875, 1.4385986328125, 1.66314697265625, 1.8876953125, 2.11224365234375, 2.3367919921875, 2.56134033203125, 2.785888671875, 3.01043701171875, 3.2349853515625, 3.45953369140625, 3.68408203125, 3.90863037109375, 4.1331787109375, 4.35772705078125, 4.582275390625, 4.80682373046875, 5.0313720703125, 5.25592041015625, 5.48046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 17.0, 11.0, 12.0, 23.0, 26.0, 35.0, 57.0, 70.0, 100.0, 147.0, 210.0, 308.0, 513.0, 807.0, 1303.0, 2182.0, 3682.0, 7881.0, 21216.0, 107319.0, 3873390.0, 132598.0, 23664.0, 8589.0, 3988.0, 2275.0, 1373.0, 881.0, 517.0, 341.0, 213.0, 153.0, 87.0, 84.0, 50.0, 38.0, 24.0, 19.0, 16.0, 20.0, 10.0, 4.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0], "bins": [-15.125, -14.699462890625, -14.27392578125, -13.848388671875, -13.4228515625, -12.997314453125, -12.57177734375, -12.146240234375, -11.720703125, -11.295166015625, -10.86962890625, -10.444091796875, -10.0185546875, -9.593017578125, -9.16748046875, -8.741943359375, -8.31640625, -7.890869140625, -7.46533203125, -7.039794921875, -6.6142578125, -6.188720703125, -5.76318359375, -5.337646484375, -4.912109375, -4.486572265625, -4.06103515625, -3.635498046875, -3.2099609375, -2.784423828125, -2.35888671875, -1.933349609375, -1.5078125, -1.082275390625, -0.65673828125, -0.231201171875, 0.1943359375, 0.619873046875, 1.04541015625, 1.470947265625, 1.896484375, 2.322021484375, 2.74755859375, 3.173095703125, 3.5986328125, 4.024169921875, 4.44970703125, 4.875244140625, 5.30078125, 5.726318359375, 6.15185546875, 6.577392578125, 7.0029296875, 7.428466796875, 7.85400390625, 8.279541015625, 8.705078125, 9.130615234375, 9.55615234375, 9.981689453125, 10.4072265625, 10.832763671875, 11.25830078125, 11.683837890625, 12.109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 6.0, 6.0, 8.0, 12.0, 20.0, 50.0, 95.0, 296.0, 3092.0, 260.0, 91.0, 41.0, 26.0, 15.0, 12.0, 7.0, 5.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.929656982421875, -3.80853271484375, -3.687408447265625, -3.5662841796875, -3.445159912109375, -3.32403564453125, -3.202911376953125, -3.081787109375, -2.960662841796875, -2.83953857421875, -2.718414306640625, -2.5972900390625, -2.476165771484375, -2.35504150390625, -2.233917236328125, -2.11279296875, -1.991668701171875, -1.87054443359375, -1.749420166015625, -1.6282958984375, -1.507171630859375, -1.38604736328125, -1.264923095703125, -1.143798828125, -1.022674560546875, -0.90155029296875, -0.780426025390625, -0.6593017578125, -0.538177490234375, -0.41705322265625, -0.295928955078125, -0.1748046875, -0.053680419921875, 0.06744384765625, 0.188568115234375, 0.3096923828125, 0.430816650390625, 0.55194091796875, 0.673065185546875, 0.794189453125, 0.915313720703125, 1.03643798828125, 1.157562255859375, 1.2786865234375, 1.399810791015625, 1.52093505859375, 1.642059326171875, 1.76318359375, 1.884307861328125, 2.00543212890625, 2.126556396484375, 2.2476806640625, 2.368804931640625, 2.48992919921875, 2.611053466796875, 2.732177734375, 2.853302001953125, 2.97442626953125, 3.095550537109375, 3.2166748046875, 3.337799072265625, 3.45892333984375, 3.580047607421875, 3.701171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 34.0, 51.0, 153.0, 217.0, 247.0, 143.0, 77.0, 41.0, 15.0, 11.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.020355224609375, -41.02103805541992, -40.021724700927734, -39.02240753173828, -38.023094177246094, -37.02377700805664, -36.02445983886719, -35.025146484375, -34.02582931518555, -33.026512145996094, -32.027198791503906, -31.027881622314453, -30.028566360473633, -29.029251098632812, -28.029935836791992, -27.030620574951172, -26.031307220458984, -25.031991958618164, -24.032676696777344, -23.03335952758789, -22.03404426574707, -21.03472900390625, -20.03541374206543, -19.03609848022461, -18.036781311035156, -17.037466049194336, -16.038150787353516, -15.038834571838379, -14.039519309997559, -13.040203094482422, -12.040887832641602, -11.041572570800781, -10.042257308959961, -9.04294204711914, -8.043625831604004, -7.044310569763184, -6.044995307922363, -5.045679569244385, -4.046363830566406, -3.047048568725586, -2.0477328300476074, -1.048417329788208, -0.04910171031951904, 0.9502139091491699, 1.9495294094085693, 2.9488449096679688, 3.9481606483459473, 4.947475910186768, 5.946791648864746, 6.946107387542725, 7.945422649383545, 8.944738388061523, 9.944053649902344, 10.943368911743164, 11.9426851272583, 12.942000389099121, 13.941316604614258, 14.940631866455078, 15.939948081970215, 16.93926239013672, 17.938579559326172, 18.937894821166992, 19.937210083007812, 20.936525344848633, 21.935840606689453]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 5.0, 5.0, 7.0, 13.0, 12.0, 12.0, 20.0, 14.0, 21.0, 21.0, 25.0, 22.0, 30.0, 24.0, 28.0, 33.0, 29.0, 38.0, 33.0, 42.0, 44.0, 29.0, 38.0, 34.0, 43.0, 38.0, 41.0, 43.0, 29.0, 36.0, 23.0, 15.0, 16.0, 16.0, 14.0, 9.0, 10.0, 12.0, 15.0, 9.0, 9.0, 5.0, 8.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-6.314723014831543, -6.115884780883789, -5.917046070098877, -5.718207836151123, -5.519369125366211, -5.320530891418457, -5.121692657470703, -4.922853946685791, -4.724015235900879, -4.525177001953125, -4.326338291168213, -4.127500057220459, -3.928661346435547, -3.729823112487793, -3.53098464012146, -3.332146167755127, -3.133307933807373, -2.93446946144104, -2.735630989074707, -2.536792755126953, -2.337954044342041, -2.139115810394287, -1.940277338027954, -1.741438865661621, -1.542600393295288, -1.343761920928955, -1.144923448562622, -0.9460850954055786, -0.7472466230392456, -0.5484081506729126, -0.34956979751586914, -0.15073132514953613, 0.04810762405395508, 0.2469460666179657, 0.4457845091819763, 0.6446229219436646, 0.8434613943099976, 1.0422998666763306, 1.241138219833374, 1.439976692199707, 1.63881516456604, 1.837653636932373, 2.036492109298706, 2.235330581665039, 2.434168815612793, 2.633007526397705, 2.831845760345459, 3.030684232711792, 3.229522705078125, 3.428361177444458, 3.627199649810791, 3.826037883758545, 4.024876594543457, 4.223714828491211, 4.422553062438965, 4.621391773223877, 4.820230484008789, 5.019068717956543, 5.217907428741455, 5.416745662689209, 5.615584373474121, 5.814422607421875, 6.013260841369629, 6.212099552154541, 6.410937786102295]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 9.0, 6.0, 21.0, 37.0, 33.0, 65.0, 125.0, 213.0, 368.0, 627.0, 1176.0, 2224.0, 4520.0, 9545.0, 20496.0, 44412.0, 94831.0, 184226.0, 263943.0, 209214.0, 111884.0, 53235.0, 24527.0, 11509.0, 5516.0, 2669.0, 1355.0, 743.0, 433.0, 212.0, 136.0, 87.0, 56.0, 25.0, 24.0, 10.0, 12.0, 11.0, 2.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.8302001953125, -7.574462890625, -7.3187255859375, -7.06298828125, -6.8072509765625, -6.551513671875, -6.2957763671875, -6.0400390625, -5.7843017578125, -5.528564453125, -5.2728271484375, -5.01708984375, -4.7613525390625, -4.505615234375, -4.2498779296875, -3.994140625, -3.7384033203125, -3.482666015625, -3.2269287109375, -2.97119140625, -2.7154541015625, -2.459716796875, -2.2039794921875, -1.9482421875, -1.6925048828125, -1.436767578125, -1.1810302734375, -0.92529296875, -0.6695556640625, -0.413818359375, -0.1580810546875, 0.09765625, 0.3533935546875, 0.609130859375, 0.8648681640625, 1.12060546875, 1.3763427734375, 1.632080078125, 1.8878173828125, 2.1435546875, 2.3992919921875, 2.655029296875, 2.9107666015625, 3.16650390625, 3.4222412109375, 3.677978515625, 3.9337158203125, 4.189453125, 4.4451904296875, 4.700927734375, 4.9566650390625, 5.21240234375, 5.4681396484375, 5.723876953125, 5.9796142578125, 6.2353515625, 6.4910888671875, 6.746826171875, 7.0025634765625, 7.25830078125, 7.5140380859375, 7.769775390625, 8.0255126953125, 8.28125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 6.0, 11.0, 15.0, 21.0, 24.0, 16.0, 35.0, 28.0, 29.0, 56.0, 54.0, 69.0, 48.0, 61.0, 62.0, 54.0, 48.0, 58.0, 52.0, 43.0, 34.0, 26.0, 23.0, 24.0, 16.0, 20.0, 13.0, 15.0, 6.0, 6.0, 7.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.43341064453125, -7.2222900390625, -7.01116943359375, -6.800048828125, -6.58892822265625, -6.3778076171875, -6.16668701171875, -5.95556640625, -5.74444580078125, -5.5333251953125, -5.32220458984375, -5.111083984375, -4.89996337890625, -4.6888427734375, -4.47772216796875, -4.2666015625, -4.05548095703125, -3.8443603515625, -3.63323974609375, -3.422119140625, -3.21099853515625, -2.9998779296875, -2.78875732421875, -2.57763671875, -2.36651611328125, -2.1553955078125, -1.94427490234375, -1.733154296875, -1.52203369140625, -1.3109130859375, -1.09979248046875, -0.888671875, -0.67755126953125, -0.4664306640625, -0.25531005859375, -0.044189453125, 0.16693115234375, 0.3780517578125, 0.58917236328125, 0.80029296875, 1.01141357421875, 1.2225341796875, 1.43365478515625, 1.644775390625, 1.85589599609375, 2.0670166015625, 2.27813720703125, 2.4892578125, 2.70037841796875, 2.9114990234375, 3.12261962890625, 3.333740234375, 3.54486083984375, 3.7559814453125, 3.96710205078125, 4.17822265625, 4.38934326171875, 4.6004638671875, 4.81158447265625, 5.022705078125, 5.23382568359375, 5.4449462890625, 5.65606689453125, 5.8671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 11.0, 14.0, 13.0, 25.0, 41.0, 73.0, 128.0, 283.0, 610.0, 1512.0, 7372.0, 190279.0, 811117.0, 32220.0, 2985.0, 990.0, 409.0, 206.0, 97.0, 51.0, 23.0, 25.0, 15.0, 10.0, 5.0, 9.0, 2.0, 4.0, 5.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.1904296875, -34.099609375, -33.0087890625, -31.91796875, -30.8271484375, -29.736328125, -28.6455078125, -27.5546875, -26.4638671875, -25.373046875, -24.2822265625, -23.19140625, -22.1005859375, -21.009765625, -19.9189453125, -18.828125, -17.7373046875, -16.646484375, -15.5556640625, -14.46484375, -13.3740234375, -12.283203125, -11.1923828125, -10.1015625, -9.0107421875, -7.919921875, -6.8291015625, -5.73828125, -4.6474609375, -3.556640625, -2.4658203125, -1.375, -0.2841796875, 0.806640625, 1.8974609375, 2.98828125, 4.0791015625, 5.169921875, 6.2607421875, 7.3515625, 8.4423828125, 9.533203125, 10.6240234375, 11.71484375, 12.8056640625, 13.896484375, 14.9873046875, 16.078125, 17.1689453125, 18.259765625, 19.3505859375, 20.44140625, 21.5322265625, 22.623046875, 23.7138671875, 24.8046875, 25.8955078125, 26.986328125, 28.0771484375, 29.16796875, 30.2587890625, 31.349609375, 32.4404296875, 33.53125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 14.0, 6.0, 8.0, 10.0, 12.0, 23.0, 19.0, 23.0, 24.0, 36.0, 30.0, 26.0, 56.0, 45.0, 45.0, 35.0, 50.0, 51.0, 48.0, 46.0, 44.0, 39.0, 43.0, 45.0, 32.0, 36.0, 40.0, 24.0, 11.0, 20.0, 15.0, 10.0, 8.0, 6.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-30.859375, -30.01025390625, -29.1611328125, -28.31201171875, -27.462890625, -26.61376953125, -25.7646484375, -24.91552734375, -24.06640625, -23.21728515625, -22.3681640625, -21.51904296875, -20.669921875, -19.82080078125, -18.9716796875, -18.12255859375, -17.2734375, -16.42431640625, -15.5751953125, -14.72607421875, -13.876953125, -13.02783203125, -12.1787109375, -11.32958984375, -10.48046875, -9.63134765625, -8.7822265625, -7.93310546875, -7.083984375, -6.23486328125, -5.3857421875, -4.53662109375, -3.6875, -2.83837890625, -1.9892578125, -1.14013671875, -0.291015625, 0.55810546875, 1.4072265625, 2.25634765625, 3.10546875, 3.95458984375, 4.8037109375, 5.65283203125, 6.501953125, 7.35107421875, 8.2001953125, 9.04931640625, 9.8984375, 10.74755859375, 11.5966796875, 12.44580078125, 13.294921875, 14.14404296875, 14.9931640625, 15.84228515625, 16.69140625, 17.54052734375, 18.3896484375, 19.23876953125, 20.087890625, 20.93701171875, 21.7861328125, 22.63525390625, 23.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 4.0, 3.0, 11.0, 15.0, 12.0, 31.0, 57.0, 68.0, 122.0, 234.0, 541.0, 1401.0, 6667.0, 119121.0, 873957.0, 40647.0, 3786.0, 995.0, 415.0, 185.0, 92.0, 66.0, 52.0, 25.0, 12.0, 11.0, 6.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.171875, -22.6114501953125, -22.051025390625, -21.4906005859375, -20.93017578125, -20.3697509765625, -19.809326171875, -19.2489013671875, -18.6884765625, -18.1280517578125, -17.567626953125, -17.0072021484375, -16.44677734375, -15.8863525390625, -15.325927734375, -14.7655029296875, -14.205078125, -13.6446533203125, -13.084228515625, -12.5238037109375, -11.96337890625, -11.4029541015625, -10.842529296875, -10.2821044921875, -9.7216796875, -9.1612548828125, -8.600830078125, -8.0404052734375, -7.47998046875, -6.9195556640625, -6.359130859375, -5.7987060546875, -5.23828125, -4.6778564453125, -4.117431640625, -3.5570068359375, -2.99658203125, -2.4361572265625, -1.875732421875, -1.3153076171875, -0.7548828125, -0.1944580078125, 0.365966796875, 0.9263916015625, 1.48681640625, 2.0472412109375, 2.607666015625, 3.1680908203125, 3.728515625, 4.2889404296875, 4.849365234375, 5.4097900390625, 5.97021484375, 6.5306396484375, 7.091064453125, 7.6514892578125, 8.2119140625, 8.7723388671875, 9.332763671875, 9.8931884765625, 10.45361328125, 11.0140380859375, 11.574462890625, 12.1348876953125, 12.6953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 14.0, 12.0, 19.0, 22.0, 20.0, 39.0, 30.0, 39.0, 73.0, 90.0, 113.0, 87.0, 92.0, 79.0, 56.0, 41.0, 25.0, 31.0, 23.0, 19.0, 17.0, 12.0, 7.0, 8.0, 2.0, 7.0, 7.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014171600341796875, -0.0013687461614608765, -0.0013203322887420654, -0.0012719184160232544, -0.0012235045433044434, -0.0011750906705856323, -0.0011266767978668213, -0.0010782629251480103, -0.0010298490524291992, -0.0009814351797103882, -0.0009330213069915771, -0.0008846074342727661, -0.0008361935615539551, -0.000787779688835144, -0.000739365816116333, -0.000690951943397522, -0.0006425380706787109, -0.0005941241979598999, -0.0005457103252410889, -0.0004972964525222778, -0.0004488825798034668, -0.00040046870708465576, -0.0003520548343658447, -0.0003036409616470337, -0.00025522708892822266, -0.00020681321620941162, -0.00015839934349060059, -0.00010998547077178955, -6.157159805297852e-05, -1.315772533416748e-05, 3.5256147384643555e-05, 8.367002010345459e-05, 0.00013208389282226562, 0.00018049776554107666, 0.0002289116382598877, 0.00027732551097869873, 0.00032573938369750977, 0.0003741532564163208, 0.00042256712913513184, 0.00047098100185394287, 0.0005193948745727539, 0.0005678087472915649, 0.000616222620010376, 0.000664636492729187, 0.000713050365447998, 0.0007614642381668091, 0.0008098781108856201, 0.0008582919836044312, 0.0009067058563232422, 0.0009551197290420532, 0.0010035336017608643, 0.0010519474744796753, 0.0011003613471984863, 0.0011487752199172974, 0.0011971890926361084, 0.0012456029653549194, 0.0012940168380737305, 0.0013424307107925415, 0.0013908445835113525, 0.0014392584562301636, 0.0014876723289489746, 0.0015360862016677856, 0.0015845000743865967, 0.0016329139471054077, 0.0016813278198242188]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 7.0, 18.0, 24.0, 33.0, 62.0, 112.0, 231.0, 434.0, 1127.0, 3291.0, 17682.0, 278770.0, 699393.0, 39126.0, 5405.0, 1634.0, 617.0, 256.0, 128.0, 90.0, 43.0, 20.0, 13.0, 8.0, 10.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.265625, -13.776611328125, -13.28759765625, -12.798583984375, -12.3095703125, -11.820556640625, -11.33154296875, -10.842529296875, -10.353515625, -9.864501953125, -9.37548828125, -8.886474609375, -8.3974609375, -7.908447265625, -7.41943359375, -6.930419921875, -6.44140625, -5.952392578125, -5.46337890625, -4.974365234375, -4.4853515625, -3.996337890625, -3.50732421875, -3.018310546875, -2.529296875, -2.040283203125, -1.55126953125, -1.062255859375, -0.5732421875, -0.084228515625, 0.40478515625, 0.893798828125, 1.3828125, 1.871826171875, 2.36083984375, 2.849853515625, 3.3388671875, 3.827880859375, 4.31689453125, 4.805908203125, 5.294921875, 5.783935546875, 6.27294921875, 6.761962890625, 7.2509765625, 7.739990234375, 8.22900390625, 8.718017578125, 9.20703125, 9.696044921875, 10.18505859375, 10.674072265625, 11.1630859375, 11.652099609375, 12.14111328125, 12.630126953125, 13.119140625, 13.608154296875, 14.09716796875, 14.586181640625, 15.0751953125, 15.564208984375, 16.05322265625, 16.542236328125, 17.03125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 8.0, 14.0, 12.0, 20.0, 34.0, 25.0, 40.0, 64.0, 80.0, 91.0, 110.0, 104.0, 82.0, 83.0, 60.0, 49.0, 31.0, 21.0, 19.0, 18.0, 5.0, 8.0, 6.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5078125, -13.1597900390625, -12.811767578125, -12.4637451171875, -12.11572265625, -11.7677001953125, -11.419677734375, -11.0716552734375, -10.7236328125, -10.3756103515625, -10.027587890625, -9.6795654296875, -9.33154296875, -8.9835205078125, -8.635498046875, -8.2874755859375, -7.939453125, -7.5914306640625, -7.243408203125, -6.8953857421875, -6.54736328125, -6.1993408203125, -5.851318359375, -5.5032958984375, -5.1552734375, -4.8072509765625, -4.459228515625, -4.1112060546875, -3.76318359375, -3.4151611328125, -3.067138671875, -2.7191162109375, -2.37109375, -2.0230712890625, -1.675048828125, -1.3270263671875, -0.97900390625, -0.6309814453125, -0.282958984375, 0.0650634765625, 0.4130859375, 0.7611083984375, 1.109130859375, 1.4571533203125, 1.80517578125, 2.1531982421875, 2.501220703125, 2.8492431640625, 3.197265625, 3.5452880859375, 3.893310546875, 4.2413330078125, 4.58935546875, 4.9373779296875, 5.285400390625, 5.6334228515625, 5.9814453125, 6.3294677734375, 6.677490234375, 7.0255126953125, 7.37353515625, 7.7215576171875, 8.069580078125, 8.4176025390625, 8.765625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 8.0, 9.0, 36.0, 62.0, 199.0, 273.0, 228.0, 127.0, 41.0, 14.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-301.7027587890625, -293.015380859375, -284.3280029296875, -275.640625, -266.9532470703125, -258.265869140625, -249.5784912109375, -240.89111328125, -232.2037353515625, -223.516357421875, -214.8289794921875, -206.1416015625, -197.4542236328125, -188.766845703125, -180.0794677734375, -171.39208984375, -162.7047119140625, -154.017333984375, -145.3299560546875, -136.642578125, -127.9552001953125, -119.267822265625, -110.5804443359375, -101.89306640625, -93.2056884765625, -84.518310546875, -75.8309326171875, -67.1435546875, -58.4561767578125, -49.768798828125, -41.0814208984375, -32.39404296875, -23.706634521484375, -15.019256591796875, -6.331878662109375, 2.355499267578125, 11.042877197265625, 19.730255126953125, 28.417633056640625, 37.105010986328125, 45.792388916015625, 54.479766845703125, 63.167144775390625, 71.85452270507812, 80.54190063476562, 89.22927856445312, 97.91665649414062, 106.60403442382812, 115.29141235351562, 123.97879028320312, 132.66616821289062, 141.35354614257812, 150.04092407226562, 158.72830200195312, 167.41567993164062, 176.10305786132812, 184.79043579101562, 193.47781372070312, 202.16519165039062, 210.85256958007812, 219.53994750976562, 228.22732543945312, 236.91470336914062, 245.60208129882812, 254.28945922851562]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 3.0, 7.0, 13.0, 24.0, 21.0, 13.0, 18.0, 29.0, 38.0, 22.0, 32.0, 43.0, 49.0, 42.0, 50.0, 56.0, 64.0, 59.0, 49.0, 52.0, 38.0, 34.0, 47.0, 32.0, 19.0, 25.0, 19.0, 18.0, 14.0, 13.0, 8.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.3512954711914, -123.29072570800781, -119.23015594482422, -115.16958618164062, -111.1090087890625, -107.04844665527344, -102.98786926269531, -98.92729949951172, -94.86672973632812, -90.80615997314453, -86.74559020996094, -82.68502044677734, -78.62445068359375, -74.56387329101562, -70.50330352783203, -66.44273376464844, -62.382164001464844, -58.32159423828125, -54.261024475097656, -50.2004508972168, -46.1398811340332, -42.07931137084961, -38.01873779296875, -33.958168029785156, -29.897598266601562, -25.83702850341797, -21.776456832885742, -17.715885162353516, -13.655315399169922, -9.594745635986328, -5.534173965454102, -1.473602294921875, 2.5869598388671875, 6.647530555725098, 10.708101272583008, 14.768671989440918, 18.829242706298828, 22.889812469482422, 26.95038414001465, 31.010955810546875, 35.07152557373047, 39.13209533691406, 43.192665100097656, 47.253238677978516, 51.31380844116211, 55.3743782043457, 59.43495178222656, 63.495521545410156, 67.55609130859375, 71.61666107177734, 75.67723083496094, 79.73780059814453, 83.79837036132812, 87.85894775390625, 91.91951751708984, 95.98008728027344, 100.04065704345703, 104.10122680664062, 108.16179656982422, 112.22236633300781, 116.28294372558594, 120.343505859375, 124.40408325195312, 128.46466064453125, 132.5252227783203]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 13.0, 20.0, 30.0, 43.0, 48.0, 108.0, 144.0, 270.0, 482.0, 888.0, 2019.0, 5119.0, 17727.0, 156354.0, 3935763.0, 57589.0, 10910.0, 3543.0, 1482.0, 706.0, 410.0, 220.0, 124.0, 89.0, 56.0, 33.0, 20.0, 15.0, 10.0, 11.0, 12.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.5625, -23.88623046875, -23.2099609375, -22.53369140625, -21.857421875, -21.18115234375, -20.5048828125, -19.82861328125, -19.15234375, -18.47607421875, -17.7998046875, -17.12353515625, -16.447265625, -15.77099609375, -15.0947265625, -14.41845703125, -13.7421875, -13.06591796875, -12.3896484375, -11.71337890625, -11.037109375, -10.36083984375, -9.6845703125, -9.00830078125, -8.33203125, -7.65576171875, -6.9794921875, -6.30322265625, -5.626953125, -4.95068359375, -4.2744140625, -3.59814453125, -2.921875, -2.24560546875, -1.5693359375, -0.89306640625, -0.216796875, 0.45947265625, 1.1357421875, 1.81201171875, 2.48828125, 3.16455078125, 3.8408203125, 4.51708984375, 5.193359375, 5.86962890625, 6.5458984375, 7.22216796875, 7.8984375, 8.57470703125, 9.2509765625, 9.92724609375, 10.603515625, 11.27978515625, 11.9560546875, 12.63232421875, 13.30859375, 13.98486328125, 14.6611328125, 15.33740234375, 16.013671875, 16.68994140625, 17.3662109375, 18.04248046875, 18.71875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 9.0, 5.0, 11.0, 15.0, 19.0, 16.0, 19.0, 24.0, 37.0, 30.0, 45.0, 36.0, 48.0, 60.0, 75.0, 60.0, 72.0, 52.0, 43.0, 48.0, 59.0, 32.0, 25.0, 27.0, 35.0, 24.0, 12.0, 12.0, 8.0, 5.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.27734375, -7.07220458984375, -6.8670654296875, -6.66192626953125, -6.456787109375, -6.25164794921875, -6.0465087890625, -5.84136962890625, -5.63623046875, -5.43109130859375, -5.2259521484375, -5.02081298828125, -4.815673828125, -4.61053466796875, -4.4053955078125, -4.20025634765625, -3.9951171875, -3.78997802734375, -3.5848388671875, -3.37969970703125, -3.174560546875, -2.96942138671875, -2.7642822265625, -2.55914306640625, -2.35400390625, -2.14886474609375, -1.9437255859375, -1.73858642578125, -1.533447265625, -1.32830810546875, -1.1231689453125, -0.91802978515625, -0.712890625, -0.50775146484375, -0.3026123046875, -0.09747314453125, 0.107666015625, 0.31280517578125, 0.5179443359375, 0.72308349609375, 0.92822265625, 1.13336181640625, 1.3385009765625, 1.54364013671875, 1.748779296875, 1.95391845703125, 2.1590576171875, 2.36419677734375, 2.5693359375, 2.77447509765625, 2.9796142578125, 3.18475341796875, 3.389892578125, 3.59503173828125, 3.8001708984375, 4.00531005859375, 4.21044921875, 4.41558837890625, 4.6207275390625, 4.82586669921875, 5.031005859375, 5.23614501953125, 5.4412841796875, 5.64642333984375, 5.8515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 15.0, 19.0, 30.0, 42.0, 60.0, 80.0, 132.0, 188.0, 257.0, 476.0, 722.0, 1187.0, 2148.0, 4588.0, 11468.0, 41736.0, 662319.0, 3386632.0, 57131.0, 13983.0, 5201.0, 2445.0, 1282.0, 768.0, 451.0, 285.0, 180.0, 139.0, 109.0, 64.0, 39.0, 26.0, 19.0, 13.0, 11.0, 9.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.56298828125, -17.0322265625, -16.50146484375, -15.970703125, -15.43994140625, -14.9091796875, -14.37841796875, -13.84765625, -13.31689453125, -12.7861328125, -12.25537109375, -11.724609375, -11.19384765625, -10.6630859375, -10.13232421875, -9.6015625, -9.07080078125, -8.5400390625, -8.00927734375, -7.478515625, -6.94775390625, -6.4169921875, -5.88623046875, -5.35546875, -4.82470703125, -4.2939453125, -3.76318359375, -3.232421875, -2.70166015625, -2.1708984375, -1.64013671875, -1.109375, -0.57861328125, -0.0478515625, 0.48291015625, 1.013671875, 1.54443359375, 2.0751953125, 2.60595703125, 3.13671875, 3.66748046875, 4.1982421875, 4.72900390625, 5.259765625, 5.79052734375, 6.3212890625, 6.85205078125, 7.3828125, 7.91357421875, 8.4443359375, 8.97509765625, 9.505859375, 10.03662109375, 10.5673828125, 11.09814453125, 11.62890625, 12.15966796875, 12.6904296875, 13.22119140625, 13.751953125, 14.28271484375, 14.8134765625, 15.34423828125, 15.875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 5.0, 14.0, 9.0, 12.0, 20.0, 35.0, 58.0, 129.0, 312.0, 2594.0, 518.0, 160.0, 58.0, 43.0, 25.0, 20.0, 17.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80859375, -7.576416015625, -7.34423828125, -7.112060546875, -6.8798828125, -6.647705078125, -6.41552734375, -6.183349609375, -5.951171875, -5.718994140625, -5.48681640625, -5.254638671875, -5.0224609375, -4.790283203125, -4.55810546875, -4.325927734375, -4.09375, -3.861572265625, -3.62939453125, -3.397216796875, -3.1650390625, -2.932861328125, -2.70068359375, -2.468505859375, -2.236328125, -2.004150390625, -1.77197265625, -1.539794921875, -1.3076171875, -1.075439453125, -0.84326171875, -0.611083984375, -0.37890625, -0.146728515625, 0.08544921875, 0.317626953125, 0.5498046875, 0.781982421875, 1.01416015625, 1.246337890625, 1.478515625, 1.710693359375, 1.94287109375, 2.175048828125, 2.4072265625, 2.639404296875, 2.87158203125, 3.103759765625, 3.3359375, 3.568115234375, 3.80029296875, 4.032470703125, 4.2646484375, 4.496826171875, 4.72900390625, 4.961181640625, 5.193359375, 5.425537109375, 5.65771484375, 5.889892578125, 6.1220703125, 6.354248046875, 6.58642578125, 6.818603515625, 7.05078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 12.0, 31.0, 72.0, 193.0, 260.0, 197.0, 125.0, 59.0, 19.0, 13.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.33196258544922, -45.96194839477539, -43.59193420410156, -41.221920013427734, -38.851905822753906, -36.481895446777344, -34.111881256103516, -31.741867065429688, -29.37185287475586, -27.00183868408203, -24.631824493408203, -22.261812210083008, -19.89179801940918, -17.52178382873535, -15.15177059173584, -12.781757354736328, -10.4117431640625, -8.041728973388672, -5.67171573638916, -3.3017020225524902, -0.9316883087158203, 1.4383258819580078, 3.8083391189575195, 6.178352355957031, 8.54836654663086, 10.918380737304688, 13.2883939743042, 15.658407211303711, 18.02842140197754, 20.398435592651367, 22.768447875976562, 25.13846206665039, 27.508468627929688, 29.878482818603516, 32.248497009277344, 34.61851119995117, 36.988525390625, 39.35853576660156, 41.72854995727539, 44.09856414794922, 46.46857833862305, 48.838592529296875, 51.2086067199707, 53.57862091064453, 55.948631286621094, 58.31864929199219, 60.68865966796875, 63.05867385864258, 65.4286880493164, 67.79869842529297, 70.16871643066406, 72.53872680664062, 74.90874481201172, 77.27875518798828, 79.64877319335938, 82.01878356933594, 84.3887939453125, 86.75880432128906, 89.12882232666016, 91.49883270263672, 93.86885070800781, 96.23886108398438, 98.60887908935547, 100.97888946533203, 103.34890747070312]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 4.0, 5.0, 5.0, 6.0, 11.0, 10.0, 18.0, 22.0, 19.0, 20.0, 30.0, 38.0, 43.0, 43.0, 42.0, 46.0, 56.0, 55.0, 44.0, 54.0, 52.0, 48.0, 44.0, 43.0, 35.0, 48.0, 31.0, 28.0, 21.0, 15.0, 20.0, 14.0, 2.0, 11.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09188461303711, -18.37574005126953, -17.659595489501953, -16.943450927734375, -16.227306365966797, -15.511161804199219, -14.795016288757324, -14.078871726989746, -13.362727165222168, -12.64658260345459, -11.930438041687012, -11.214292526245117, -10.498147964477539, -9.782003402709961, -9.065858840942383, -8.349714279174805, -7.633569717407227, -6.917425155639648, -6.20128059387207, -5.485135555267334, -4.768990993499756, -4.052846431732178, -3.3367013931274414, -2.6205568313598633, -1.9044122695922852, -1.1882675886154175, -0.4721229076385498, 0.24402189254760742, 0.9601664543151855, 1.6763110160827637, 2.3924560546875, 3.108600616455078, 3.8247451782226562, 4.540889739990234, 5.2570343017578125, 5.973179340362549, 6.689323902130127, 7.405468463897705, 8.121613502502441, 8.83775806427002, 9.553902626037598, 10.270047187805176, 10.986191749572754, 11.702337265014648, 12.418481826782227, 13.134626388549805, 13.850770950317383, 14.566915512084961, 15.283060073852539, 15.999204635620117, 16.715349197387695, 17.431493759155273, 18.14763832092285, 18.86378288269043, 19.57992935180664, 20.29607391357422, 21.012218475341797, 21.728363037109375, 22.444507598876953, 23.16065216064453, 23.87679672241211, 24.592941284179688, 25.309085845947266, 26.025230407714844, 26.741374969482422]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 7.0, 17.0, 26.0, 25.0, 70.0, 116.0, 176.0, 331.0, 535.0, 1029.0, 1967.0, 4409.0, 10151.0, 25252.0, 67966.0, 184712.0, 357084.0, 243136.0, 92905.0, 34179.0, 13356.0, 5745.0, 2523.0, 1290.0, 658.0, 367.0, 190.0, 114.0, 61.0, 52.0, 35.0, 23.0, 10.0, 12.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3671875, -10.017578125, -9.66796875, -9.318359375, -8.96875, -8.619140625, -8.26953125, -7.919921875, -7.5703125, -7.220703125, -6.87109375, -6.521484375, -6.171875, -5.822265625, -5.47265625, -5.123046875, -4.7734375, -4.423828125, -4.07421875, -3.724609375, -3.375, -3.025390625, -2.67578125, -2.326171875, -1.9765625, -1.626953125, -1.27734375, -0.927734375, -0.578125, -0.228515625, 0.12109375, 0.470703125, 0.8203125, 1.169921875, 1.51953125, 1.869140625, 2.21875, 2.568359375, 2.91796875, 3.267578125, 3.6171875, 3.966796875, 4.31640625, 4.666015625, 5.015625, 5.365234375, 5.71484375, 6.064453125, 6.4140625, 6.763671875, 7.11328125, 7.462890625, 7.8125, 8.162109375, 8.51171875, 8.861328125, 9.2109375, 9.560546875, 9.91015625, 10.259765625, 10.609375, 10.958984375, 11.30859375, 11.658203125, 12.0078125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 0.0, 4.0, 6.0, 6.0, 4.0, 11.0, 10.0, 22.0, 6.0, 15.0, 17.0, 22.0, 37.0, 31.0, 43.0, 50.0, 58.0, 42.0, 58.0, 58.0, 54.0, 53.0, 60.0, 54.0, 46.0, 37.0, 24.0, 33.0, 24.0, 29.0, 22.0, 15.0, 10.0, 11.0, 10.0, 8.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.96484375, -6.760009765625, -6.55517578125, -6.350341796875, -6.1455078125, -5.940673828125, -5.73583984375, -5.531005859375, -5.326171875, -5.121337890625, -4.91650390625, -4.711669921875, -4.5068359375, -4.302001953125, -4.09716796875, -3.892333984375, -3.6875, -3.482666015625, -3.27783203125, -3.072998046875, -2.8681640625, -2.663330078125, -2.45849609375, -2.253662109375, -2.048828125, -1.843994140625, -1.63916015625, -1.434326171875, -1.2294921875, -1.024658203125, -0.81982421875, -0.614990234375, -0.41015625, -0.205322265625, -0.00048828125, 0.204345703125, 0.4091796875, 0.614013671875, 0.81884765625, 1.023681640625, 1.228515625, 1.433349609375, 1.63818359375, 1.843017578125, 2.0478515625, 2.252685546875, 2.45751953125, 2.662353515625, 2.8671875, 3.072021484375, 3.27685546875, 3.481689453125, 3.6865234375, 3.891357421875, 4.09619140625, 4.301025390625, 4.505859375, 4.710693359375, 4.91552734375, 5.120361328125, 5.3251953125, 5.530029296875, 5.73486328125, 5.939697265625, 6.14453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 10.0, 12.0, 4.0, 19.0, 19.0, 25.0, 45.0, 55.0, 118.0, 183.0, 297.0, 561.0, 1365.0, 4655.0, 45907.0, 834003.0, 148664.0, 9006.0, 1931.0, 751.0, 342.0, 192.0, 126.0, 84.0, 44.0, 35.0, 22.0, 19.0, 12.0, 15.0, 5.0, 13.0, 2.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.3125, -37.238525390625, -36.16455078125, -35.090576171875, -34.0166015625, -32.942626953125, -31.86865234375, -30.794677734375, -29.720703125, -28.646728515625, -27.57275390625, -26.498779296875, -25.4248046875, -24.350830078125, -23.27685546875, -22.202880859375, -21.12890625, -20.054931640625, -18.98095703125, -17.906982421875, -16.8330078125, -15.759033203125, -14.68505859375, -13.611083984375, -12.537109375, -11.463134765625, -10.38916015625, -9.315185546875, -8.2412109375, -7.167236328125, -6.09326171875, -5.019287109375, -3.9453125, -2.871337890625, -1.79736328125, -0.723388671875, 0.3505859375, 1.424560546875, 2.49853515625, 3.572509765625, 4.646484375, 5.720458984375, 6.79443359375, 7.868408203125, 8.9423828125, 10.016357421875, 11.09033203125, 12.164306640625, 13.23828125, 14.312255859375, 15.38623046875, 16.460205078125, 17.5341796875, 18.608154296875, 19.68212890625, 20.756103515625, 21.830078125, 22.904052734375, 23.97802734375, 25.052001953125, 26.1259765625, 27.199951171875, 28.27392578125, 29.347900390625, 30.421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 3.0, 6.0, 7.0, 8.0, 15.0, 15.0, 18.0, 13.0, 20.0, 19.0, 22.0, 43.0, 28.0, 31.0, 28.0, 48.0, 37.0, 33.0, 37.0, 53.0, 52.0, 48.0, 41.0, 35.0, 48.0, 40.0, 42.0, 20.0, 32.0, 21.0, 21.0, 15.0, 19.0, 20.0, 9.0, 9.0, 8.0, 4.0, 9.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-23.28125, -22.603515625, -21.92578125, -21.248046875, -20.5703125, -19.892578125, -19.21484375, -18.537109375, -17.859375, -17.181640625, -16.50390625, -15.826171875, -15.1484375, -14.470703125, -13.79296875, -13.115234375, -12.4375, -11.759765625, -11.08203125, -10.404296875, -9.7265625, -9.048828125, -8.37109375, -7.693359375, -7.015625, -6.337890625, -5.66015625, -4.982421875, -4.3046875, -3.626953125, -2.94921875, -2.271484375, -1.59375, -0.916015625, -0.23828125, 0.439453125, 1.1171875, 1.794921875, 2.47265625, 3.150390625, 3.828125, 4.505859375, 5.18359375, 5.861328125, 6.5390625, 7.216796875, 7.89453125, 8.572265625, 9.25, 9.927734375, 10.60546875, 11.283203125, 11.9609375, 12.638671875, 13.31640625, 13.994140625, 14.671875, 15.349609375, 16.02734375, 16.705078125, 17.3828125, 18.060546875, 18.73828125, 19.416015625, 20.09375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 10.0, 15.0, 17.0, 32.0, 38.0, 68.0, 84.0, 151.0, 256.0, 425.0, 882.0, 2161.0, 6475.0, 29529.0, 262538.0, 658604.0, 69607.0, 11583.0, 3385.0, 1263.0, 583.0, 319.0, 198.0, 116.0, 52.0, 54.0, 32.0, 19.0, 15.0, 9.0, 6.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7109375, -9.4185791015625, -9.126220703125, -8.8338623046875, -8.54150390625, -8.2491455078125, -7.956787109375, -7.6644287109375, -7.3720703125, -7.0797119140625, -6.787353515625, -6.4949951171875, -6.20263671875, -5.9102783203125, -5.617919921875, -5.3255615234375, -5.033203125, -4.7408447265625, -4.448486328125, -4.1561279296875, -3.86376953125, -3.5714111328125, -3.279052734375, -2.9866943359375, -2.6943359375, -2.4019775390625, -2.109619140625, -1.8172607421875, -1.52490234375, -1.2325439453125, -0.940185546875, -0.6478271484375, -0.35546875, -0.0631103515625, 0.229248046875, 0.5216064453125, 0.81396484375, 1.1063232421875, 1.398681640625, 1.6910400390625, 1.9833984375, 2.2757568359375, 2.568115234375, 2.8604736328125, 3.15283203125, 3.4451904296875, 3.737548828125, 4.0299072265625, 4.322265625, 4.6146240234375, 4.906982421875, 5.1993408203125, 5.49169921875, 5.7840576171875, 6.076416015625, 6.3687744140625, 6.6611328125, 6.9534912109375, 7.245849609375, 7.5382080078125, 7.83056640625, 8.1229248046875, 8.415283203125, 8.7076416015625, 9.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 8.0, 18.0, 22.0, 30.0, 42.0, 54.0, 61.0, 99.0, 135.0, 162.0, 72.0, 59.0, 49.0, 34.0, 32.0, 19.0, 15.0, 16.0, 15.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.002811431884765625, -0.0027356743812561035, -0.002659916877746582, -0.0025841593742370605, -0.002508401870727539, -0.0024326443672180176, -0.002356886863708496, -0.0022811293601989746, -0.002205371856689453, -0.0021296143531799316, -0.00205385684967041, -0.0019780993461608887, -0.0019023418426513672, -0.0018265843391418457, -0.0017508268356323242, -0.0016750693321228027, -0.0015993118286132812, -0.0015235543251037598, -0.0014477968215942383, -0.0013720393180847168, -0.0012962818145751953, -0.0012205243110656738, -0.0011447668075561523, -0.0010690093040466309, -0.0009932518005371094, -0.0009174942970275879, -0.0008417367935180664, -0.0007659792900085449, -0.0006902217864990234, -0.000614464282989502, -0.0005387067794799805, -0.000462949275970459, -0.0003871917724609375, -0.000311434268951416, -0.00023567676544189453, -0.00015991926193237305, -8.416175842285156e-05, -8.404254913330078e-06, 6.73532485961914e-05, 0.0001431107521057129, 0.00021886825561523438, 0.00029462575912475586, 0.00037038326263427734, 0.00044614076614379883, 0.0005218982696533203, 0.0005976557731628418, 0.0006734132766723633, 0.0007491707801818848, 0.0008249282836914062, 0.0009006857872009277, 0.0009764432907104492, 0.0010522007942199707, 0.0011279582977294922, 0.0012037158012390137, 0.0012794733047485352, 0.0013552308082580566, 0.0014309883117675781, 0.0015067458152770996, 0.001582503318786621, 0.0016582608222961426, 0.001734018325805664, 0.0018097758293151855, 0.001885533332824707, 0.0019612908363342285, 0.00203704833984375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 12.0, 34.0, 36.0, 54.0, 58.0, 125.0, 244.0, 392.0, 980.0, 2605.0, 10110.0, 75216.0, 751212.0, 182943.0, 18088.0, 3859.0, 1316.0, 537.0, 275.0, 157.0, 108.0, 58.0, 45.0, 28.0, 14.0, 13.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.09375, -14.7132568359375, -14.332763671875, -13.9522705078125, -13.57177734375, -13.1912841796875, -12.810791015625, -12.4302978515625, -12.0498046875, -11.6693115234375, -11.288818359375, -10.9083251953125, -10.52783203125, -10.1473388671875, -9.766845703125, -9.3863525390625, -9.005859375, -8.6253662109375, -8.244873046875, -7.8643798828125, -7.48388671875, -7.1033935546875, -6.722900390625, -6.3424072265625, -5.9619140625, -5.5814208984375, -5.200927734375, -4.8204345703125, -4.43994140625, -4.0594482421875, -3.678955078125, -3.2984619140625, -2.91796875, -2.5374755859375, -2.156982421875, -1.7764892578125, -1.39599609375, -1.0155029296875, -0.635009765625, -0.2545166015625, 0.1259765625, 0.5064697265625, 0.886962890625, 1.2674560546875, 1.64794921875, 2.0284423828125, 2.408935546875, 2.7894287109375, 3.169921875, 3.5504150390625, 3.930908203125, 4.3114013671875, 4.69189453125, 5.0723876953125, 5.452880859375, 5.8333740234375, 6.2138671875, 6.5943603515625, 6.974853515625, 7.3553466796875, 7.73583984375, 8.1163330078125, 8.496826171875, 8.8773193359375, 9.2578125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 10.0, 9.0, 10.0, 22.0, 26.0, 26.0, 36.0, 45.0, 58.0, 82.0, 71.0, 71.0, 79.0, 87.0, 68.0, 52.0, 52.0, 37.0, 30.0, 32.0, 11.0, 15.0, 12.0, 10.0, 9.0, 5.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.31866455078125, -7.0904541015625, -6.86224365234375, -6.634033203125, -6.40582275390625, -6.1776123046875, -5.94940185546875, -5.72119140625, -5.49298095703125, -5.2647705078125, -5.03656005859375, -4.808349609375, -4.58013916015625, -4.3519287109375, -4.12371826171875, -3.8955078125, -3.66729736328125, -3.4390869140625, -3.21087646484375, -2.982666015625, -2.75445556640625, -2.5262451171875, -2.29803466796875, -2.06982421875, -1.84161376953125, -1.6134033203125, -1.38519287109375, -1.156982421875, -0.92877197265625, -0.7005615234375, -0.47235107421875, -0.244140625, -0.01593017578125, 0.2122802734375, 0.44049072265625, 0.668701171875, 0.89691162109375, 1.1251220703125, 1.35333251953125, 1.58154296875, 1.80975341796875, 2.0379638671875, 2.26617431640625, 2.494384765625, 2.72259521484375, 2.9508056640625, 3.17901611328125, 3.4072265625, 3.63543701171875, 3.8636474609375, 4.09185791015625, 4.320068359375, 4.54827880859375, 4.7764892578125, 5.00469970703125, 5.23291015625, 5.46112060546875, 5.6893310546875, 5.91754150390625, 6.145751953125, 6.37396240234375, 6.6021728515625, 6.83038330078125, 7.05859375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 10.0, 27.0, 79.0, 187.0, 236.0, 226.0, 130.0, 56.0, 18.0, 11.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.1764678955078, -205.19822692871094, -197.22000122070312, -189.24176025390625, -181.26351928710938, -173.2852783203125, -165.3070526123047, -157.3288116455078, -149.3505859375, -141.37234497070312, -133.3941192626953, -125.41587829589844, -117.43763732910156, -109.45940399169922, -101.48117065429688, -93.5029296875, -85.52468872070312, -77.54645538330078, -69.5682144165039, -61.58998107910156, -53.61174392700195, -45.633506774902344, -37.6552734375, -29.67703628540039, -21.69879913330078, -13.720562934875488, -5.742326736450195, 2.2359085083007812, 10.21414566040039, 18.1923828125, 26.170616149902344, 34.14885330200195, 42.1270751953125, 50.10531234741211, 58.08354949951172, 66.06178283691406, 74.04002380371094, 82.01825714111328, 89.99649047851562, 97.9747314453125, 105.95296478271484, 113.93119812011719, 121.90943908691406, 129.88766479492188, 137.86590576171875, 145.84414672851562, 153.8223876953125, 161.8006134033203, 169.7788543701172, 177.75709533691406, 185.73532104492188, 193.71356201171875, 201.69180297851562, 209.6700439453125, 217.6482696533203, 225.6265106201172, 233.604736328125, 241.58297729492188, 249.5612030029297, 257.5394287109375, 265.5176696777344, 273.49591064453125, 281.4741516113281, 289.452392578125, 297.4306335449219]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 3.0, 8.0, 13.0, 9.0, 12.0, 15.0, 9.0, 25.0, 14.0, 26.0, 29.0, 39.0, 36.0, 31.0, 38.0, 33.0, 50.0, 42.0, 51.0, 50.0, 45.0, 42.0, 55.0, 32.0, 46.0, 35.0, 29.0, 28.0, 19.0, 24.0, 27.0, 15.0, 9.0, 14.0, 16.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.564453125, -96.45973205566406, -93.35501098632812, -90.25028991699219, -87.14556884765625, -84.04084777832031, -80.93612670898438, -77.83140563964844, -74.7266845703125, -71.62196350097656, -68.51724243164062, -65.41252136230469, -62.30780029296875, -59.20307922363281, -56.09835433959961, -52.99363327026367, -49.88890838623047, -46.78418731689453, -43.679466247558594, -40.574745178222656, -37.47002410888672, -34.36530303955078, -31.260578155517578, -28.15585708618164, -25.051136016845703, -21.946414947509766, -18.841693878173828, -15.736970901489258, -12.63224983215332, -9.527528762817383, -6.4228057861328125, -3.318084716796875, -0.21337127685546875, 2.891350269317627, 5.996071815490723, 9.100793838500977, 12.205514907836914, 15.310235977172852, 18.414958953857422, 21.51968002319336, 24.624401092529297, 27.729122161865234, 30.833843231201172, 33.938568115234375, 37.04328918457031, 40.14801025390625, 43.25273132324219, 46.357452392578125, 49.46217346191406, 52.56689453125, 55.67161560058594, 58.776336669921875, 61.88105773925781, 64.98577880859375, 68.09049987792969, 71.19522094726562, 74.29994201660156, 77.4046630859375, 80.50938415527344, 83.61410522460938, 86.71882629394531, 89.82354736328125, 92.92826843261719, 96.03298950195312, 99.1377182006836]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 6.0, 14.0, 25.0, 32.0, 41.0, 76.0, 145.0, 263.0, 470.0, 922.0, 1879.0, 4429.0, 11849.0, 41558.0, 323744.0, 3332786.0, 406817.0, 46950.0, 13188.0, 4865.0, 2031.0, 962.0, 528.0, 285.0, 156.0, 92.0, 58.0, 31.0, 14.0, 16.0, 9.0, 5.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.03125, -14.619873046875, -14.20849609375, -13.797119140625, -13.3857421875, -12.974365234375, -12.56298828125, -12.151611328125, -11.740234375, -11.328857421875, -10.91748046875, -10.506103515625, -10.0947265625, -9.683349609375, -9.27197265625, -8.860595703125, -8.44921875, -8.037841796875, -7.62646484375, -7.215087890625, -6.8037109375, -6.392333984375, -5.98095703125, -5.569580078125, -5.158203125, -4.746826171875, -4.33544921875, -3.924072265625, -3.5126953125, -3.101318359375, -2.68994140625, -2.278564453125, -1.8671875, -1.455810546875, -1.04443359375, -0.633056640625, -0.2216796875, 0.189697265625, 0.60107421875, 1.012451171875, 1.423828125, 1.835205078125, 2.24658203125, 2.657958984375, 3.0693359375, 3.480712890625, 3.89208984375, 4.303466796875, 4.71484375, 5.126220703125, 5.53759765625, 5.948974609375, 6.3603515625, 6.771728515625, 7.18310546875, 7.594482421875, 8.005859375, 8.417236328125, 8.82861328125, 9.239990234375, 9.6513671875, 10.062744140625, 10.47412109375, 10.885498046875, 11.296875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 5.0, 10.0, 11.0, 18.0, 16.0, 14.0, 22.0, 27.0, 41.0, 45.0, 47.0, 60.0, 59.0, 48.0, 54.0, 57.0, 52.0, 58.0, 51.0, 47.0, 50.0, 37.0, 30.0, 31.0, 19.0, 23.0, 14.0, 13.0, 10.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -6.0400390625, -5.845703125, -5.6513671875, -5.45703125, -5.2626953125, -5.068359375, -4.8740234375, -4.6796875, -4.4853515625, -4.291015625, -4.0966796875, -3.90234375, -3.7080078125, -3.513671875, -3.3193359375, -3.125, -2.9306640625, -2.736328125, -2.5419921875, -2.34765625, -2.1533203125, -1.958984375, -1.7646484375, -1.5703125, -1.3759765625, -1.181640625, -0.9873046875, -0.79296875, -0.5986328125, -0.404296875, -0.2099609375, -0.015625, 0.1787109375, 0.373046875, 0.5673828125, 0.76171875, 0.9560546875, 1.150390625, 1.3447265625, 1.5390625, 1.7333984375, 1.927734375, 2.1220703125, 2.31640625, 2.5107421875, 2.705078125, 2.8994140625, 3.09375, 3.2880859375, 3.482421875, 3.6767578125, 3.87109375, 4.0654296875, 4.259765625, 4.4541015625, 4.6484375, 4.8427734375, 5.037109375, 5.2314453125, 5.42578125, 5.6201171875, 5.814453125, 6.0087890625, 6.203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 7.0, 5.0, 1.0, 6.0, 9.0, 9.0, 8.0, 16.0, 17.0, 30.0, 43.0, 63.0, 133.0, 251.0, 513.0, 1282.0, 3896.0, 14903.0, 96726.0, 3548930.0, 482343.0, 33976.0, 7449.0, 2177.0, 750.0, 298.0, 175.0, 83.0, 55.0, 41.0, 18.0, 17.0, 14.0, 12.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-24.171875, -23.45556640625, -22.7392578125, -22.02294921875, -21.306640625, -20.59033203125, -19.8740234375, -19.15771484375, -18.44140625, -17.72509765625, -17.0087890625, -16.29248046875, -15.576171875, -14.85986328125, -14.1435546875, -13.42724609375, -12.7109375, -11.99462890625, -11.2783203125, -10.56201171875, -9.845703125, -9.12939453125, -8.4130859375, -7.69677734375, -6.98046875, -6.26416015625, -5.5478515625, -4.83154296875, -4.115234375, -3.39892578125, -2.6826171875, -1.96630859375, -1.25, -0.53369140625, 0.1826171875, 0.89892578125, 1.615234375, 2.33154296875, 3.0478515625, 3.76416015625, 4.48046875, 5.19677734375, 5.9130859375, 6.62939453125, 7.345703125, 8.06201171875, 8.7783203125, 9.49462890625, 10.2109375, 10.92724609375, 11.6435546875, 12.35986328125, 13.076171875, 13.79248046875, 14.5087890625, 15.22509765625, 15.94140625, 16.65771484375, 17.3740234375, 18.09033203125, 18.806640625, 19.52294921875, 20.2392578125, 20.95556640625, 21.671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 3.0, 10.0, 8.0, 9.0, 5.0, 19.0, 15.0, 24.0, 39.0, 49.0, 60.0, 124.0, 252.0, 485.0, 905.0, 879.0, 516.0, 244.0, 119.0, 94.0, 56.0, 38.0, 30.0, 21.0, 14.0, 9.0, 8.0, 11.0, 1.0, 4.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.83447265625, -11.3408203125, -10.84716796875, -10.353515625, -9.85986328125, -9.3662109375, -8.87255859375, -8.37890625, -7.88525390625, -7.3916015625, -6.89794921875, -6.404296875, -5.91064453125, -5.4169921875, -4.92333984375, -4.4296875, -3.93603515625, -3.4423828125, -2.94873046875, -2.455078125, -1.96142578125, -1.4677734375, -0.97412109375, -0.48046875, 0.01318359375, 0.5068359375, 1.00048828125, 1.494140625, 1.98779296875, 2.4814453125, 2.97509765625, 3.46875, 3.96240234375, 4.4560546875, 4.94970703125, 5.443359375, 5.93701171875, 6.4306640625, 6.92431640625, 7.41796875, 7.91162109375, 8.4052734375, 8.89892578125, 9.392578125, 9.88623046875, 10.3798828125, 10.87353515625, 11.3671875, 11.86083984375, 12.3544921875, 12.84814453125, 13.341796875, 13.83544921875, 14.3291015625, 14.82275390625, 15.31640625, 15.81005859375, 16.3037109375, 16.79736328125, 17.291015625, 17.78466796875, 18.2783203125, 18.77197265625, 19.265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 9.0, 34.0, 61.0, 113.0, 176.0, 196.0, 170.0, 93.0, 66.0, 26.0, 21.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.44546508789062, -200.82093811035156, -195.1964111328125, -189.57186889648438, -183.9473419189453, -178.32281494140625, -172.69827270507812, -167.07374572753906, -161.44921875, -155.82469177246094, -150.20016479492188, -144.57562255859375, -138.9510955810547, -133.32656860351562, -127.70203399658203, -122.07749938964844, -116.45297241210938, -110.82844543457031, -105.20391082763672, -99.57937622070312, -93.95484924316406, -88.330322265625, -82.7057876586914, -77.08125305175781, -71.45672607421875, -65.83219909667969, -60.207664489746094, -54.583133697509766, -48.95860290527344, -43.33407211303711, -37.70954132080078, -32.08501052856445, -26.460479736328125, -20.835948944091797, -15.211418151855469, -9.58688735961914, -3.9623565673828125, 1.6621742248535156, 7.286705017089844, 12.911235809326172, 18.5357666015625, 24.160297393798828, 29.784828186035156, 35.409358978271484, 41.03388977050781, 46.65842056274414, 52.28295135498047, 57.9074821472168, 63.532012939453125, 69.15653991699219, 74.78107452392578, 80.40560913085938, 86.03013610839844, 91.6546630859375, 97.2791976928711, 102.90373229980469, 108.52825927734375, 114.15278625488281, 119.7773208618164, 125.40185546875, 131.02638244628906, 136.65090942382812, 142.27545166015625, 147.8999786376953, 153.52450561523438]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 11.0, 8.0, 22.0, 22.0, 17.0, 34.0, 32.0, 33.0, 45.0, 54.0, 43.0, 60.0, 53.0, 52.0, 63.0, 62.0, 56.0, 42.0, 48.0, 35.0, 43.0, 36.0, 25.0, 20.0, 14.0, 16.0, 11.0, 5.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.94668579101562, -70.21439361572266, -67.48210144042969, -64.74980926513672, -62.01751708984375, -59.28522491455078, -56.55292892456055, -53.82063674926758, -51.08834457397461, -48.35605239868164, -45.62376022338867, -42.89146423339844, -40.15917205810547, -37.4268798828125, -34.69458770751953, -31.962295532226562, -29.230003356933594, -26.497711181640625, -23.765419006347656, -21.033124923706055, -18.300832748413086, -15.568540573120117, -12.836246490478516, -10.103954315185547, -7.371662139892578, -4.639369487762451, -1.9070768356323242, 0.8252162933349609, 3.5575084686279297, 6.289800643920898, 9.0220947265625, 11.754386901855469, 14.486679077148438, 17.218971252441406, 19.951263427734375, 22.683557510375977, 25.415849685668945, 28.148141860961914, 30.880435943603516, 33.612728118896484, 36.34502029418945, 39.07731246948242, 41.80960464477539, 44.541900634765625, 47.274192810058594, 50.00648498535156, 52.73877716064453, 55.4710693359375, 58.20336151123047, 60.93565368652344, 63.667945861816406, 66.40023803710938, 69.13253021240234, 71.86482238769531, 74.59712219238281, 77.32940673828125, 80.06170654296875, 82.79399871826172, 85.52629089355469, 88.25858306884766, 90.99087524414062, 93.7231674194336, 96.45545959472656, 99.18775939941406, 101.9200439453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 7.0, 9.0, 8.0, 21.0, 30.0, 41.0, 59.0, 100.0, 157.0, 255.0, 409.0, 695.0, 1216.0, 2151.0, 4282.0, 8832.0, 19162.0, 42858.0, 102329.0, 244536.0, 330661.0, 166154.0, 68541.0, 29242.0, 13388.0, 6136.0, 3174.0, 1698.0, 962.0, 573.0, 323.0, 189.0, 120.0, 71.0, 54.0, 31.0, 23.0, 12.0, 9.0, 9.0, 6.0, 3.0, 7.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.9293212890625, -8.624267578125, -8.3192138671875, -8.01416015625, -7.7091064453125, -7.404052734375, -7.0989990234375, -6.7939453125, -6.4888916015625, -6.183837890625, -5.8787841796875, -5.57373046875, -5.2686767578125, -4.963623046875, -4.6585693359375, -4.353515625, -4.0484619140625, -3.743408203125, -3.4383544921875, -3.13330078125, -2.8282470703125, -2.523193359375, -2.2181396484375, -1.9130859375, -1.6080322265625, -1.302978515625, -0.9979248046875, -0.69287109375, -0.3878173828125, -0.082763671875, 0.2222900390625, 0.52734375, 0.8323974609375, 1.137451171875, 1.4425048828125, 1.74755859375, 2.0526123046875, 2.357666015625, 2.6627197265625, 2.9677734375, 3.2728271484375, 3.577880859375, 3.8829345703125, 4.18798828125, 4.4930419921875, 4.798095703125, 5.1031494140625, 5.408203125, 5.7132568359375, 6.018310546875, 6.3233642578125, 6.62841796875, 6.9334716796875, 7.238525390625, 7.5435791015625, 7.8486328125, 8.1536865234375, 8.458740234375, 8.7637939453125, 9.06884765625, 9.3739013671875, 9.678955078125, 9.9840087890625, 10.2890625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 4.0, 6.0, 11.0, 10.0, 16.0, 17.0, 26.0, 29.0, 22.0, 33.0, 33.0, 36.0, 46.0, 59.0, 55.0, 50.0, 58.0, 46.0, 51.0, 42.0, 46.0, 40.0, 37.0, 39.0, 29.0, 23.0, 20.0, 26.0, 14.0, 20.0, 10.0, 5.0, 10.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9151611328125, -4.732666015625, -4.5501708984375, -4.36767578125, -4.1851806640625, -4.002685546875, -3.8201904296875, -3.6376953125, -3.4552001953125, -3.272705078125, -3.0902099609375, -2.90771484375, -2.7252197265625, -2.542724609375, -2.3602294921875, -2.177734375, -1.9952392578125, -1.812744140625, -1.6302490234375, -1.44775390625, -1.2652587890625, -1.082763671875, -0.9002685546875, -0.7177734375, -0.5352783203125, -0.352783203125, -0.1702880859375, 0.01220703125, 0.1947021484375, 0.377197265625, 0.5596923828125, 0.7421875, 0.9246826171875, 1.107177734375, 1.2896728515625, 1.47216796875, 1.6546630859375, 1.837158203125, 2.0196533203125, 2.2021484375, 2.3846435546875, 2.567138671875, 2.7496337890625, 2.93212890625, 3.1146240234375, 3.297119140625, 3.4796142578125, 3.662109375, 3.8446044921875, 4.027099609375, 4.2095947265625, 4.39208984375, 4.5745849609375, 4.757080078125, 4.9395751953125, 5.1220703125, 5.3045654296875, 5.487060546875, 5.6695556640625, 5.85205078125, 6.0345458984375, 6.217041015625, 6.3995361328125, 6.58203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 9.0, 7.0, 12.0, 18.0, 25.0, 32.0, 68.0, 92.0, 148.0, 277.0, 515.0, 1322.0, 4650.0, 73431.0, 925864.0, 36399.0, 3535.0, 1045.0, 485.0, 243.0, 142.0, 78.0, 42.0, 34.0, 18.0, 16.0, 11.0, 8.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.03125, -50.60205078125, -49.1728515625, -47.74365234375, -46.314453125, -44.88525390625, -43.4560546875, -42.02685546875, -40.59765625, -39.16845703125, -37.7392578125, -36.31005859375, -34.880859375, -33.45166015625, -32.0224609375, -30.59326171875, -29.1640625, -27.73486328125, -26.3056640625, -24.87646484375, -23.447265625, -22.01806640625, -20.5888671875, -19.15966796875, -17.73046875, -16.30126953125, -14.8720703125, -13.44287109375, -12.013671875, -10.58447265625, -9.1552734375, -7.72607421875, -6.296875, -4.86767578125, -3.4384765625, -2.00927734375, -0.580078125, 0.84912109375, 2.2783203125, 3.70751953125, 5.13671875, 6.56591796875, 7.9951171875, 9.42431640625, 10.853515625, 12.28271484375, 13.7119140625, 15.14111328125, 16.5703125, 17.99951171875, 19.4287109375, 20.85791015625, 22.287109375, 23.71630859375, 25.1455078125, 26.57470703125, 28.00390625, 29.43310546875, 30.8623046875, 32.29150390625, 33.720703125, 35.14990234375, 36.5791015625, 38.00830078125, 39.4375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 11.0, 5.0, 6.0, 8.0, 10.0, 19.0, 22.0, 19.0, 31.0, 33.0, 52.0, 40.0, 38.0, 55.0, 51.0, 64.0, 49.0, 47.0, 63.0, 45.0, 44.0, 43.0, 45.0, 33.0, 31.0, 29.0, 22.0, 14.0, 13.0, 16.0, 8.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-34.53125, -33.63330078125, -32.7353515625, -31.83740234375, -30.939453125, -30.04150390625, -29.1435546875, -28.24560546875, -27.34765625, -26.44970703125, -25.5517578125, -24.65380859375, -23.755859375, -22.85791015625, -21.9599609375, -21.06201171875, -20.1640625, -19.26611328125, -18.3681640625, -17.47021484375, -16.572265625, -15.67431640625, -14.7763671875, -13.87841796875, -12.98046875, -12.08251953125, -11.1845703125, -10.28662109375, -9.388671875, -8.49072265625, -7.5927734375, -6.69482421875, -5.796875, -4.89892578125, -4.0009765625, -3.10302734375, -2.205078125, -1.30712890625, -0.4091796875, 0.48876953125, 1.38671875, 2.28466796875, 3.1826171875, 4.08056640625, 4.978515625, 5.87646484375, 6.7744140625, 7.67236328125, 8.5703125, 9.46826171875, 10.3662109375, 11.26416015625, 12.162109375, 13.06005859375, 13.9580078125, 14.85595703125, 15.75390625, 16.65185546875, 17.5498046875, 18.44775390625, 19.345703125, 20.24365234375, 21.1416015625, 22.03955078125, 22.9375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 15.0, 18.0, 35.0, 56.0, 86.0, 141.0, 353.0, 965.0, 3620.0, 39267.0, 923369.0, 73647.0, 4979.0, 1106.0, 412.0, 206.0, 108.0, 57.0, 30.0, 19.0, 13.0, 12.0, 4.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.765625, -23.097900390625, -22.43017578125, -21.762451171875, -21.0947265625, -20.427001953125, -19.75927734375, -19.091552734375, -18.423828125, -17.756103515625, -17.08837890625, -16.420654296875, -15.7529296875, -15.085205078125, -14.41748046875, -13.749755859375, -13.08203125, -12.414306640625, -11.74658203125, -11.078857421875, -10.4111328125, -9.743408203125, -9.07568359375, -8.407958984375, -7.740234375, -7.072509765625, -6.40478515625, -5.737060546875, -5.0693359375, -4.401611328125, -3.73388671875, -3.066162109375, -2.3984375, -1.730712890625, -1.06298828125, -0.395263671875, 0.2724609375, 0.940185546875, 1.60791015625, 2.275634765625, 2.943359375, 3.611083984375, 4.27880859375, 4.946533203125, 5.6142578125, 6.281982421875, 6.94970703125, 7.617431640625, 8.28515625, 8.952880859375, 9.62060546875, 10.288330078125, 10.9560546875, 11.623779296875, 12.29150390625, 12.959228515625, 13.626953125, 14.294677734375, 14.96240234375, 15.630126953125, 16.2978515625, 16.965576171875, 17.63330078125, 18.301025390625, 18.96875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 15.0, 13.0, 18.0, 28.0, 30.0, 31.0, 62.0, 73.0, 163.0, 197.0, 124.0, 73.0, 36.0, 26.0, 29.0, 19.0, 12.0, 11.0, 9.0, 6.0, 4.0, 1.0, 9.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034656524658203125, -0.003367602825164795, -0.0032695531845092773, -0.0031715035438537598, -0.003073453903198242, -0.0029754042625427246, -0.002877354621887207, -0.0027793049812316895, -0.002681255340576172, -0.0025832056999206543, -0.0024851560592651367, -0.002387106418609619, -0.0022890567779541016, -0.002191007137298584, -0.0020929574966430664, -0.001994907855987549, -0.0018968582153320312, -0.0017988085746765137, -0.001700758934020996, -0.0016027092933654785, -0.001504659652709961, -0.0014066100120544434, -0.0013085603713989258, -0.0012105107307434082, -0.0011124610900878906, -0.001014411449432373, -0.0009163618087768555, -0.0008183121681213379, -0.0007202625274658203, -0.0006222128868103027, -0.0005241632461547852, -0.0004261136054992676, -0.00032806396484375, -0.00023001432418823242, -0.00013196468353271484, -3.3915042877197266e-05, 6.413459777832031e-05, 0.0001621842384338379, 0.00026023387908935547, 0.00035828351974487305, 0.0004563331604003906, 0.0005543828010559082, 0.0006524324417114258, 0.0007504820823669434, 0.0008485317230224609, 0.0009465813636779785, 0.001044631004333496, 0.0011426806449890137, 0.0012407302856445312, 0.0013387799263000488, 0.0014368295669555664, 0.001534879207611084, 0.0016329288482666016, 0.0017309784889221191, 0.0018290281295776367, 0.0019270777702331543, 0.002025127410888672, 0.0021231770515441895, 0.002221226692199707, 0.0023192763328552246, 0.002417325973510742, 0.0025153756141662598, 0.0026134252548217773, 0.002711474895477295, 0.0028095245361328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 5.0, 7.0, 8.0, 9.0, 24.0, 26.0, 42.0, 70.0, 117.0, 182.0, 340.0, 694.0, 1738.0, 5434.0, 28359.0, 575113.0, 403910.0, 24641.0, 4800.0, 1553.0, 676.0, 303.0, 189.0, 91.0, 54.0, 50.0, 34.0, 20.0, 18.0, 11.0, 12.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.15625, -17.60546875, -17.0546875, -16.50390625, -15.953125, -15.40234375, -14.8515625, -14.30078125, -13.75, -13.19921875, -12.6484375, -12.09765625, -11.546875, -10.99609375, -10.4453125, -9.89453125, -9.34375, -8.79296875, -8.2421875, -7.69140625, -7.140625, -6.58984375, -6.0390625, -5.48828125, -4.9375, -4.38671875, -3.8359375, -3.28515625, -2.734375, -2.18359375, -1.6328125, -1.08203125, -0.53125, 0.01953125, 0.5703125, 1.12109375, 1.671875, 2.22265625, 2.7734375, 3.32421875, 3.875, 4.42578125, 4.9765625, 5.52734375, 6.078125, 6.62890625, 7.1796875, 7.73046875, 8.28125, 8.83203125, 9.3828125, 9.93359375, 10.484375, 11.03515625, 11.5859375, 12.13671875, 12.6875, 13.23828125, 13.7890625, 14.33984375, 14.890625, 15.44140625, 15.9921875, 16.54296875, 17.09375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 8.0, 18.0, 17.0, 16.0, 25.0, 22.0, 49.0, 72.0, 63.0, 122.0, 122.0, 112.0, 80.0, 81.0, 45.0, 36.0, 32.0, 14.0, 13.0, 4.0, 14.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.6767578125, -11.283203125, -10.8896484375, -10.49609375, -10.1025390625, -9.708984375, -9.3154296875, -8.921875, -8.5283203125, -8.134765625, -7.7412109375, -7.34765625, -6.9541015625, -6.560546875, -6.1669921875, -5.7734375, -5.3798828125, -4.986328125, -4.5927734375, -4.19921875, -3.8056640625, -3.412109375, -3.0185546875, -2.625, -2.2314453125, -1.837890625, -1.4443359375, -1.05078125, -0.6572265625, -0.263671875, 0.1298828125, 0.5234375, 0.9169921875, 1.310546875, 1.7041015625, 2.09765625, 2.4912109375, 2.884765625, 3.2783203125, 3.671875, 4.0654296875, 4.458984375, 4.8525390625, 5.24609375, 5.6396484375, 6.033203125, 6.4267578125, 6.8203125, 7.2138671875, 7.607421875, 8.0009765625, 8.39453125, 8.7880859375, 9.181640625, 9.5751953125, 9.96875, 10.3623046875, 10.755859375, 11.1494140625, 11.54296875, 11.9365234375, 12.330078125, 12.7236328125, 13.1171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 67.0, 203.0, 474.0, 185.0, 43.0, 13.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-606.1787109375, -592.8401489257812, -579.5016479492188, -566.1630859375, -552.8245849609375, -539.4860229492188, -526.1475219726562, -512.8089599609375, -499.4704284667969, -486.13189697265625, -472.7933654785156, -459.454833984375, -446.1163024902344, -432.77777099609375, -419.439208984375, -406.1006774902344, -392.76214599609375, -379.4236145019531, -366.0850830078125, -352.7465515136719, -339.40802001953125, -326.0694580078125, -312.73095703125, -299.39239501953125, -286.05389404296875, -272.7153625488281, -259.3768310546875, -246.03829956054688, -232.6997528076172, -219.36122131347656, -206.02268981933594, -192.68414306640625, -179.34559631347656, -166.00706481933594, -152.6685333251953, -139.32998657226562, -125.991455078125, -112.65292358398438, -99.31439208984375, -85.9758529663086, -72.63732147216797, -59.29878616333008, -45.96025085449219, -32.62171936035156, -19.283184051513672, -5.944648742675781, 7.393882751464844, 20.732421875, 34.070953369140625, 47.409488677978516, 60.748023986816406, 74.08655548095703, 87.42509460449219, 100.76362609863281, 114.10215759277344, 127.4406967163086, 140.77923583984375, 154.11776733398438, 167.456298828125, 180.79483032226562, 194.1333770751953, 207.47190856933594, 220.81044006347656, 234.14898681640625, 247.4875030517578]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 1.0, 9.0, 7.0, 10.0, 9.0, 10.0, 16.0, 15.0, 28.0, 30.0, 41.0, 39.0, 46.0, 43.0, 60.0, 51.0, 72.0, 54.0, 56.0, 64.0, 46.0, 56.0, 38.0, 39.0, 30.0, 36.0, 16.0, 17.0, 16.0, 13.0, 10.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-149.04537963867188, -145.2171173095703, -141.3888702392578, -137.56060791015625, -133.73236083984375, -129.9040985107422, -126.07583618164062, -122.2475814819336, -118.41932678222656, -114.59107208251953, -110.7628173828125, -106.93455505371094, -103.1063003540039, -99.27804565429688, -95.44978332519531, -91.62152862548828, -87.79327392578125, -83.96501922607422, -80.13676452636719, -76.30850219726562, -72.4802474975586, -68.65199279785156, -64.82373046875, -60.99547576904297, -57.16722106933594, -53.338966369628906, -49.51070785522461, -45.68244934082031, -41.85419464111328, -38.02593994140625, -34.19768142700195, -30.36942481994629, -26.541168212890625, -22.71291160583496, -18.884654998779297, -15.056398391723633, -11.228141784667969, -7.399885177612305, -3.5716285705566406, 0.25662803649902344, 4.0848846435546875, 7.913141250610352, 11.741397857666016, 15.56965446472168, 19.397911071777344, 23.226167678833008, 27.054424285888672, 30.882680892944336, 34.7109375, 38.53919219970703, 42.36745071411133, 46.195709228515625, 50.023963928222656, 53.85221862792969, 57.680477142333984, 61.50873565673828, 65.33699035644531, 69.16524505615234, 72.99349975585938, 76.82176208496094, 80.65001678466797, 84.478271484375, 88.30653381347656, 92.1347885131836, 95.96304321289062]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 5.0, 12.0, 19.0, 20.0, 34.0, 42.0, 69.0, 96.0, 160.0, 269.0, 933.0, 55139.0, 4132557.0, 3936.0, 406.0, 180.0, 118.0, 73.0, 57.0, 49.0, 22.0, 19.0, 13.0, 8.0, 7.0, 9.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.125, -96.462890625, -93.80078125, -91.138671875, -88.4765625, -85.814453125, -83.15234375, -80.490234375, -77.828125, -75.166015625, -72.50390625, -69.841796875, -67.1796875, -64.517578125, -61.85546875, -59.193359375, -56.53125, -53.869140625, -51.20703125, -48.544921875, -45.8828125, -43.220703125, -40.55859375, -37.896484375, -35.234375, -32.572265625, -29.91015625, -27.248046875, -24.5859375, -21.923828125, -19.26171875, -16.599609375, -13.9375, -11.275390625, -8.61328125, -5.951171875, -3.2890625, -0.626953125, 2.03515625, 4.697265625, 7.359375, 10.021484375, 12.68359375, 15.345703125, 18.0078125, 20.669921875, 23.33203125, 25.994140625, 28.65625, 31.318359375, 33.98046875, 36.642578125, 39.3046875, 41.966796875, 44.62890625, 47.291015625, 49.953125, 52.615234375, 55.27734375, 57.939453125, 60.6015625, 63.263671875, 65.92578125, 68.587890625, 71.25]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 18.0, 11.0, 26.0, 36.0, 49.0, 53.0, 62.0, 67.0, 86.0, 96.0, 70.0, 77.0, 63.0, 72.0, 51.0, 31.0, 38.0, 24.0, 21.0, 17.0, 6.0, 10.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8125, -10.53607177734375, -10.2596435546875, -9.98321533203125, -9.706787109375, -9.43035888671875, -9.1539306640625, -8.87750244140625, -8.60107421875, -8.32464599609375, -8.0482177734375, -7.77178955078125, -7.495361328125, -7.21893310546875, -6.9425048828125, -6.66607666015625, -6.3896484375, -6.11322021484375, -5.8367919921875, -5.56036376953125, -5.283935546875, -5.00750732421875, -4.7310791015625, -4.45465087890625, -4.17822265625, -3.90179443359375, -3.6253662109375, -3.34893798828125, -3.072509765625, -2.79608154296875, -2.5196533203125, -2.24322509765625, -1.966796875, -1.69036865234375, -1.4139404296875, -1.13751220703125, -0.861083984375, -0.58465576171875, -0.3082275390625, -0.03179931640625, 0.24462890625, 0.52105712890625, 0.7974853515625, 1.07391357421875, 1.350341796875, 1.62677001953125, 1.9031982421875, 2.17962646484375, 2.4560546875, 2.73248291015625, 3.0089111328125, 3.28533935546875, 3.561767578125, 3.83819580078125, 4.1146240234375, 4.39105224609375, 4.66748046875, 4.94390869140625, 5.2203369140625, 5.49676513671875, 5.773193359375, 6.04962158203125, 6.3260498046875, 6.60247802734375, 6.87890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 17.0, 19.0, 46.0, 61.0, 87.0, 135.0, 305.0, 533.0, 1097.0, 2654.0, 7076.0, 25620.0, 252955.0, 3653848.0, 216295.0, 23015.0, 6286.0, 2218.0, 926.0, 441.0, 205.0, 153.0, 85.0, 63.0, 38.0, 24.0, 15.0, 9.0, 11.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8046875, -15.1590576171875, -14.513427734375, -13.8677978515625, -13.22216796875, -12.5765380859375, -11.930908203125, -11.2852783203125, -10.6396484375, -9.9940185546875, -9.348388671875, -8.7027587890625, -8.05712890625, -7.4114990234375, -6.765869140625, -6.1202392578125, -5.474609375, -4.8289794921875, -4.183349609375, -3.5377197265625, -2.89208984375, -2.2464599609375, -1.600830078125, -0.9552001953125, -0.3095703125, 0.3360595703125, 0.981689453125, 1.6273193359375, 2.27294921875, 2.9185791015625, 3.564208984375, 4.2098388671875, 4.85546875, 5.5010986328125, 6.146728515625, 6.7923583984375, 7.43798828125, 8.0836181640625, 8.729248046875, 9.3748779296875, 10.0205078125, 10.6661376953125, 11.311767578125, 11.9573974609375, 12.60302734375, 13.2486572265625, 13.894287109375, 14.5399169921875, 15.185546875, 15.8311767578125, 16.476806640625, 17.1224365234375, 17.76806640625, 18.4136962890625, 19.059326171875, 19.7049560546875, 20.3505859375, 20.9962158203125, 21.641845703125, 22.2874755859375, 22.93310546875, 23.5787353515625, 24.224365234375, 24.8699951171875, 25.515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 12.0, 16.0, 18.0, 43.0, 40.0, 96.0, 215.0, 472.0, 984.0, 1096.0, 592.0, 233.0, 105.0, 65.0, 22.0, 18.0, 5.0, 12.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.4375, -20.789794921875, -20.14208984375, -19.494384765625, -18.8466796875, -18.198974609375, -17.55126953125, -16.903564453125, -16.255859375, -15.608154296875, -14.96044921875, -14.312744140625, -13.6650390625, -13.017333984375, -12.36962890625, -11.721923828125, -11.07421875, -10.426513671875, -9.77880859375, -9.131103515625, -8.4833984375, -7.835693359375, -7.18798828125, -6.540283203125, -5.892578125, -5.244873046875, -4.59716796875, -3.949462890625, -3.3017578125, -2.654052734375, -2.00634765625, -1.358642578125, -0.7109375, -0.063232421875, 0.58447265625, 1.232177734375, 1.8798828125, 2.527587890625, 3.17529296875, 3.822998046875, 4.470703125, 5.118408203125, 5.76611328125, 6.413818359375, 7.0615234375, 7.709228515625, 8.35693359375, 9.004638671875, 9.65234375, 10.300048828125, 10.94775390625, 11.595458984375, 12.2431640625, 12.890869140625, 13.53857421875, 14.186279296875, 14.833984375, 15.481689453125, 16.12939453125, 16.777099609375, 17.4248046875, 18.072509765625, 18.72021484375, 19.367919921875, 20.015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 12.0, 29.0, 85.0, 181.0, 249.0, 232.0, 116.0, 41.0, 23.0, 12.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.39412689208984, -113.67118835449219, -106.9482421875, -100.22530364990234, -93.50235748291016, -86.7794189453125, -80.05647277832031, -73.33353424072266, -66.610595703125, -59.88765335083008, -53.164710998535156, -46.4417724609375, -39.71882629394531, -32.995887756347656, -26.272945404052734, -19.550003051757812, -12.827056884765625, -6.104115009307861, 0.6188268661499023, 7.341768264770508, 14.06471061706543, 20.78765106201172, 27.51059341430664, 34.23353576660156, 40.956478118896484, 47.679420471191406, 54.40236282348633, 61.12530517578125, 67.8482437133789, 74.57118225097656, 81.29412841796875, 88.01707458496094, 94.74000549316406, 101.46294403076172, 108.1858901977539, 114.90882873535156, 121.63177490234375, 128.35470581054688, 135.07765197753906, 141.80059814453125, 148.52354431152344, 155.24649047851562, 161.96942138671875, 168.69236755371094, 175.41531372070312, 182.13824462890625, 188.86119079589844, 195.58413696289062, 202.30706787109375, 209.03001403808594, 215.75294494628906, 222.47589111328125, 229.19883728027344, 235.92178344726562, 242.64471435546875, 249.36766052246094, 256.0906066894531, 262.81353759765625, 269.5364990234375, 276.2594299316406, 282.98236083984375, 289.705322265625, 296.4282531738281, 303.15118408203125, 309.8741455078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 8.0, 9.0, 8.0, 12.0, 14.0, 15.0, 19.0, 23.0, 27.0, 32.0, 35.0, 49.0, 49.0, 48.0, 40.0, 51.0, 57.0, 44.0, 57.0, 49.0, 51.0, 33.0, 49.0, 38.0, 28.0, 26.0, 20.0, 21.0, 18.0, 6.0, 15.0, 13.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-73.71693420410156, -71.59661102294922, -69.47628784179688, -67.35596466064453, -65.23564147949219, -63.115318298339844, -60.994991302490234, -58.87466812133789, -56.75434494018555, -54.6340217590332, -52.51369857788086, -50.393375396728516, -48.273048400878906, -46.15272521972656, -44.03240203857422, -41.912078857421875, -39.79175567626953, -37.67143249511719, -35.551109313964844, -33.4307861328125, -31.310461044311523, -29.19013786315918, -27.069812774658203, -24.94948959350586, -22.829166412353516, -20.708843231201172, -18.588520050048828, -16.46819496154785, -14.347871780395508, -12.227548599243164, -10.107224464416504, -7.986900329589844, -5.866569519042969, -3.746245861053467, -1.6259222030639648, 0.4944014549255371, 2.614725112915039, 4.735048294067383, 6.855372428894043, 8.975696563720703, 11.096019744873047, 13.21634292602539, 15.33666706085205, 17.45699119567871, 19.577314376831055, 21.6976375579834, 23.817962646484375, 25.93828582763672, 28.058609008789062, 30.178932189941406, 32.29925537109375, 34.419578552246094, 36.53990173339844, 38.66022491455078, 40.78055191040039, 42.900875091552734, 45.02119827270508, 47.14152145385742, 49.261844635009766, 51.38216781616211, 53.50249481201172, 55.62281799316406, 57.743141174316406, 59.86346435546875, 61.983787536621094]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 10.0, 26.0, 36.0, 64.0, 123.0, 204.0, 429.0, 863.0, 2072.0, 5443.0, 15316.0, 49287.0, 198369.0, 522963.0, 183569.0, 46229.0, 14687.0, 5151.0, 1898.0, 915.0, 400.0, 201.0, 119.0, 76.0, 30.0, 23.0, 18.0, 5.0, 9.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1796875, -13.6986083984375, -13.217529296875, -12.7364501953125, -12.25537109375, -11.7742919921875, -11.293212890625, -10.8121337890625, -10.3310546875, -9.8499755859375, -9.368896484375, -8.8878173828125, -8.40673828125, -7.9256591796875, -7.444580078125, -6.9635009765625, -6.482421875, -6.0013427734375, -5.520263671875, -5.0391845703125, -4.55810546875, -4.0770263671875, -3.595947265625, -3.1148681640625, -2.6337890625, -2.1527099609375, -1.671630859375, -1.1905517578125, -0.70947265625, -0.2283935546875, 0.252685546875, 0.7337646484375, 1.21484375, 1.6959228515625, 2.177001953125, 2.6580810546875, 3.13916015625, 3.6202392578125, 4.101318359375, 4.5823974609375, 5.0634765625, 5.5445556640625, 6.025634765625, 6.5067138671875, 6.98779296875, 7.4688720703125, 7.949951171875, 8.4310302734375, 8.912109375, 9.3931884765625, 9.874267578125, 10.3553466796875, 10.83642578125, 11.3175048828125, 11.798583984375, 12.2796630859375, 12.7607421875, 13.2418212890625, 13.722900390625, 14.2039794921875, 14.68505859375, 15.1661376953125, 15.647216796875, 16.1282958984375, 16.609375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 8.0, 5.0, 7.0, 6.0, 9.0, 15.0, 18.0, 23.0, 21.0, 17.0, 29.0, 35.0, 31.0, 41.0, 40.0, 46.0, 47.0, 48.0, 61.0, 43.0, 49.0, 46.0, 44.0, 40.0, 45.0, 45.0, 28.0, 28.0, 24.0, 16.0, 21.0, 16.0, 10.0, 6.0, 10.0, 5.0, 4.0, 9.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9140625, -5.72900390625, -5.5439453125, -5.35888671875, -5.173828125, -4.98876953125, -4.8037109375, -4.61865234375, -4.43359375, -4.24853515625, -4.0634765625, -3.87841796875, -3.693359375, -3.50830078125, -3.3232421875, -3.13818359375, -2.953125, -2.76806640625, -2.5830078125, -2.39794921875, -2.212890625, -2.02783203125, -1.8427734375, -1.65771484375, -1.47265625, -1.28759765625, -1.1025390625, -0.91748046875, -0.732421875, -0.54736328125, -0.3623046875, -0.17724609375, 0.0078125, 0.19287109375, 0.3779296875, 0.56298828125, 0.748046875, 0.93310546875, 1.1181640625, 1.30322265625, 1.48828125, 1.67333984375, 1.8583984375, 2.04345703125, 2.228515625, 2.41357421875, 2.5986328125, 2.78369140625, 2.96875, 3.15380859375, 3.3388671875, 3.52392578125, 3.708984375, 3.89404296875, 4.0791015625, 4.26416015625, 4.44921875, 4.63427734375, 4.8193359375, 5.00439453125, 5.189453125, 5.37451171875, 5.5595703125, 5.74462890625, 5.9296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 15.0, 34.0, 49.0, 90.0, 145.0, 285.0, 713.0, 2082.0, 11139.0, 169772.0, 821350.0, 36270.0, 4475.0, 1240.0, 454.0, 186.0, 94.0, 65.0, 30.0, 18.0, 15.0, 9.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.53125, -33.26416015625, -31.9970703125, -30.72998046875, -29.462890625, -28.19580078125, -26.9287109375, -25.66162109375, -24.39453125, -23.12744140625, -21.8603515625, -20.59326171875, -19.326171875, -18.05908203125, -16.7919921875, -15.52490234375, -14.2578125, -12.99072265625, -11.7236328125, -10.45654296875, -9.189453125, -7.92236328125, -6.6552734375, -5.38818359375, -4.12109375, -2.85400390625, -1.5869140625, -0.31982421875, 0.947265625, 2.21435546875, 3.4814453125, 4.74853515625, 6.015625, 7.28271484375, 8.5498046875, 9.81689453125, 11.083984375, 12.35107421875, 13.6181640625, 14.88525390625, 16.15234375, 17.41943359375, 18.6865234375, 19.95361328125, 21.220703125, 22.48779296875, 23.7548828125, 25.02197265625, 26.2890625, 27.55615234375, 28.8232421875, 30.09033203125, 31.357421875, 32.62451171875, 33.8916015625, 35.15869140625, 36.42578125, 37.69287109375, 38.9599609375, 40.22705078125, 41.494140625, 42.76123046875, 44.0283203125, 45.29541015625, 46.5625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 5.0, 12.0, 13.0, 11.0, 26.0, 21.0, 22.0, 26.0, 35.0, 34.0, 46.0, 44.0, 50.0, 50.0, 53.0, 51.0, 49.0, 61.0, 48.0, 47.0, 37.0, 43.0, 25.0, 35.0, 30.0, 20.0, 15.0, 24.0, 16.0, 10.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-27.484375, -26.662841796875, -25.84130859375, -25.019775390625, -24.1982421875, -23.376708984375, -22.55517578125, -21.733642578125, -20.912109375, -20.090576171875, -19.26904296875, -18.447509765625, -17.6259765625, -16.804443359375, -15.98291015625, -15.161376953125, -14.33984375, -13.518310546875, -12.69677734375, -11.875244140625, -11.0537109375, -10.232177734375, -9.41064453125, -8.589111328125, -7.767578125, -6.946044921875, -6.12451171875, -5.302978515625, -4.4814453125, -3.659912109375, -2.83837890625, -2.016845703125, -1.1953125, -0.373779296875, 0.44775390625, 1.269287109375, 2.0908203125, 2.912353515625, 3.73388671875, 4.555419921875, 5.376953125, 6.198486328125, 7.02001953125, 7.841552734375, 8.6630859375, 9.484619140625, 10.30615234375, 11.127685546875, 11.94921875, 12.770751953125, 13.59228515625, 14.413818359375, 15.2353515625, 16.056884765625, 16.87841796875, 17.699951171875, 18.521484375, 19.343017578125, 20.16455078125, 20.986083984375, 21.8076171875, 22.629150390625, 23.45068359375, 24.272216796875, 25.09375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 16.0, 22.0, 31.0, 40.0, 71.0, 133.0, 210.0, 623.0, 1929.0, 10416.0, 664264.0, 358883.0, 9002.0, 1756.0, 575.0, 242.0, 116.0, 69.0, 41.0, 27.0, 17.0, 13.0, 12.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.0625, -33.0595703125, -32.056640625, -31.0537109375, -30.05078125, -29.0478515625, -28.044921875, -27.0419921875, -26.0390625, -25.0361328125, -24.033203125, -23.0302734375, -22.02734375, -21.0244140625, -20.021484375, -19.0185546875, -18.015625, -17.0126953125, -16.009765625, -15.0068359375, -14.00390625, -13.0009765625, -11.998046875, -10.9951171875, -9.9921875, -8.9892578125, -7.986328125, -6.9833984375, -5.98046875, -4.9775390625, -3.974609375, -2.9716796875, -1.96875, -0.9658203125, 0.037109375, 1.0400390625, 2.04296875, 3.0458984375, 4.048828125, 5.0517578125, 6.0546875, 7.0576171875, 8.060546875, 9.0634765625, 10.06640625, 11.0693359375, 12.072265625, 13.0751953125, 14.078125, 15.0810546875, 16.083984375, 17.0869140625, 18.08984375, 19.0927734375, 20.095703125, 21.0986328125, 22.1015625, 23.1044921875, 24.107421875, 25.1103515625, 26.11328125, 27.1162109375, 28.119140625, 29.1220703125, 30.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 13.0, 19.0, 34.0, 55.0, 124.0, 323.0, 216.0, 104.0, 34.0, 23.0, 7.0, 14.0, 4.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0047760009765625, -0.004620969295501709, -0.004465937614440918, -0.004310905933380127, -0.004155874252319336, -0.004000842571258545, -0.003845810890197754, -0.003690779209136963, -0.003535747528076172, -0.003380715847015381, -0.00322568416595459, -0.003070652484893799, -0.002915620803833008, -0.002760589122772217, -0.0026055574417114258, -0.0024505257606506348, -0.0022954940795898438, -0.0021404623985290527, -0.0019854307174682617, -0.0018303990364074707, -0.0016753673553466797, -0.0015203356742858887, -0.0013653039932250977, -0.0012102723121643066, -0.0010552406311035156, -0.0009002089500427246, -0.0007451772689819336, -0.0005901455879211426, -0.00043511390686035156, -0.00028008222579956055, -0.00012505054473876953, 2.9981136322021484e-05, 0.0001850128173828125, 0.0003400444984436035, 0.0004950761795043945, 0.0006501078605651855, 0.0008051395416259766, 0.0009601712226867676, 0.0011152029037475586, 0.0012702345848083496, 0.0014252662658691406, 0.0015802979469299316, 0.0017353296279907227, 0.0018903613090515137, 0.0020453929901123047, 0.0022004246711730957, 0.0023554563522338867, 0.0025104880332946777, 0.0026655197143554688, 0.0028205513954162598, 0.0029755830764770508, 0.003130614757537842, 0.003285646438598633, 0.003440678119659424, 0.003595709800720215, 0.003750741481781006, 0.003905773162841797, 0.004060804843902588, 0.004215836524963379, 0.00437086820602417, 0.004525899887084961, 0.004680931568145752, 0.004835963249206543, 0.004990994930267334, 0.005146026611328125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 11.0, 8.0, 12.0, 18.0, 31.0, 36.0, 57.0, 120.0, 208.0, 514.0, 1557.0, 6959.0, 76768.0, 916889.0, 38425.0, 4785.0, 1238.0, 454.0, 199.0, 103.0, 54.0, 42.0, 24.0, 16.0, 9.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.0322265625, -18.251953125, -17.4716796875, -16.69140625, -15.9111328125, -15.130859375, -14.3505859375, -13.5703125, -12.7900390625, -12.009765625, -11.2294921875, -10.44921875, -9.6689453125, -8.888671875, -8.1083984375, -7.328125, -6.5478515625, -5.767578125, -4.9873046875, -4.20703125, -3.4267578125, -2.646484375, -1.8662109375, -1.0859375, -0.3056640625, 0.474609375, 1.2548828125, 2.03515625, 2.8154296875, 3.595703125, 4.3759765625, 5.15625, 5.9365234375, 6.716796875, 7.4970703125, 8.27734375, 9.0576171875, 9.837890625, 10.6181640625, 11.3984375, 12.1787109375, 12.958984375, 13.7392578125, 14.51953125, 15.2998046875, 16.080078125, 16.8603515625, 17.640625, 18.4208984375, 19.201171875, 19.9814453125, 20.76171875, 21.5419921875, 22.322265625, 23.1025390625, 23.8828125, 24.6630859375, 25.443359375, 26.2236328125, 27.00390625, 27.7841796875, 28.564453125, 29.3447265625, 30.125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 7.0, 14.0, 17.0, 43.0, 64.0, 154.0, 262.0, 201.0, 96.0, 49.0, 32.0, 17.0, 18.0, 12.0, 4.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.546875, -30.824462890625, -30.10205078125, -29.379638671875, -28.6572265625, -27.934814453125, -27.21240234375, -26.489990234375, -25.767578125, -25.045166015625, -24.32275390625, -23.600341796875, -22.8779296875, -22.155517578125, -21.43310546875, -20.710693359375, -19.98828125, -19.265869140625, -18.54345703125, -17.821044921875, -17.0986328125, -16.376220703125, -15.65380859375, -14.931396484375, -14.208984375, -13.486572265625, -12.76416015625, -12.041748046875, -11.3193359375, -10.596923828125, -9.87451171875, -9.152099609375, -8.4296875, -7.707275390625, -6.98486328125, -6.262451171875, -5.5400390625, -4.817626953125, -4.09521484375, -3.372802734375, -2.650390625, -1.927978515625, -1.20556640625, -0.483154296875, 0.2392578125, 0.961669921875, 1.68408203125, 2.406494140625, 3.12890625, 3.851318359375, 4.57373046875, 5.296142578125, 6.0185546875, 6.740966796875, 7.46337890625, 8.185791015625, 8.908203125, 9.630615234375, 10.35302734375, 11.075439453125, 11.7978515625, 12.520263671875, 13.24267578125, 13.965087890625, 14.6875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 13.0, 58.0, 364.0, 429.0, 95.0, 34.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-691.30908203125, -673.5811157226562, -655.8531494140625, -638.1251220703125, -620.3971557617188, -602.669189453125, -584.941162109375, -567.2131958007812, -549.4852294921875, -531.7572631835938, -514.029296875, -496.30126953125, -478.57330322265625, -460.8453369140625, -443.1173400878906, -425.38934326171875, -407.661376953125, -389.93341064453125, -372.2054138183594, -354.4774169921875, -336.74945068359375, -319.021484375, -301.2934875488281, -283.56549072265625, -265.8375244140625, -248.1095428466797, -230.38156127929688, -212.65357971191406, -194.92559814453125, -177.19761657714844, -159.46963500976562, -141.7416534423828, -124.01370239257812, -106.28572082519531, -88.5577392578125, -70.82975769042969, -53.101776123046875, -35.37379455566406, -17.64581298828125, 0.0821685791015625, 17.810150146484375, 35.53813171386719, 53.26611328125, 70.99409484863281, 88.72207641601562, 106.45005798339844, 124.17803955078125, 141.90602111816406, 159.63400268554688, 177.3619842529297, 195.0899658203125, 212.8179473876953, 230.54592895507812, 248.27391052246094, 266.00189208984375, 283.7298583984375, 301.4578552246094, 319.18585205078125, 336.913818359375, 354.64178466796875, 372.3697814941406, 390.0977783203125, 407.82574462890625, 425.5537109375, 443.2817077636719]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 3.0, 7.0, 8.0, 11.0, 14.0, 20.0, 19.0, 20.0, 26.0, 34.0, 41.0, 46.0, 46.0, 53.0, 59.0, 89.0, 82.0, 70.0, 58.0, 53.0, 49.0, 48.0, 30.0, 17.0, 24.0, 16.0, 18.0, 13.0, 10.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-162.4191131591797, -157.65037536621094, -152.88165283203125, -148.1129150390625, -143.34417724609375, -138.575439453125, -133.8067169189453, -129.03797912597656, -124.26924896240234, -119.50051879882812, -114.73178100585938, -109.96305084228516, -105.19432067871094, -100.42558288574219, -95.65685272216797, -90.88812255859375, -86.119384765625, -81.35065460205078, -76.58191680908203, -71.81318664550781, -67.04444885253906, -62.275718688964844, -57.506988525390625, -52.73825454711914, -47.969520568847656, -43.20078659057617, -38.43205261230469, -33.66332244873047, -28.894588470458984, -24.1258544921875, -19.35712242126465, -14.588390350341797, -9.819671630859375, -5.050938606262207, -0.28220558166503906, 4.486527442932129, 9.255260467529297, 14.023994445800781, 18.792726516723633, 23.561458587646484, 28.33019256591797, 33.09892654418945, 37.86766052246094, 42.636390686035156, 47.40512466430664, 52.173858642578125, 56.942588806152344, 61.71132278442383, 66.48005676269531, 71.24878692626953, 76.01752471923828, 80.7862548828125, 85.55499267578125, 90.32372283935547, 95.09245300292969, 99.86119079589844, 104.62992095947266, 109.39865112304688, 114.16738891601562, 118.93611907958984, 123.70484924316406, 128.4735870361328, 133.24232482910156, 138.01104736328125, 142.77978515625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 8.0, 6.0, 6.0, 11.0, 8.0, 14.0, 16.0, 29.0, 36.0, 50.0, 78.0, 104.0, 166.0, 257.0, 476.0, 951.0, 2016.0, 4909.0, 14659.0, 70174.0, 1424708.0, 2539906.0, 106425.0, 18575.0, 5924.0, 2452.0, 1032.0, 529.0, 266.0, 162.0, 98.0, 65.0, 42.0, 40.0, 13.0, 22.0, 7.0, 12.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-18.109375, -17.562255859375, -17.01513671875, -16.468017578125, -15.9208984375, -15.373779296875, -14.82666015625, -14.279541015625, -13.732421875, -13.185302734375, -12.63818359375, -12.091064453125, -11.5439453125, -10.996826171875, -10.44970703125, -9.902587890625, -9.35546875, -8.808349609375, -8.26123046875, -7.714111328125, -7.1669921875, -6.619873046875, -6.07275390625, -5.525634765625, -4.978515625, -4.431396484375, -3.88427734375, -3.337158203125, -2.7900390625, -2.242919921875, -1.69580078125, -1.148681640625, -0.6015625, -0.054443359375, 0.49267578125, 1.039794921875, 1.5869140625, 2.134033203125, 2.68115234375, 3.228271484375, 3.775390625, 4.322509765625, 4.86962890625, 5.416748046875, 5.9638671875, 6.510986328125, 7.05810546875, 7.605224609375, 8.15234375, 8.699462890625, 9.24658203125, 9.793701171875, 10.3408203125, 10.887939453125, 11.43505859375, 11.982177734375, 12.529296875, 13.076416015625, 13.62353515625, 14.170654296875, 14.7177734375, 15.264892578125, 15.81201171875, 16.359130859375, 16.90625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 2.0, 9.0, 14.0, 21.0, 26.0, 31.0, 36.0, 50.0, 63.0, 61.0, 89.0, 61.0, 58.0, 57.0, 71.0, 66.0, 50.0, 44.0, 44.0, 29.0, 25.0, 16.0, 20.0, 12.0, 15.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.04229736328125, -4.7994384765625, -4.55657958984375, -4.313720703125, -4.07086181640625, -3.8280029296875, -3.58514404296875, -3.34228515625, -3.09942626953125, -2.8565673828125, -2.61370849609375, -2.370849609375, -2.12799072265625, -1.8851318359375, -1.64227294921875, -1.3994140625, -1.15655517578125, -0.9136962890625, -0.67083740234375, -0.427978515625, -0.18511962890625, 0.0577392578125, 0.30059814453125, 0.54345703125, 0.78631591796875, 1.0291748046875, 1.27203369140625, 1.514892578125, 1.75775146484375, 2.0006103515625, 2.24346923828125, 2.486328125, 2.72918701171875, 2.9720458984375, 3.21490478515625, 3.457763671875, 3.70062255859375, 3.9434814453125, 4.18634033203125, 4.42919921875, 4.67205810546875, 4.9149169921875, 5.15777587890625, 5.400634765625, 5.64349365234375, 5.8863525390625, 6.12921142578125, 6.3720703125, 6.61492919921875, 6.8577880859375, 7.10064697265625, 7.343505859375, 7.58636474609375, 7.8292236328125, 8.07208251953125, 8.31494140625, 8.55780029296875, 8.8006591796875, 9.04351806640625, 9.286376953125, 9.52923583984375, 9.7720947265625, 10.01495361328125, 10.2578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 16.0, 23.0, 30.0, 40.0, 72.0, 136.0, 256.0, 536.0, 1361.0, 4785.0, 26969.0, 475258.0, 3559770.0, 108897.0, 11974.0, 2616.0, 863.0, 350.0, 156.0, 68.0, 37.0, 22.0, 16.0, 11.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.75, -28.906982421875, -28.06396484375, -27.220947265625, -26.3779296875, -25.534912109375, -24.69189453125, -23.848876953125, -23.005859375, -22.162841796875, -21.31982421875, -20.476806640625, -19.6337890625, -18.790771484375, -17.94775390625, -17.104736328125, -16.26171875, -15.418701171875, -14.57568359375, -13.732666015625, -12.8896484375, -12.046630859375, -11.20361328125, -10.360595703125, -9.517578125, -8.674560546875, -7.83154296875, -6.988525390625, -6.1455078125, -5.302490234375, -4.45947265625, -3.616455078125, -2.7734375, -1.930419921875, -1.08740234375, -0.244384765625, 0.5986328125, 1.441650390625, 2.28466796875, 3.127685546875, 3.970703125, 4.813720703125, 5.65673828125, 6.499755859375, 7.3427734375, 8.185791015625, 9.02880859375, 9.871826171875, 10.71484375, 11.557861328125, 12.40087890625, 13.243896484375, 14.0869140625, 14.929931640625, 15.77294921875, 16.615966796875, 17.458984375, 18.302001953125, 19.14501953125, 19.988037109375, 20.8310546875, 21.674072265625, 22.51708984375, 23.360107421875, 24.203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 7.0, 9.0, 10.0, 30.0, 32.0, 60.0, 102.0, 205.0, 372.0, 786.0, 1072.0, 658.0, 323.0, 169.0, 95.0, 50.0, 37.0, 17.0, 14.0, 7.0, 10.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.859375, -29.082763671875, -28.30615234375, -27.529541015625, -26.7529296875, -25.976318359375, -25.19970703125, -24.423095703125, -23.646484375, -22.869873046875, -22.09326171875, -21.316650390625, -20.5400390625, -19.763427734375, -18.98681640625, -18.210205078125, -17.43359375, -16.656982421875, -15.88037109375, -15.103759765625, -14.3271484375, -13.550537109375, -12.77392578125, -11.997314453125, -11.220703125, -10.444091796875, -9.66748046875, -8.890869140625, -8.1142578125, -7.337646484375, -6.56103515625, -5.784423828125, -5.0078125, -4.231201171875, -3.45458984375, -2.677978515625, -1.9013671875, -1.124755859375, -0.34814453125, 0.428466796875, 1.205078125, 1.981689453125, 2.75830078125, 3.534912109375, 4.3115234375, 5.088134765625, 5.86474609375, 6.641357421875, 7.41796875, 8.194580078125, 8.97119140625, 9.747802734375, 10.5244140625, 11.301025390625, 12.07763671875, 12.854248046875, 13.630859375, 14.407470703125, 15.18408203125, 15.960693359375, 16.7373046875, 17.513916015625, 18.29052734375, 19.067138671875, 19.84375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 17.0, 33.0, 115.0, 307.0, 314.0, 153.0, 30.0, 19.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-532.1575317382812, -520.6707763671875, -509.18402099609375, -497.697265625, -486.21051025390625, -474.7237548828125, -463.23699951171875, -451.7502136230469, -440.2634582519531, -428.7767028808594, -417.2899475097656, -405.8031921386719, -394.3164367675781, -382.82965087890625, -371.3428955078125, -359.85614013671875, -348.369384765625, -336.88262939453125, -325.3958740234375, -313.90911865234375, -302.42236328125, -290.93560791015625, -279.4488525390625, -267.9620666503906, -256.475341796875, -244.98858642578125, -233.5018310546875, -222.01507568359375, -210.52830505371094, -199.0415496826172, -187.55479431152344, -176.06802368164062, -164.58126831054688, -153.09451293945312, -141.60775756835938, -130.12100219726562, -118.63423156738281, -107.14747619628906, -95.66072082519531, -84.17395782470703, -72.68720245361328, -61.200443267822266, -49.71368408203125, -38.2269287109375, -26.740169525146484, -15.253410339355469, -3.7666549682617188, 7.7201080322265625, 19.206863403320312, 30.693622589111328, 42.180381774902344, 53.667137145996094, 65.15390014648438, 76.64065551757812, 88.12741088867188, 99.61417388916016, 111.1009292602539, 122.58768463134766, 134.07444763183594, 145.5612030029297, 157.04795837402344, 168.53472900390625, 180.021484375, 191.50823974609375, 202.9949951171875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 10.0, 12.0, 6.0, 8.0, 15.0, 16.0, 24.0, 32.0, 38.0, 37.0, 31.0, 34.0, 40.0, 52.0, 48.0, 48.0, 55.0, 55.0, 36.0, 40.0, 57.0, 44.0, 41.0, 35.0, 34.0, 20.0, 20.0, 23.0, 14.0, 17.0, 15.0, 11.0, 9.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.20802307128906, -91.28093719482422, -88.35384368896484, -85.4267578125, -82.49967193603516, -79.57258605957031, -76.64549255371094, -73.7184066772461, -70.79132080078125, -67.8642349243164, -64.93714141845703, -62.01005554199219, -59.082969665527344, -56.155879974365234, -53.228790283203125, -50.30170440673828, -47.374610900878906, -44.4475212097168, -41.52043533325195, -38.593345642089844, -35.666259765625, -32.73917007446289, -29.81208038330078, -26.884992599487305, -23.957904815673828, -21.03081703186035, -18.103729248046875, -15.176639556884766, -12.249551773071289, -9.322463989257812, -6.395374298095703, -3.4682865142822266, -0.5412063598632812, 2.3858819007873535, 5.312970161437988, 8.240058898925781, 11.167146682739258, 14.094234466552734, 17.021324157714844, 19.94841194152832, 22.875499725341797, 25.802587509155273, 28.72967529296875, 31.65676498413086, 34.58385467529297, 37.51094055175781, 40.43803024291992, 43.36511993408203, 46.292205810546875, 49.219295501708984, 52.14638137817383, 55.07347106933594, 58.00055694580078, 60.92764663696289, 63.854736328125, 66.78182220458984, 69.70890808105469, 72.63599395751953, 75.5630874633789, 78.49017333984375, 81.4172592163086, 84.34434509277344, 87.27143859863281, 90.19852447509766, 93.12561798095703]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 11.0, 13.0, 13.0, 22.0, 34.0, 46.0, 101.0, 141.0, 231.0, 441.0, 885.0, 1872.0, 4865.0, 13932.0, 45036.0, 162263.0, 461985.0, 255141.0, 68966.0, 20563.0, 6941.0, 2561.0, 1190.0, 549.0, 284.0, 189.0, 88.0, 54.0, 41.0, 28.0, 18.0, 15.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.34375, -15.843505859375, -15.34326171875, -14.843017578125, -14.3427734375, -13.842529296875, -13.34228515625, -12.842041015625, -12.341796875, -11.841552734375, -11.34130859375, -10.841064453125, -10.3408203125, -9.840576171875, -9.34033203125, -8.840087890625, -8.33984375, -7.839599609375, -7.33935546875, -6.839111328125, -6.3388671875, -5.838623046875, -5.33837890625, -4.838134765625, -4.337890625, -3.837646484375, -3.33740234375, -2.837158203125, -2.3369140625, -1.836669921875, -1.33642578125, -0.836181640625, -0.3359375, 0.164306640625, 0.66455078125, 1.164794921875, 1.6650390625, 2.165283203125, 2.66552734375, 3.165771484375, 3.666015625, 4.166259765625, 4.66650390625, 5.166748046875, 5.6669921875, 6.167236328125, 6.66748046875, 7.167724609375, 7.66796875, 8.168212890625, 8.66845703125, 9.168701171875, 9.6689453125, 10.169189453125, 10.66943359375, 11.169677734375, 11.669921875, 12.170166015625, 12.67041015625, 13.170654296875, 13.6708984375, 14.171142578125, 14.67138671875, 15.171630859375, 15.671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 7.0, 13.0, 23.0, 32.0, 29.0, 44.0, 52.0, 40.0, 52.0, 58.0, 59.0, 63.0, 63.0, 56.0, 53.0, 52.0, 45.0, 46.0, 37.0, 35.0, 28.0, 25.0, 15.0, 19.0, 10.0, 8.0, 7.0, 9.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.234619140625, -8.00830078125, -7.781982421875, -7.5556640625, -7.329345703125, -7.10302734375, -6.876708984375, -6.650390625, -6.424072265625, -6.19775390625, -5.971435546875, -5.7451171875, -5.518798828125, -5.29248046875, -5.066162109375, -4.83984375, -4.613525390625, -4.38720703125, -4.160888671875, -3.9345703125, -3.708251953125, -3.48193359375, -3.255615234375, -3.029296875, -2.802978515625, -2.57666015625, -2.350341796875, -2.1240234375, -1.897705078125, -1.67138671875, -1.445068359375, -1.21875, -0.992431640625, -0.76611328125, -0.539794921875, -0.3134765625, -0.087158203125, 0.13916015625, 0.365478515625, 0.591796875, 0.818115234375, 1.04443359375, 1.270751953125, 1.4970703125, 1.723388671875, 1.94970703125, 2.176025390625, 2.40234375, 2.628662109375, 2.85498046875, 3.081298828125, 3.3076171875, 3.533935546875, 3.76025390625, 3.986572265625, 4.212890625, 4.439208984375, 4.66552734375, 4.891845703125, 5.1181640625, 5.344482421875, 5.57080078125, 5.797119140625, 6.0234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 12.0, 10.0, 16.0, 22.0, 53.0, 71.0, 134.0, 210.0, 393.0, 833.0, 1793.0, 5301.0, 31580.0, 694975.0, 287569.0, 18762.0, 3863.0, 1383.0, 673.0, 370.0, 186.0, 139.0, 79.0, 42.0, 28.0, 16.0, 8.0, 10.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -33.93896484375, -32.7216796875, -31.50439453125, -30.287109375, -29.06982421875, -27.8525390625, -26.63525390625, -25.41796875, -24.20068359375, -22.9833984375, -21.76611328125, -20.548828125, -19.33154296875, -18.1142578125, -16.89697265625, -15.6796875, -14.46240234375, -13.2451171875, -12.02783203125, -10.810546875, -9.59326171875, -8.3759765625, -7.15869140625, -5.94140625, -4.72412109375, -3.5068359375, -2.28955078125, -1.072265625, 0.14501953125, 1.3623046875, 2.57958984375, 3.796875, 5.01416015625, 6.2314453125, 7.44873046875, 8.666015625, 9.88330078125, 11.1005859375, 12.31787109375, 13.53515625, 14.75244140625, 15.9697265625, 17.18701171875, 18.404296875, 19.62158203125, 20.8388671875, 22.05615234375, 23.2734375, 24.49072265625, 25.7080078125, 26.92529296875, 28.142578125, 29.35986328125, 30.5771484375, 31.79443359375, 33.01171875, 34.22900390625, 35.4462890625, 36.66357421875, 37.880859375, 39.09814453125, 40.3154296875, 41.53271484375, 42.75]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 13.0, 11.0, 21.0, 12.0, 18.0, 15.0, 27.0, 23.0, 28.0, 33.0, 41.0, 39.0, 36.0, 34.0, 52.0, 44.0, 44.0, 43.0, 44.0, 38.0, 35.0, 36.0, 36.0, 37.0, 30.0, 31.0, 22.0, 20.0, 24.0, 13.0, 13.0, 12.0, 9.0, 9.0, 9.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.53125, -22.79931640625, -22.0673828125, -21.33544921875, -20.603515625, -19.87158203125, -19.1396484375, -18.40771484375, -17.67578125, -16.94384765625, -16.2119140625, -15.47998046875, -14.748046875, -14.01611328125, -13.2841796875, -12.55224609375, -11.8203125, -11.08837890625, -10.3564453125, -9.62451171875, -8.892578125, -8.16064453125, -7.4287109375, -6.69677734375, -5.96484375, -5.23291015625, -4.5009765625, -3.76904296875, -3.037109375, -2.30517578125, -1.5732421875, -0.84130859375, -0.109375, 0.62255859375, 1.3544921875, 2.08642578125, 2.818359375, 3.55029296875, 4.2822265625, 5.01416015625, 5.74609375, 6.47802734375, 7.2099609375, 7.94189453125, 8.673828125, 9.40576171875, 10.1376953125, 10.86962890625, 11.6015625, 12.33349609375, 13.0654296875, 13.79736328125, 14.529296875, 15.26123046875, 15.9931640625, 16.72509765625, 17.45703125, 18.18896484375, 18.9208984375, 19.65283203125, 20.384765625, 21.11669921875, 21.8486328125, 22.58056640625, 23.3125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 9.0, 8.0, 4.0, 11.0, 22.0, 22.0, 27.0, 44.0, 53.0, 76.0, 118.0, 156.0, 335.0, 585.0, 1223.0, 2908.0, 8520.0, 34861.0, 239735.0, 674432.0, 64407.0, 13316.0, 4242.0, 1644.0, 728.0, 417.0, 200.0, 133.0, 77.0, 64.0, 51.0, 30.0, 19.0, 20.0, 12.0, 10.0, 9.0, 6.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.0467529296875, -10.624755859375, -10.2027587890625, -9.78076171875, -9.3587646484375, -8.936767578125, -8.5147705078125, -8.0927734375, -7.6707763671875, -7.248779296875, -6.8267822265625, -6.40478515625, -5.9827880859375, -5.560791015625, -5.1387939453125, -4.716796875, -4.2947998046875, -3.872802734375, -3.4508056640625, -3.02880859375, -2.6068115234375, -2.184814453125, -1.7628173828125, -1.3408203125, -0.9188232421875, -0.496826171875, -0.0748291015625, 0.34716796875, 0.7691650390625, 1.191162109375, 1.6131591796875, 2.03515625, 2.4571533203125, 2.879150390625, 3.3011474609375, 3.72314453125, 4.1451416015625, 4.567138671875, 4.9891357421875, 5.4111328125, 5.8331298828125, 6.255126953125, 6.6771240234375, 7.09912109375, 7.5211181640625, 7.943115234375, 8.3651123046875, 8.787109375, 9.2091064453125, 9.631103515625, 10.0531005859375, 10.47509765625, 10.8970947265625, 11.319091796875, 11.7410888671875, 12.1630859375, 12.5850830078125, 13.007080078125, 13.4290771484375, 13.85107421875, 14.2730712890625, 14.695068359375, 15.1170654296875, 15.5390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 19.0, 36.0, 41.0, 53.0, 88.0, 186.0, 260.0, 111.0, 56.0, 50.0, 30.0, 22.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.009490966796875, -0.009289741516113281, -0.009088516235351562, -0.008887290954589844, -0.008686065673828125, -0.008484840393066406, -0.008283615112304688, -0.008082389831542969, -0.00788116455078125, -0.007679939270019531, -0.0074787139892578125, -0.007277488708496094, -0.007076263427734375, -0.006875038146972656, -0.0066738128662109375, -0.006472587585449219, -0.0062713623046875, -0.006070137023925781, -0.0058689117431640625, -0.005667686462402344, -0.005466461181640625, -0.005265235900878906, -0.0050640106201171875, -0.004862785339355469, -0.00466156005859375, -0.004460334777832031, -0.0042591094970703125, -0.004057884216308594, -0.003856658935546875, -0.0036554336547851562, -0.0034542083740234375, -0.0032529830932617188, -0.0030517578125, -0.0028505325317382812, -0.0026493072509765625, -0.0024480819702148438, -0.002246856689453125, -0.0020456314086914062, -0.0018444061279296875, -0.0016431808471679688, -0.00144195556640625, -0.0012407302856445312, -0.0010395050048828125, -0.0008382797241210938, -0.000637054443359375, -0.00043582916259765625, -0.0002346038818359375, -3.337860107421875e-05, 0.0001678466796875, 0.00036907196044921875, 0.0005702972412109375, 0.0007715225219726562, 0.000972747802734375, 0.0011739730834960938, 0.0013751983642578125, 0.0015764236450195312, 0.00177764892578125, 0.0019788742065429688, 0.0021800994873046875, 0.0023813247680664062, 0.002582550048828125, 0.0027837753295898438, 0.0029850006103515625, 0.0031862258911132812, 0.003387451171875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 9.0, 7.0, 6.0, 18.0, 16.0, 23.0, 29.0, 52.0, 69.0, 91.0, 125.0, 260.0, 372.0, 588.0, 1055.0, 2113.0, 4801.0, 13305.0, 52475.0, 578033.0, 331602.0, 43284.0, 11354.0, 4323.0, 1907.0, 1033.0, 560.0, 358.0, 201.0, 139.0, 84.0, 56.0, 41.0, 36.0, 20.0, 19.0, 17.0, 8.0, 7.0, 11.0, 11.0, 4.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1640625, -12.724365234375, -12.28466796875, -11.844970703125, -11.4052734375, -10.965576171875, -10.52587890625, -10.086181640625, -9.646484375, -9.206787109375, -8.76708984375, -8.327392578125, -7.8876953125, -7.447998046875, -7.00830078125, -6.568603515625, -6.12890625, -5.689208984375, -5.24951171875, -4.809814453125, -4.3701171875, -3.930419921875, -3.49072265625, -3.051025390625, -2.611328125, -2.171630859375, -1.73193359375, -1.292236328125, -0.8525390625, -0.412841796875, 0.02685546875, 0.466552734375, 0.90625, 1.345947265625, 1.78564453125, 2.225341796875, 2.6650390625, 3.104736328125, 3.54443359375, 3.984130859375, 4.423828125, 4.863525390625, 5.30322265625, 5.742919921875, 6.1826171875, 6.622314453125, 7.06201171875, 7.501708984375, 7.94140625, 8.381103515625, 8.82080078125, 9.260498046875, 9.7001953125, 10.139892578125, 10.57958984375, 11.019287109375, 11.458984375, 11.898681640625, 12.33837890625, 12.778076171875, 13.2177734375, 13.657470703125, 14.09716796875, 14.536865234375, 14.9765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 7.0, 6.0, 9.0, 6.0, 8.0, 10.0, 21.0, 24.0, 15.0, 33.0, 34.0, 39.0, 59.0, 72.0, 92.0, 127.0, 94.0, 55.0, 45.0, 54.0, 30.0, 38.0, 30.0, 23.0, 19.0, 8.0, 3.0, 6.0, 5.0, 7.0, 2.0, 2.0, 5.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-11.4609375, -11.119873046875, -10.77880859375, -10.437744140625, -10.0966796875, -9.755615234375, -9.41455078125, -9.073486328125, -8.732421875, -8.391357421875, -8.05029296875, -7.709228515625, -7.3681640625, -7.027099609375, -6.68603515625, -6.344970703125, -6.00390625, -5.662841796875, -5.32177734375, -4.980712890625, -4.6396484375, -4.298583984375, -3.95751953125, -3.616455078125, -3.275390625, -2.934326171875, -2.59326171875, -2.252197265625, -1.9111328125, -1.570068359375, -1.22900390625, -0.887939453125, -0.546875, -0.205810546875, 0.13525390625, 0.476318359375, 0.8173828125, 1.158447265625, 1.49951171875, 1.840576171875, 2.181640625, 2.522705078125, 2.86376953125, 3.204833984375, 3.5458984375, 3.886962890625, 4.22802734375, 4.569091796875, 4.91015625, 5.251220703125, 5.59228515625, 5.933349609375, 6.2744140625, 6.615478515625, 6.95654296875, 7.297607421875, 7.638671875, 7.979736328125, 8.32080078125, 8.661865234375, 9.0029296875, 9.343994140625, 9.68505859375, 10.026123046875, 10.3671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 9.0, 20.0, 23.0, 77.0, 159.0, 309.0, 220.0, 90.0, 48.0, 11.0, 13.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.3929443359375, -293.54205322265625, -283.6911926269531, -273.84033203125, -263.98944091796875, -254.13856506347656, -244.28768920898438, -234.4368133544922, -224.5859375, -214.7350616455078, -204.88418579101562, -195.03330993652344, -185.18243408203125, -175.33155822753906, -165.48068237304688, -155.6298065185547, -145.7789306640625, -135.9280548095703, -126.07717895507812, -116.22630310058594, -106.37542724609375, -96.52455139160156, -86.67367553710938, -76.82279968261719, -66.971923828125, -57.12104797363281, -47.270172119140625, -37.41929626464844, -27.56842041015625, -17.717544555664062, -7.866668701171875, 1.9842071533203125, 11.8350830078125, 21.685958862304688, 31.536834716796875, 41.38771057128906, 51.23858642578125, 61.08946228027344, 70.94033813476562, 80.79121398925781, 90.64208984375, 100.49296569824219, 110.34384155273438, 120.19471740722656, 130.04559326171875, 139.89646911621094, 149.74734497070312, 159.5982208251953, 169.4490966796875, 179.2999725341797, 189.15084838867188, 199.00172424316406, 208.85260009765625, 218.70347595214844, 228.55435180664062, 238.4052276611328, 248.256103515625, 258.10699462890625, 267.9578552246094, 277.8087158203125, 287.65960693359375, 297.510498046875, 307.3613586425781, 317.21221923828125, 327.0631103515625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 10.0, 17.0, 11.0, 12.0, 20.0, 20.0, 18.0, 33.0, 30.0, 27.0, 33.0, 40.0, 57.0, 46.0, 58.0, 71.0, 64.0, 59.0, 41.0, 39.0, 31.0, 31.0, 30.0, 35.0, 25.0, 15.0, 21.0, 17.0, 9.0, 14.0, 10.0, 3.0, 7.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-129.80667114257812, -126.37604522705078, -122.94541931152344, -119.5147933959961, -116.08416748046875, -112.6535415649414, -109.22291564941406, -105.79228973388672, -102.36166381835938, -98.93103790283203, -95.50041198730469, -92.06978607177734, -88.63916015625, -85.20853424072266, -81.77790832519531, -78.34728240966797, -74.91665649414062, -71.48603057861328, -68.05540466308594, -64.6247787475586, -61.19415283203125, -57.763526916503906, -54.33290100097656, -50.90227508544922, -47.471649169921875, -44.04102325439453, -40.61039733886719, -37.179771423339844, -33.7491455078125, -30.318519592285156, -26.887893676757812, -23.45726776123047, -20.026634216308594, -16.59600830078125, -13.165382385253906, -9.734756469726562, -6.304130554199219, -2.873504638671875, 0.5571212768554688, 3.9877471923828125, 7.418373107910156, 10.8489990234375, 14.279624938964844, 17.710250854492188, 21.14087677001953, 24.571502685546875, 28.00212860107422, 31.432754516601562, 34.863380432128906, 38.29400634765625, 41.724632263183594, 45.15525817871094, 48.58588409423828, 52.016510009765625, 55.44713592529297, 58.87776184082031, 62.308387756347656, 65.739013671875, 69.16963958740234, 72.60026550292969, 76.03089141845703, 79.46151733398438, 82.89214324951172, 86.32276916503906, 89.7533950805664]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 7.0, 8.0, 9.0, 8.0, 14.0, 16.0, 24.0, 13.0, 39.0, 57.0, 96.0, 194.0, 303.0, 679.0, 1543.0, 4450.0, 20004.0, 348701.0, 3697065.0, 103666.0, 11885.0, 3112.0, 1148.0, 518.0, 282.0, 152.0, 86.0, 53.0, 38.0, 19.0, 21.0, 18.0, 6.0, 4.0, 3.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.703125, -25.90234375, -25.1015625, -24.30078125, -23.5, -22.69921875, -21.8984375, -21.09765625, -20.296875, -19.49609375, -18.6953125, -17.89453125, -17.09375, -16.29296875, -15.4921875, -14.69140625, -13.890625, -13.08984375, -12.2890625, -11.48828125, -10.6875, -9.88671875, -9.0859375, -8.28515625, -7.484375, -6.68359375, -5.8828125, -5.08203125, -4.28125, -3.48046875, -2.6796875, -1.87890625, -1.078125, -0.27734375, 0.5234375, 1.32421875, 2.125, 2.92578125, 3.7265625, 4.52734375, 5.328125, 6.12890625, 6.9296875, 7.73046875, 8.53125, 9.33203125, 10.1328125, 10.93359375, 11.734375, 12.53515625, 13.3359375, 14.13671875, 14.9375, 15.73828125, 16.5390625, 17.33984375, 18.140625, 18.94140625, 19.7421875, 20.54296875, 21.34375, 22.14453125, 22.9453125, 23.74609375, 24.546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 5.0, 4.0, 13.0, 12.0, 20.0, 29.0, 35.0, 43.0, 51.0, 43.0, 50.0, 67.0, 74.0, 67.0, 69.0, 74.0, 49.0, 60.0, 36.0, 42.0, 36.0, 28.0, 25.0, 15.0, 19.0, 13.0, 5.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44140625, -6.18145751953125, -5.9215087890625, -5.66156005859375, -5.401611328125, -5.14166259765625, -4.8817138671875, -4.62176513671875, -4.36181640625, -4.10186767578125, -3.8419189453125, -3.58197021484375, -3.322021484375, -3.06207275390625, -2.8021240234375, -2.54217529296875, -2.2822265625, -2.02227783203125, -1.7623291015625, -1.50238037109375, -1.242431640625, -0.98248291015625, -0.7225341796875, -0.46258544921875, -0.20263671875, 0.05731201171875, 0.3172607421875, 0.57720947265625, 0.837158203125, 1.09710693359375, 1.3570556640625, 1.61700439453125, 1.876953125, 2.13690185546875, 2.3968505859375, 2.65679931640625, 2.916748046875, 3.17669677734375, 3.4366455078125, 3.69659423828125, 3.95654296875, 4.21649169921875, 4.4764404296875, 4.73638916015625, 4.996337890625, 5.25628662109375, 5.5162353515625, 5.77618408203125, 6.0361328125, 6.29608154296875, 6.5560302734375, 6.81597900390625, 7.075927734375, 7.33587646484375, 7.5958251953125, 7.85577392578125, 8.11572265625, 8.37567138671875, 8.6356201171875, 8.89556884765625, 9.155517578125, 9.41546630859375, 9.6754150390625, 9.93536376953125, 10.1953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 13.0, 24.0, 42.0, 81.0, 161.0, 355.0, 1169.0, 21598.0, 4145510.0, 23758.0, 1137.0, 258.0, 99.0, 45.0, 23.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.5, -83.9189453125, -81.337890625, -78.7568359375, -76.17578125, -73.5947265625, -71.013671875, -68.4326171875, -65.8515625, -63.2705078125, -60.689453125, -58.1083984375, -55.52734375, -52.9462890625, -50.365234375, -47.7841796875, -45.203125, -42.6220703125, -40.041015625, -37.4599609375, -34.87890625, -32.2978515625, -29.716796875, -27.1357421875, -24.5546875, -21.9736328125, -19.392578125, -16.8115234375, -14.23046875, -11.6494140625, -9.068359375, -6.4873046875, -3.90625, -1.3251953125, 1.255859375, 3.8369140625, 6.41796875, 8.9990234375, 11.580078125, 14.1611328125, 16.7421875, 19.3232421875, 21.904296875, 24.4853515625, 27.06640625, 29.6474609375, 32.228515625, 34.8095703125, 37.390625, 39.9716796875, 42.552734375, 45.1337890625, 47.71484375, 50.2958984375, 52.876953125, 55.4580078125, 58.0390625, 60.6201171875, 63.201171875, 65.7822265625, 68.36328125, 70.9443359375, 73.525390625, 76.1064453125, 78.6875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 13.0, 12.0, 49.0, 97.0, 297.0, 1254.0, 1641.0, 505.0, 126.0, 52.0, 16.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.6875, -71.14697265625, -69.6064453125, -68.06591796875, -66.525390625, -64.98486328125, -63.4443359375, -61.90380859375, -60.36328125, -58.82275390625, -57.2822265625, -55.74169921875, -54.201171875, -52.66064453125, -51.1201171875, -49.57958984375, -48.0390625, -46.49853515625, -44.9580078125, -43.41748046875, -41.876953125, -40.33642578125, -38.7958984375, -37.25537109375, -35.71484375, -34.17431640625, -32.6337890625, -31.09326171875, -29.552734375, -28.01220703125, -26.4716796875, -24.93115234375, -23.390625, -21.85009765625, -20.3095703125, -18.76904296875, -17.228515625, -15.68798828125, -14.1474609375, -12.60693359375, -11.06640625, -9.52587890625, -7.9853515625, -6.44482421875, -4.904296875, -3.36376953125, -1.8232421875, -0.28271484375, 1.2578125, 2.79833984375, 4.3388671875, 5.87939453125, 7.419921875, 8.96044921875, 10.5009765625, 12.04150390625, 13.58203125, 15.12255859375, 16.6630859375, 18.20361328125, 19.744140625, 21.28466796875, 22.8251953125, 24.36572265625, 25.90625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 14.0, 35.0, 92.0, 265.0, 358.0, 163.0, 54.0, 12.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-521.3150024414062, -508.3994445800781, -495.48388671875, -482.5683288574219, -469.65277099609375, -456.73724365234375, -443.8216552734375, -430.9061279296875, -417.9905700683594, -405.07501220703125, -392.1594543457031, -379.243896484375, -366.3283386230469, -353.41278076171875, -340.49725341796875, -327.5816955566406, -314.6661376953125, -301.7505798339844, -288.83502197265625, -275.9194641113281, -263.00390625, -250.08836364746094, -237.1728057861328, -224.25726318359375, -211.3416748046875, -198.42611694335938, -185.51055908203125, -172.59500122070312, -159.67945861816406, -146.76390075683594, -133.8483428955078, -120.93279266357422, -108.01724243164062, -95.1016845703125, -82.1861343383789, -69.27057647705078, -56.35502243041992, -43.43946838378906, -30.523910522460938, -17.608360290527344, -4.692802429199219, 8.222752571105957, 21.138307571411133, 34.053863525390625, 46.969417572021484, 59.884971618652344, 72.80052947998047, 85.71607971191406, 98.63163757324219, 111.54719543457031, 124.4627456665039, 137.3782958984375, 150.29385375976562, 163.20941162109375, 176.12496948242188, 189.04052734375, 201.95608520507812, 214.87164306640625, 227.78720092773438, 240.7027587890625, 253.61830139160156, 266.53387451171875, 279.44940185546875, 292.3649597167969, 305.280517578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 12.0, 26.0, 22.0, 50.0, 65.0, 99.0, 94.0, 118.0, 117.0, 128.0, 95.0, 62.0, 54.0, 26.0, 20.0, 10.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-345.9951477050781, -338.9222717285156, -331.8493957519531, -324.7764892578125, -317.70361328125, -310.6307373046875, -303.557861328125, -296.4849853515625, -289.412109375, -282.3392333984375, -275.266357421875, -268.1934814453125, -261.1205749511719, -254.04769897460938, -246.97482299804688, -239.90194702148438, -232.8290557861328, -225.7561798095703, -218.68328857421875, -211.61041259765625, -204.53753662109375, -197.46466064453125, -190.3917694091797, -183.3188934326172, -176.24600219726562, -169.17312622070312, -162.10023498535156, -155.02735900878906, -147.95448303222656, -140.881591796875, -133.8087158203125, -126.73583984375, -119.66297912597656, -112.59009552001953, -105.51721954345703, -98.4443359375, -91.3714599609375, -84.29857635498047, -77.22569274902344, -70.15281677246094, -63.079933166503906, -56.00705337524414, -48.934173583984375, -41.861289978027344, -34.78841018676758, -27.715530395507812, -20.64264678955078, -13.569766998291016, -6.49688720703125, 0.575993537902832, 7.648874282836914, 14.721755981445312, 21.794635772705078, 28.867515563964844, 35.940399169921875, 43.01327896118164, 50.086158752441406, 57.15903854370117, 64.23191833496094, 71.30480194091797, 78.377685546875, 85.4505615234375, 92.52344512939453, 99.59632873535156, 106.66920471191406]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 7.0, 4.0, 10.0, 15.0, 17.0, 26.0, 46.0, 63.0, 141.0, 353.0, 866.0, 2538.0, 10654.0, 69176.0, 598419.0, 322348.0, 34504.0, 6511.0, 1667.0, 655.0, 258.0, 114.0, 54.0, 42.0, 29.0, 17.0, 11.0, 5.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -20.942138671875, -20.02490234375, -19.107666015625, -18.1904296875, -17.273193359375, -16.35595703125, -15.438720703125, -14.521484375, -13.604248046875, -12.68701171875, -11.769775390625, -10.8525390625, -9.935302734375, -9.01806640625, -8.100830078125, -7.18359375, -6.266357421875, -5.34912109375, -4.431884765625, -3.5146484375, -2.597412109375, -1.68017578125, -0.762939453125, 0.154296875, 1.071533203125, 1.98876953125, 2.906005859375, 3.8232421875, 4.740478515625, 5.65771484375, 6.574951171875, 7.4921875, 8.409423828125, 9.32666015625, 10.243896484375, 11.1611328125, 12.078369140625, 12.99560546875, 13.912841796875, 14.830078125, 15.747314453125, 16.66455078125, 17.581787109375, 18.4990234375, 19.416259765625, 20.33349609375, 21.250732421875, 22.16796875, 23.085205078125, 24.00244140625, 24.919677734375, 25.8369140625, 26.754150390625, 27.67138671875, 28.588623046875, 29.505859375, 30.423095703125, 31.34033203125, 32.257568359375, 33.1748046875, 34.092041015625, 35.00927734375, 35.926513671875, 36.84375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 12.0, 9.0, 17.0, 17.0, 17.0, 28.0, 41.0, 47.0, 41.0, 43.0, 37.0, 51.0, 57.0, 62.0, 61.0, 47.0, 49.0, 41.0, 50.0, 42.0, 41.0, 40.0, 30.0, 28.0, 14.0, 16.0, 13.0, 8.0, 11.0, 9.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.859375, -8.628173828125, -8.39697265625, -8.165771484375, -7.9345703125, -7.703369140625, -7.47216796875, -7.240966796875, -7.009765625, -6.778564453125, -6.54736328125, -6.316162109375, -6.0849609375, -5.853759765625, -5.62255859375, -5.391357421875, -5.16015625, -4.928955078125, -4.69775390625, -4.466552734375, -4.2353515625, -4.004150390625, -3.77294921875, -3.541748046875, -3.310546875, -3.079345703125, -2.84814453125, -2.616943359375, -2.3857421875, -2.154541015625, -1.92333984375, -1.692138671875, -1.4609375, -1.229736328125, -0.99853515625, -0.767333984375, -0.5361328125, -0.304931640625, -0.07373046875, 0.157470703125, 0.388671875, 0.619873046875, 0.85107421875, 1.082275390625, 1.3134765625, 1.544677734375, 1.77587890625, 2.007080078125, 2.23828125, 2.469482421875, 2.70068359375, 2.931884765625, 3.1630859375, 3.394287109375, 3.62548828125, 3.856689453125, 4.087890625, 4.319091796875, 4.55029296875, 4.781494140625, 5.0126953125, 5.243896484375, 5.47509765625, 5.706298828125, 5.9375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 14.0, 27.0, 53.0, 104.0, 216.0, 599.0, 1774.0, 9168.0, 335459.0, 686068.0, 11844.0, 2061.0, 658.0, 255.0, 94.0, 62.0, 23.0, 20.0, 12.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.28125, -58.13232421875, -55.9833984375, -53.83447265625, -51.685546875, -49.53662109375, -47.3876953125, -45.23876953125, -43.08984375, -40.94091796875, -38.7919921875, -36.64306640625, -34.494140625, -32.34521484375, -30.1962890625, -28.04736328125, -25.8984375, -23.74951171875, -21.6005859375, -19.45166015625, -17.302734375, -15.15380859375, -13.0048828125, -10.85595703125, -8.70703125, -6.55810546875, -4.4091796875, -2.26025390625, -0.111328125, 2.03759765625, 4.1865234375, 6.33544921875, 8.484375, 10.63330078125, 12.7822265625, 14.93115234375, 17.080078125, 19.22900390625, 21.3779296875, 23.52685546875, 25.67578125, 27.82470703125, 29.9736328125, 32.12255859375, 34.271484375, 36.42041015625, 38.5693359375, 40.71826171875, 42.8671875, 45.01611328125, 47.1650390625, 49.31396484375, 51.462890625, 53.61181640625, 55.7607421875, 57.90966796875, 60.05859375, 62.20751953125, 64.3564453125, 66.50537109375, 68.654296875, 70.80322265625, 72.9521484375, 75.10107421875, 77.25]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 4.0, 4.0, 15.0, 17.0, 8.0, 27.0, 18.0, 23.0, 34.0, 46.0, 47.0, 51.0, 74.0, 70.0, 56.0, 50.0, 51.0, 53.0, 52.0, 50.0, 52.0, 36.0, 31.0, 27.0, 15.0, 25.0, 9.0, 4.0, 13.0, 8.0, 8.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.0, -35.849609375, -34.69921875, -33.548828125, -32.3984375, -31.248046875, -30.09765625, -28.947265625, -27.796875, -26.646484375, -25.49609375, -24.345703125, -23.1953125, -22.044921875, -20.89453125, -19.744140625, -18.59375, -17.443359375, -16.29296875, -15.142578125, -13.9921875, -12.841796875, -11.69140625, -10.541015625, -9.390625, -8.240234375, -7.08984375, -5.939453125, -4.7890625, -3.638671875, -2.48828125, -1.337890625, -0.1875, 0.962890625, 2.11328125, 3.263671875, 4.4140625, 5.564453125, 6.71484375, 7.865234375, 9.015625, 10.166015625, 11.31640625, 12.466796875, 13.6171875, 14.767578125, 15.91796875, 17.068359375, 18.21875, 19.369140625, 20.51953125, 21.669921875, 22.8203125, 23.970703125, 25.12109375, 26.271484375, 27.421875, 28.572265625, 29.72265625, 30.873046875, 32.0234375, 33.173828125, 34.32421875, 35.474609375, 36.625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 12.0, 26.0, 29.0, 95.0, 223.0, 707.0, 3091.0, 32344.0, 953712.0, 53148.0, 3889.0, 832.0, 249.0, 107.0, 38.0, 23.0, 16.0, 6.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.09228515625, -21.7783203125, -20.46435546875, -19.150390625, -17.83642578125, -16.5224609375, -15.20849609375, -13.89453125, -12.58056640625, -11.2666015625, -9.95263671875, -8.638671875, -7.32470703125, -6.0107421875, -4.69677734375, -3.3828125, -2.06884765625, -0.7548828125, 0.55908203125, 1.873046875, 3.18701171875, 4.5009765625, 5.81494140625, 7.12890625, 8.44287109375, 9.7568359375, 11.07080078125, 12.384765625, 13.69873046875, 15.0126953125, 16.32666015625, 17.640625, 18.95458984375, 20.2685546875, 21.58251953125, 22.896484375, 24.21044921875, 25.5244140625, 26.83837890625, 28.15234375, 29.46630859375, 30.7802734375, 32.09423828125, 33.408203125, 34.72216796875, 36.0361328125, 37.35009765625, 38.6640625, 39.97802734375, 41.2919921875, 42.60595703125, 43.919921875, 45.23388671875, 46.5478515625, 47.86181640625, 49.17578125, 50.48974609375, 51.8037109375, 53.11767578125, 54.431640625, 55.74560546875, 57.0595703125, 58.37353515625, 59.6875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 16.0, 13.0, 20.0, 24.0, 29.0, 71.0, 171.0, 333.0, 138.0, 71.0, 33.0, 25.0, 16.0, 7.0, 10.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0099029541015625, -0.009638309478759766, -0.009373664855957031, -0.009109020233154297, -0.008844375610351562, -0.008579730987548828, -0.008315086364746094, -0.00805044174194336, -0.007785797119140625, -0.007521152496337891, -0.007256507873535156, -0.006991863250732422, -0.0067272186279296875, -0.006462574005126953, -0.006197929382324219, -0.005933284759521484, -0.00566864013671875, -0.005403995513916016, -0.005139350891113281, -0.004874706268310547, -0.0046100616455078125, -0.004345417022705078, -0.004080772399902344, -0.0038161277770996094, -0.003551483154296875, -0.0032868385314941406, -0.0030221939086914062, -0.002757549285888672, -0.0024929046630859375, -0.002228260040283203, -0.0019636154174804688, -0.0016989707946777344, -0.001434326171875, -0.0011696815490722656, -0.0009050369262695312, -0.0006403923034667969, -0.0003757476806640625, -0.00011110305786132812, 0.00015354156494140625, 0.0004181861877441406, 0.000682830810546875, 0.0009474754333496094, 0.0012121200561523438, 0.0014767646789550781, 0.0017414093017578125, 0.002006053924560547, 0.0022706985473632812, 0.0025353431701660156, 0.00279998779296875, 0.0030646324157714844, 0.0033292770385742188, 0.003593921661376953, 0.0038585662841796875, 0.004123210906982422, 0.004387855529785156, 0.004652500152587891, 0.004917144775390625, 0.005181789398193359, 0.005446434020996094, 0.005711078643798828, 0.0059757232666015625, 0.006240367889404297, 0.006505012512207031, 0.006769657135009766, 0.0070343017578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 7.0, 9.0, 10.0, 15.0, 15.0, 42.0, 45.0, 53.0, 71.0, 111.0, 187.0, 327.0, 486.0, 983.0, 1818.0, 3749.0, 9543.0, 29381.0, 151285.0, 739439.0, 77973.0, 19751.0, 6872.0, 2990.0, 1418.0, 731.0, 431.0, 245.0, 186.0, 105.0, 65.0, 50.0, 43.0, 28.0, 29.0, 18.0, 17.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0], "bins": [-19.09375, -18.5682373046875, -18.042724609375, -17.5172119140625, -16.99169921875, -16.4661865234375, -15.940673828125, -15.4151611328125, -14.8896484375, -14.3641357421875, -13.838623046875, -13.3131103515625, -12.78759765625, -12.2620849609375, -11.736572265625, -11.2110595703125, -10.685546875, -10.1600341796875, -9.634521484375, -9.1090087890625, -8.58349609375, -8.0579833984375, -7.532470703125, -7.0069580078125, -6.4814453125, -5.9559326171875, -5.430419921875, -4.9049072265625, -4.37939453125, -3.8538818359375, -3.328369140625, -2.8028564453125, -2.27734375, -1.7518310546875, -1.226318359375, -0.7008056640625, -0.17529296875, 0.3502197265625, 0.875732421875, 1.4012451171875, 1.9267578125, 2.4522705078125, 2.977783203125, 3.5032958984375, 4.02880859375, 4.5543212890625, 5.079833984375, 5.6053466796875, 6.130859375, 6.6563720703125, 7.181884765625, 7.7073974609375, 8.23291015625, 8.7584228515625, 9.283935546875, 9.8094482421875, 10.3349609375, 10.8604736328125, 11.385986328125, 11.9114990234375, 12.43701171875, 12.9625244140625, 13.488037109375, 14.0135498046875, 14.5390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 7.0, 6.0, 10.0, 12.0, 7.0, 10.0, 11.0, 18.0, 24.0, 34.0, 41.0, 86.0, 123.0, 174.0, 131.0, 83.0, 50.0, 35.0, 27.0, 24.0, 16.0, 11.0, 8.0, 12.0, 7.0, 2.0, 9.0, 4.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.5, -15.9923095703125, -15.484619140625, -14.9769287109375, -14.46923828125, -13.9615478515625, -13.453857421875, -12.9461669921875, -12.4384765625, -11.9307861328125, -11.423095703125, -10.9154052734375, -10.40771484375, -9.9000244140625, -9.392333984375, -8.8846435546875, -8.376953125, -7.8692626953125, -7.361572265625, -6.8538818359375, -6.34619140625, -5.8385009765625, -5.330810546875, -4.8231201171875, -4.3154296875, -3.8077392578125, -3.300048828125, -2.7923583984375, -2.28466796875, -1.7769775390625, -1.269287109375, -0.7615966796875, -0.25390625, 0.2537841796875, 0.761474609375, 1.2691650390625, 1.77685546875, 2.2845458984375, 2.792236328125, 3.2999267578125, 3.8076171875, 4.3153076171875, 4.822998046875, 5.3306884765625, 5.83837890625, 6.3460693359375, 6.853759765625, 7.3614501953125, 7.869140625, 8.3768310546875, 8.884521484375, 9.3922119140625, 9.89990234375, 10.4075927734375, 10.915283203125, 11.4229736328125, 11.9306640625, 12.4383544921875, 12.946044921875, 13.4537353515625, 13.96142578125, 14.4691162109375, 14.976806640625, 15.4844970703125, 15.9921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 22.0, 67.0, 197.0, 448.0, 175.0, 47.0, 15.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-558.3154296875, -543.3786010742188, -528.4417724609375, -513.5048828125, -498.5680847167969, -483.6312255859375, -468.69439697265625, -453.757568359375, -438.82073974609375, -423.8839111328125, -408.9470520019531, -394.0102233886719, -379.0733947753906, -364.13653564453125, -349.19970703125, -334.26287841796875, -319.3260192871094, -304.3891906738281, -289.45233154296875, -274.5155029296875, -259.57867431640625, -244.64183044433594, -229.70498657226562, -214.76815795898438, -199.83131408691406, -184.89447021484375, -169.9576416015625, -155.0207977294922, -140.08395385742188, -125.14712524414062, -110.21028137207031, -95.27344512939453, -80.33660888671875, -65.39977264404297, -50.46293258666992, -35.526092529296875, -20.589256286621094, -5.6524200439453125, 9.284423828125, 24.22126007080078, 39.15809631347656, 54.094932556152344, 69.03176879882812, 83.96861267089844, 98.90544891357422, 113.84228515625, 128.7791290283203, 143.71597290039062, 158.65280151367188, 173.5896453857422, 188.52647399902344, 203.46331787109375, 218.400146484375, 233.3369903564453, 248.27383422851562, 263.2106628417969, 278.14752197265625, 293.0843505859375, 308.0212097167969, 322.9580383300781, 337.8948669433594, 352.83172607421875, 367.7685546875, 382.70538330078125, 397.6422119140625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 5.0, 6.0, 6.0, 6.0, 14.0, 6.0, 12.0, 16.0, 17.0, 18.0, 20.0, 24.0, 28.0, 32.0, 40.0, 31.0, 53.0, 55.0, 59.0, 72.0, 67.0, 69.0, 48.0, 36.0, 29.0, 30.0, 37.0, 23.0, 26.0, 26.0, 17.0, 12.0, 13.0, 9.0, 6.0, 2.0, 9.0, 8.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.08128356933594, -102.89578247070312, -98.71028137207031, -94.5247802734375, -90.33927917480469, -86.15377807617188, -81.9682846069336, -77.78278350830078, -73.59728240966797, -69.41178131103516, -65.22628021240234, -61.0407829284668, -56.855281829833984, -52.66978073120117, -48.484283447265625, -44.29878234863281, -40.11328125, -35.92778015136719, -31.742280960083008, -27.556781768798828, -23.371280670166016, -19.185779571533203, -15.000280380249023, -10.814781188964844, -6.629280090332031, -2.443779945373535, 1.741720199584961, 5.927220344543457, 10.112720489501953, 14.298221588134766, 18.483720779418945, 22.669219970703125, 26.854705810546875, 31.040206909179688, 35.2257080078125, 39.41120529174805, 43.59670639038086, 47.78220748901367, 51.96770477294922, 56.15320587158203, 60.338706970214844, 64.52420806884766, 68.70970916748047, 72.89521026611328, 77.08070373535156, 81.26620483398438, 85.45170593261719, 89.63720703125, 93.82270812988281, 98.00820922851562, 102.19371032714844, 106.37921142578125, 110.56471252441406, 114.75021362304688, 118.93570709228516, 123.12120819091797, 127.30670928955078, 131.49220275878906, 135.67770385742188, 139.8632049560547, 144.0487060546875, 148.2342071533203, 152.41970825195312, 156.60520935058594, 160.79071044921875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 4.0, 4.0, 11.0, 17.0, 16.0, 25.0, 36.0, 56.0, 97.0, 156.0, 423.0, 1148.0, 5302.0, 66158.0, 4051580.0, 62832.0, 4627.0, 981.0, 329.0, 144.0, 77.0, 47.0, 49.0, 38.0, 17.0, 20.0, 13.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.5625, -39.03173828125, -37.5009765625, -35.97021484375, -34.439453125, -32.90869140625, -31.3779296875, -29.84716796875, -28.31640625, -26.78564453125, -25.2548828125, -23.72412109375, -22.193359375, -20.66259765625, -19.1318359375, -17.60107421875, -16.0703125, -14.53955078125, -13.0087890625, -11.47802734375, -9.947265625, -8.41650390625, -6.8857421875, -5.35498046875, -3.82421875, -2.29345703125, -0.7626953125, 0.76806640625, 2.298828125, 3.82958984375, 5.3603515625, 6.89111328125, 8.421875, 9.95263671875, 11.4833984375, 13.01416015625, 14.544921875, 16.07568359375, 17.6064453125, 19.13720703125, 20.66796875, 22.19873046875, 23.7294921875, 25.26025390625, 26.791015625, 28.32177734375, 29.8525390625, 31.38330078125, 32.9140625, 34.44482421875, 35.9755859375, 37.50634765625, 39.037109375, 40.56787109375, 42.0986328125, 43.62939453125, 45.16015625, 46.69091796875, 48.2216796875, 49.75244140625, 51.283203125, 52.81396484375, 54.3447265625, 55.87548828125, 57.40625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 13.0, 17.0, 17.0, 25.0, 21.0, 47.0, 46.0, 58.0, 56.0, 53.0, 79.0, 75.0, 67.0, 63.0, 66.0, 45.0, 63.0, 50.0, 29.0, 25.0, 22.0, 13.0, 10.0, 9.0, 8.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55859375, -6.25897216796875, -5.9593505859375, -5.65972900390625, -5.360107421875, -5.06048583984375, -4.7608642578125, -4.46124267578125, -4.16162109375, -3.86199951171875, -3.5623779296875, -3.26275634765625, -2.963134765625, -2.66351318359375, -2.3638916015625, -2.06427001953125, -1.7646484375, -1.46502685546875, -1.1654052734375, -0.86578369140625, -0.566162109375, -0.26654052734375, 0.0330810546875, 0.33270263671875, 0.63232421875, 0.93194580078125, 1.2315673828125, 1.53118896484375, 1.830810546875, 2.13043212890625, 2.4300537109375, 2.72967529296875, 3.029296875, 3.32891845703125, 3.6285400390625, 3.92816162109375, 4.227783203125, 4.52740478515625, 4.8270263671875, 5.12664794921875, 5.42626953125, 5.72589111328125, 6.0255126953125, 6.32513427734375, 6.624755859375, 6.92437744140625, 7.2239990234375, 7.52362060546875, 7.8232421875, 8.12286376953125, 8.4224853515625, 8.72210693359375, 9.021728515625, 9.32135009765625, 9.6209716796875, 9.92059326171875, 10.22021484375, 10.51983642578125, 10.8194580078125, 11.11907958984375, 11.418701171875, 11.71832275390625, 12.0179443359375, 12.31756591796875, 12.6171875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 11.0, 18.0, 30.0, 61.0, 102.0, 187.0, 354.0, 772.0, 2255.0, 20897.0, 4124745.0, 41066.0, 2530.0, 712.0, 277.0, 133.0, 65.0, 28.0, 16.0, 8.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.6875, -75.833984375, -72.98046875, -70.126953125, -67.2734375, -64.419921875, -61.56640625, -58.712890625, -55.859375, -53.005859375, -50.15234375, -47.298828125, -44.4453125, -41.591796875, -38.73828125, -35.884765625, -33.03125, -30.177734375, -27.32421875, -24.470703125, -21.6171875, -18.763671875, -15.91015625, -13.056640625, -10.203125, -7.349609375, -4.49609375, -1.642578125, 1.2109375, 4.064453125, 6.91796875, 9.771484375, 12.625, 15.478515625, 18.33203125, 21.185546875, 24.0390625, 26.892578125, 29.74609375, 32.599609375, 35.453125, 38.306640625, 41.16015625, 44.013671875, 46.8671875, 49.720703125, 52.57421875, 55.427734375, 58.28125, 61.134765625, 63.98828125, 66.841796875, 69.6953125, 72.548828125, 75.40234375, 78.255859375, 81.109375, 83.962890625, 86.81640625, 89.669921875, 92.5234375, 95.376953125, 98.23046875, 101.083984375, 103.9375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 16.0, 23.0, 64.0, 173.0, 641.0, 1790.0, 944.0, 231.0, 98.0, 46.0, 16.0, 11.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -65.3076171875, -63.740234375, -62.1728515625, -60.60546875, -59.0380859375, -57.470703125, -55.9033203125, -54.3359375, -52.7685546875, -51.201171875, -49.6337890625, -48.06640625, -46.4990234375, -44.931640625, -43.3642578125, -41.796875, -40.2294921875, -38.662109375, -37.0947265625, -35.52734375, -33.9599609375, -32.392578125, -30.8251953125, -29.2578125, -27.6904296875, -26.123046875, -24.5556640625, -22.98828125, -21.4208984375, -19.853515625, -18.2861328125, -16.71875, -15.1513671875, -13.583984375, -12.0166015625, -10.44921875, -8.8818359375, -7.314453125, -5.7470703125, -4.1796875, -2.6123046875, -1.044921875, 0.5224609375, 2.08984375, 3.6572265625, 5.224609375, 6.7919921875, 8.359375, 9.9267578125, 11.494140625, 13.0615234375, 14.62890625, 16.1962890625, 17.763671875, 19.3310546875, 20.8984375, 22.4658203125, 24.033203125, 25.6005859375, 27.16796875, 28.7353515625, 30.302734375, 31.8701171875, 33.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 8.0, 17.0, 31.0, 78.0, 203.0, 304.0, 189.0, 83.0, 45.0, 12.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-494.77117919921875, -483.129638671875, -471.4880676269531, -459.8465270996094, -448.2049560546875, -436.56341552734375, -424.921875, -413.28033447265625, -401.6387634277344, -389.9972229003906, -378.35565185546875, -366.714111328125, -355.07257080078125, -343.4309997558594, -331.7894592285156, -320.14788818359375, -308.50634765625, -296.86480712890625, -285.2232360839844, -273.5816955566406, -261.94012451171875, -250.298583984375, -238.65704345703125, -227.01548767089844, -215.37393188476562, -203.7323760986328, -192.0908203125, -180.44927978515625, -168.80772399902344, -157.16616821289062, -145.52462768554688, -133.88307189941406, -122.24154663085938, -110.59999084472656, -98.95844268798828, -87.31689453125, -75.67533874511719, -64.03378295898438, -52.392234802246094, -40.75068664550781, -29.109130859375, -17.467578887939453, -5.826026916503906, 5.815525054931641, 17.457077026367188, 29.098628997802734, 40.74018096923828, 52.38172912597656, 64.02328491210938, 75.66484069824219, 87.30638885498047, 98.94793701171875, 110.58949279785156, 122.23104858398438, 133.87258911132812, 145.51414489746094, 157.15570068359375, 168.79725646972656, 180.43881225585938, 192.08035278320312, 203.72190856933594, 215.36346435546875, 227.0050048828125, 238.6465606689453, 250.28811645507812]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 7.0, 17.0, 26.0, 42.0, 65.0, 84.0, 118.0, 124.0, 134.0, 130.0, 96.0, 69.0, 40.0, 16.0, 18.0, 4.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-223.9552459716797, -215.48777770996094, -207.0203094482422, -198.55282592773438, -190.08535766601562, -181.61788940429688, -173.15042114257812, -164.68295288085938, -156.21548461914062, -147.74801635742188, -139.28054809570312, -130.81307983398438, -122.34559631347656, -113.87812805175781, -105.41065979003906, -96.94319152832031, -88.4757080078125, -80.00823974609375, -71.54076385498047, -63.07329559326172, -54.6058235168457, -46.13835144042969, -37.67088317871094, -29.203411102294922, -20.735939025878906, -12.268467903137207, -3.800996780395508, 4.666473388671875, 13.13394546508789, 21.601417541503906, 30.068885803222656, 38.53635787963867, 47.003814697265625, 55.47128677368164, 63.938758850097656, 72.4062271118164, 80.87370300292969, 89.34117126464844, 97.80863952636719, 106.27610778808594, 114.74358367919922, 123.21105194091797, 131.67852783203125, 140.14599609375, 148.61346435546875, 157.0809326171875, 165.54840087890625, 174.01588439941406, 182.4833526611328, 190.95082092285156, 199.4182891845703, 207.88577270507812, 216.35324096679688, 224.82070922851562, 233.28817749023438, 241.75564575195312, 250.22311401367188, 258.6905822753906, 267.1580505371094, 275.6255187988281, 284.0929870605469, 292.56048583984375, 301.0279541015625, 309.49542236328125, 317.962890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 3.0, 6.0, 7.0, 13.0, 20.0, 26.0, 28.0, 34.0, 59.0, 96.0, 125.0, 204.0, 384.0, 799.0, 2102.0, 6577.0, 27284.0, 202285.0, 652902.0, 127665.0, 19473.0, 5122.0, 1746.0, 704.0, 313.0, 164.0, 113.0, 77.0, 66.0, 40.0, 23.0, 27.0, 17.0, 5.0, 7.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.421875, -23.591064453125, -22.76025390625, -21.929443359375, -21.0986328125, -20.267822265625, -19.43701171875, -18.606201171875, -17.775390625, -16.944580078125, -16.11376953125, -15.282958984375, -14.4521484375, -13.621337890625, -12.79052734375, -11.959716796875, -11.12890625, -10.298095703125, -9.46728515625, -8.636474609375, -7.8056640625, -6.974853515625, -6.14404296875, -5.313232421875, -4.482421875, -3.651611328125, -2.82080078125, -1.989990234375, -1.1591796875, -0.328369140625, 0.50244140625, 1.333251953125, 2.1640625, 2.994873046875, 3.82568359375, 4.656494140625, 5.4873046875, 6.318115234375, 7.14892578125, 7.979736328125, 8.810546875, 9.641357421875, 10.47216796875, 11.302978515625, 12.1337890625, 12.964599609375, 13.79541015625, 14.626220703125, 15.45703125, 16.287841796875, 17.11865234375, 17.949462890625, 18.7802734375, 19.611083984375, 20.44189453125, 21.272705078125, 22.103515625, 22.934326171875, 23.76513671875, 24.595947265625, 25.4267578125, 26.257568359375, 27.08837890625, 27.919189453125, 28.75]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 19.0, 37.0, 50.0, 105.0, 115.0, 156.0, 152.0, 123.0, 117.0, 73.0, 31.0, 12.0, 9.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78125, -25.971435546875, -25.16162109375, -24.351806640625, -23.5419921875, -22.732177734375, -21.92236328125, -21.112548828125, -20.302734375, -19.492919921875, -18.68310546875, -17.873291015625, -17.0634765625, -16.253662109375, -15.44384765625, -14.634033203125, -13.82421875, -13.014404296875, -12.20458984375, -11.394775390625, -10.5849609375, -9.775146484375, -8.96533203125, -8.155517578125, -7.345703125, -6.535888671875, -5.72607421875, -4.916259765625, -4.1064453125, -3.296630859375, -2.48681640625, -1.677001953125, -0.8671875, -0.057373046875, 0.75244140625, 1.562255859375, 2.3720703125, 3.181884765625, 3.99169921875, 4.801513671875, 5.611328125, 6.421142578125, 7.23095703125, 8.040771484375, 8.8505859375, 9.660400390625, 10.47021484375, 11.280029296875, 12.08984375, 12.899658203125, 13.70947265625, 14.519287109375, 15.3291015625, 16.138916015625, 16.94873046875, 17.758544921875, 18.568359375, 19.378173828125, 20.18798828125, 20.997802734375, 21.8076171875, 22.617431640625, 23.42724609375, 24.237060546875, 25.046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 14.0, 15.0, 24.0, 45.0, 74.0, 164.0, 400.0, 1082.0, 3882.0, 27091.0, 692707.0, 302041.0, 16615.0, 2823.0, 878.0, 340.0, 168.0, 85.0, 38.0, 22.0, 17.0, 10.0, 4.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.59375, -51.16845703125, -49.7431640625, -48.31787109375, -46.892578125, -45.46728515625, -44.0419921875, -42.61669921875, -41.19140625, -39.76611328125, -38.3408203125, -36.91552734375, -35.490234375, -34.06494140625, -32.6396484375, -31.21435546875, -29.7890625, -28.36376953125, -26.9384765625, -25.51318359375, -24.087890625, -22.66259765625, -21.2373046875, -19.81201171875, -18.38671875, -16.96142578125, -15.5361328125, -14.11083984375, -12.685546875, -11.26025390625, -9.8349609375, -8.40966796875, -6.984375, -5.55908203125, -4.1337890625, -2.70849609375, -1.283203125, 0.14208984375, 1.5673828125, 2.99267578125, 4.41796875, 5.84326171875, 7.2685546875, 8.69384765625, 10.119140625, 11.54443359375, 12.9697265625, 14.39501953125, 15.8203125, 17.24560546875, 18.6708984375, 20.09619140625, 21.521484375, 22.94677734375, 24.3720703125, 25.79736328125, 27.22265625, 28.64794921875, 30.0732421875, 31.49853515625, 32.923828125, 34.34912109375, 35.7744140625, 37.19970703125, 38.625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 15.0, 14.0, 24.0, 37.0, 49.0, 63.0, 64.0, 102.0, 96.0, 99.0, 102.0, 81.0, 54.0, 56.0, 40.0, 26.0, 26.0, 17.0, 14.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.4375, -78.337890625, -76.23828125, -74.138671875, -72.0390625, -69.939453125, -67.83984375, -65.740234375, -63.640625, -61.541015625, -59.44140625, -57.341796875, -55.2421875, -53.142578125, -51.04296875, -48.943359375, -46.84375, -44.744140625, -42.64453125, -40.544921875, -38.4453125, -36.345703125, -34.24609375, -32.146484375, -30.046875, -27.947265625, -25.84765625, -23.748046875, -21.6484375, -19.548828125, -17.44921875, -15.349609375, -13.25, -11.150390625, -9.05078125, -6.951171875, -4.8515625, -2.751953125, -0.65234375, 1.447265625, 3.546875, 5.646484375, 7.74609375, 9.845703125, 11.9453125, 14.044921875, 16.14453125, 18.244140625, 20.34375, 22.443359375, 24.54296875, 26.642578125, 28.7421875, 30.841796875, 32.94140625, 35.041015625, 37.140625, 39.240234375, 41.33984375, 43.439453125, 45.5390625, 47.638671875, 49.73828125, 51.837890625, 53.9375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 16.0, 30.0, 54.0, 117.0, 291.0, 880.0, 3140.0, 13796.0, 124351.0, 834116.0, 59559.0, 8958.0, 2159.0, 656.0, 224.0, 86.0, 40.0, 14.0, 19.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.596923828125, -17.05322265625, -16.509521484375, -15.9658203125, -15.422119140625, -14.87841796875, -14.334716796875, -13.791015625, -13.247314453125, -12.70361328125, -12.159912109375, -11.6162109375, -11.072509765625, -10.52880859375, -9.985107421875, -9.44140625, -8.897705078125, -8.35400390625, -7.810302734375, -7.2666015625, -6.722900390625, -6.17919921875, -5.635498046875, -5.091796875, -4.548095703125, -4.00439453125, -3.460693359375, -2.9169921875, -2.373291015625, -1.82958984375, -1.285888671875, -0.7421875, -0.198486328125, 0.34521484375, 0.888916015625, 1.4326171875, 1.976318359375, 2.52001953125, 3.063720703125, 3.607421875, 4.151123046875, 4.69482421875, 5.238525390625, 5.7822265625, 6.325927734375, 6.86962890625, 7.413330078125, 7.95703125, 8.500732421875, 9.04443359375, 9.588134765625, 10.1318359375, 10.675537109375, 11.21923828125, 11.762939453125, 12.306640625, 12.850341796875, 13.39404296875, 13.937744140625, 14.4814453125, 15.025146484375, 15.56884765625, 16.112548828125, 16.65625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 15.0, 11.0, 23.0, 30.0, 52.0, 59.0, 164.0, 192.0, 151.0, 83.0, 63.0, 41.0, 25.0, 16.0, 6.0, 15.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028285980224609375, -0.0027085840702056885, -0.0025885701179504395, -0.0024685561656951904, -0.0023485422134399414, -0.0022285282611846924, -0.0021085143089294434, -0.0019885003566741943, -0.0018684864044189453, -0.0017484724521636963, -0.0016284584999084473, -0.0015084445476531982, -0.0013884305953979492, -0.0012684166431427002, -0.0011484026908874512, -0.0010283887386322021, -0.0009083747863769531, -0.0007883608341217041, -0.0006683468818664551, -0.0005483329296112061, -0.00042831897735595703, -0.000308305025100708, -0.00018829107284545898, -6.827712059020996e-05, 5.173683166503906e-05, 0.00017175078392028809, 0.0002917647361755371, 0.00041177868843078613, 0.0005317926406860352, 0.0006518065929412842, 0.0007718205451965332, 0.0008918344974517822, 0.0010118484497070312, 0.0011318624019622803, 0.0012518763542175293, 0.0013718903064727783, 0.0014919042587280273, 0.0016119182109832764, 0.0017319321632385254, 0.0018519461154937744, 0.0019719600677490234, 0.0020919740200042725, 0.0022119879722595215, 0.0023320019245147705, 0.0024520158767700195, 0.0025720298290252686, 0.0026920437812805176, 0.0028120577335357666, 0.0029320716857910156, 0.0030520856380462646, 0.0031720995903015137, 0.0032921135425567627, 0.0034121274948120117, 0.0035321414470672607, 0.0036521553993225098, 0.003772169351577759, 0.003892183303833008, 0.004012197256088257, 0.004132211208343506, 0.004252225160598755, 0.004372239112854004, 0.004492253065109253, 0.004612267017364502, 0.004732280969619751, 0.004852294921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 10.0, 16.0, 19.0, 31.0, 43.0, 75.0, 130.0, 229.0, 374.0, 758.0, 1584.0, 3485.0, 7829.0, 21355.0, 74598.0, 532080.0, 311418.0, 62451.0, 18744.0, 7218.0, 3116.0, 1438.0, 683.0, 380.0, 198.0, 117.0, 61.0, 39.0, 24.0, 9.0, 9.0, 11.0, 2.0, 5.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.390625, -11.09039306640625, -10.7901611328125, -10.48992919921875, -10.189697265625, -9.88946533203125, -9.5892333984375, -9.28900146484375, -8.98876953125, -8.68853759765625, -8.3883056640625, -8.08807373046875, -7.787841796875, -7.48760986328125, -7.1873779296875, -6.88714599609375, -6.5869140625, -6.28668212890625, -5.9864501953125, -5.68621826171875, -5.385986328125, -5.08575439453125, -4.7855224609375, -4.48529052734375, -4.18505859375, -3.88482666015625, -3.5845947265625, -3.28436279296875, -2.984130859375, -2.68389892578125, -2.3836669921875, -2.08343505859375, -1.783203125, -1.48297119140625, -1.1827392578125, -0.88250732421875, -0.582275390625, -0.28204345703125, 0.0181884765625, 0.31842041015625, 0.61865234375, 0.91888427734375, 1.2191162109375, 1.51934814453125, 1.819580078125, 2.11981201171875, 2.4200439453125, 2.72027587890625, 3.0205078125, 3.32073974609375, 3.6209716796875, 3.92120361328125, 4.221435546875, 4.52166748046875, 4.8218994140625, 5.12213134765625, 5.42236328125, 5.72259521484375, 6.0228271484375, 6.32305908203125, 6.623291015625, 6.92352294921875, 7.2237548828125, 7.52398681640625, 7.82421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 7.0, 7.0, 16.0, 22.0, 29.0, 43.0, 52.0, 62.0, 88.0, 113.0, 122.0, 109.0, 73.0, 58.0, 37.0, 32.0, 20.0, 20.0, 8.0, 14.0, 6.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.703125, -9.3612060546875, -9.019287109375, -8.6773681640625, -8.33544921875, -7.9935302734375, -7.651611328125, -7.3096923828125, -6.9677734375, -6.6258544921875, -6.283935546875, -5.9420166015625, -5.60009765625, -5.2581787109375, -4.916259765625, -4.5743408203125, -4.232421875, -3.8905029296875, -3.548583984375, -3.2066650390625, -2.86474609375, -2.5228271484375, -2.180908203125, -1.8389892578125, -1.4970703125, -1.1551513671875, -0.813232421875, -0.4713134765625, -0.12939453125, 0.2125244140625, 0.554443359375, 0.8963623046875, 1.23828125, 1.5802001953125, 1.922119140625, 2.2640380859375, 2.60595703125, 2.9478759765625, 3.289794921875, 3.6317138671875, 3.9736328125, 4.3155517578125, 4.657470703125, 4.9993896484375, 5.34130859375, 5.6832275390625, 6.025146484375, 6.3670654296875, 6.708984375, 7.0509033203125, 7.392822265625, 7.7347412109375, 8.07666015625, 8.4185791015625, 8.760498046875, 9.1024169921875, 9.4443359375, 9.7862548828125, 10.128173828125, 10.4700927734375, 10.81201171875, 11.1539306640625, 11.495849609375, 11.8377685546875, 12.1796875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 27.0, 119.0, 497.0, 267.0, 62.0, 8.0, 12.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.21905517578125, -237.69471740722656, -219.17037963867188, -200.6460418701172, -182.1217041015625, -163.5973663330078, -145.07302856445312, -126.54869079589844, -108.02435302734375, -89.50001525878906, -70.97567749023438, -52.45133972167969, -33.927001953125, -15.402664184570312, 3.121673583984375, 21.646011352539062, 40.17034912109375, 58.69468688964844, 77.21902465820312, 95.74336242675781, 114.2677001953125, 132.7920379638672, 151.31637573242188, 169.84071350097656, 188.36505126953125, 206.88938903808594, 225.41372680664062, 243.9380645751953, 262.46240234375, 280.98675537109375, 299.5110778808594, 318.035400390625, 336.559814453125, 355.08416748046875, 373.6084899902344, 392.1328125, 410.65716552734375, 429.1815185546875, 447.7058410644531, 466.23016357421875, 484.7545166015625, 503.27886962890625, 521.80322265625, 540.3275146484375, 558.8518676757812, 577.376220703125, 595.9005126953125, 614.4248657226562, 632.94921875, 651.4735717773438, 669.9979248046875, 688.522216796875, 707.0465698242188, 725.5709228515625, 744.09521484375, 762.6195678710938, 781.1439208984375, 799.6682739257812, 818.192626953125, 836.7169189453125, 855.2412719726562, 873.765625, 892.2899169921875, 910.8142700195312, 929.338623046875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 9.0, 14.0, 23.0, 23.0, 33.0, 42.0, 60.0, 68.0, 89.0, 145.0, 128.0, 96.0, 53.0, 58.0, 42.0, 30.0, 27.0, 21.0, 21.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.801025390625, -294.5783996582031, -285.35577392578125, -276.1331787109375, -266.9105529785156, -257.68792724609375, -248.46530151367188, -239.24269104003906, -230.02008056640625, -220.79745483398438, -211.57484436035156, -202.3522186279297, -193.12960815429688, -183.906982421875, -174.68435668945312, -165.4617462158203, -156.23912048339844, -147.01649475097656, -137.79388427734375, -128.57125854492188, -119.34864807128906, -110.12602233886719, -100.90340423583984, -91.6807861328125, -82.45816802978516, -73.23554992675781, -64.01293182373047, -54.79030990600586, -45.567691802978516, -36.34507369995117, -27.122451782226562, -17.89983367919922, -8.677215576171875, 0.5454034805297852, 9.768022537231445, 18.990642547607422, 28.213260650634766, 37.43587875366211, 46.65850067138672, 55.88111877441406, 65.1037368774414, 74.32635498046875, 83.5489730834961, 92.77159118652344, 101.99421691894531, 111.21682739257812, 120.439453125, 129.66207885742188, 138.8846893310547, 148.10731506347656, 157.32992553710938, 166.55255126953125, 175.77516174316406, 184.99778747558594, 194.22039794921875, 203.44302368164062, 212.6656494140625, 221.88827514648438, 231.1108856201172, 240.33351135253906, 249.55612182617188, 258.77874755859375, 268.0013732910156, 277.2239990234375, 286.44659423828125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 9.0, 10.0, 7.0, 9.0, 18.0, 32.0, 57.0, 96.0, 191.0, 417.0, 1279.0, 4547.0, 31246.0, 2951255.0, 1181699.0, 19382.0, 2842.0, 661.0, 232.0, 81.0, 52.0, 36.0, 25.0, 20.0, 14.0, 14.0, 14.0, 6.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.03125, -24.8427734375, -23.654296875, -22.4658203125, -21.27734375, -20.0888671875, -18.900390625, -17.7119140625, -16.5234375, -15.3349609375, -14.146484375, -12.9580078125, -11.76953125, -10.5810546875, -9.392578125, -8.2041015625, -7.015625, -5.8271484375, -4.638671875, -3.4501953125, -2.26171875, -1.0732421875, 0.115234375, 1.3037109375, 2.4921875, 3.6806640625, 4.869140625, 6.0576171875, 7.24609375, 8.4345703125, 9.623046875, 10.8115234375, 12.0, 13.1884765625, 14.376953125, 15.5654296875, 16.75390625, 17.9423828125, 19.130859375, 20.3193359375, 21.5078125, 22.6962890625, 23.884765625, 25.0732421875, 26.26171875, 27.4501953125, 28.638671875, 29.8271484375, 31.015625, 32.2041015625, 33.392578125, 34.5810546875, 35.76953125, 36.9580078125, 38.146484375, 39.3349609375, 40.5234375, 41.7119140625, 42.900390625, 44.0888671875, 45.27734375, 46.4658203125, 47.654296875, 48.8427734375, 50.03125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 8.0, 15.0, 8.0, 32.0, 22.0, 33.0, 34.0, 49.0, 56.0, 57.0, 72.0, 68.0, 85.0, 73.0, 75.0, 54.0, 47.0, 46.0, 51.0, 26.0, 16.0, 17.0, 13.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.7979736328125, -8.400634765625, -8.0032958984375, -7.60595703125, -7.2086181640625, -6.811279296875, -6.4139404296875, -6.0166015625, -5.6192626953125, -5.221923828125, -4.8245849609375, -4.42724609375, -4.0299072265625, -3.632568359375, -3.2352294921875, -2.837890625, -2.4405517578125, -2.043212890625, -1.6458740234375, -1.24853515625, -0.8511962890625, -0.453857421875, -0.0565185546875, 0.3408203125, 0.7381591796875, 1.135498046875, 1.5328369140625, 1.93017578125, 2.3275146484375, 2.724853515625, 3.1221923828125, 3.51953125, 3.9168701171875, 4.314208984375, 4.7115478515625, 5.10888671875, 5.5062255859375, 5.903564453125, 6.3009033203125, 6.6982421875, 7.0955810546875, 7.492919921875, 7.8902587890625, 8.28759765625, 8.6849365234375, 9.082275390625, 9.4796142578125, 9.876953125, 10.2742919921875, 10.671630859375, 11.0689697265625, 11.46630859375, 11.8636474609375, 12.260986328125, 12.6583251953125, 13.0556640625, 13.4530029296875, 13.850341796875, 14.2476806640625, 14.64501953125, 15.0423583984375, 15.439697265625, 15.8370361328125, 16.234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 13.0, 13.0, 15.0, 21.0, 29.0, 62.0, 101.0, 261.0, 728.0, 2362.0, 15313.0, 560408.0, 3569501.0, 39132.0, 4462.0, 1094.0, 400.0, 160.0, 84.0, 38.0, 35.0, 11.0, 9.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.3125, -40.91064453125, -39.5087890625, -38.10693359375, -36.705078125, -35.30322265625, -33.9013671875, -32.49951171875, -31.09765625, -29.69580078125, -28.2939453125, -26.89208984375, -25.490234375, -24.08837890625, -22.6865234375, -21.28466796875, -19.8828125, -18.48095703125, -17.0791015625, -15.67724609375, -14.275390625, -12.87353515625, -11.4716796875, -10.06982421875, -8.66796875, -7.26611328125, -5.8642578125, -4.46240234375, -3.060546875, -1.65869140625, -0.2568359375, 1.14501953125, 2.546875, 3.94873046875, 5.3505859375, 6.75244140625, 8.154296875, 9.55615234375, 10.9580078125, 12.35986328125, 13.76171875, 15.16357421875, 16.5654296875, 17.96728515625, 19.369140625, 20.77099609375, 22.1728515625, 23.57470703125, 24.9765625, 26.37841796875, 27.7802734375, 29.18212890625, 30.583984375, 31.98583984375, 33.3876953125, 34.78955078125, 36.19140625, 37.59326171875, 38.9951171875, 40.39697265625, 41.798828125, 43.20068359375, 44.6025390625, 46.00439453125, 47.40625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 5.0, 11.0, 9.0, 23.0, 30.0, 43.0, 98.0, 150.0, 330.0, 637.0, 1069.0, 782.0, 406.0, 187.0, 105.0, 71.0, 33.0, 27.0, 18.0, 12.0, 6.0, 7.0, 5.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.546875, -29.640625, -28.734375, -27.828125, -26.921875, -26.015625, -25.109375, -24.203125, -23.296875, -22.390625, -21.484375, -20.578125, -19.671875, -18.765625, -17.859375, -16.953125, -16.046875, -15.140625, -14.234375, -13.328125, -12.421875, -11.515625, -10.609375, -9.703125, -8.796875, -7.890625, -6.984375, -6.078125, -5.171875, -4.265625, -3.359375, -2.453125, -1.546875, -0.640625, 0.265625, 1.171875, 2.078125, 2.984375, 3.890625, 4.796875, 5.703125, 6.609375, 7.515625, 8.421875, 9.328125, 10.234375, 11.140625, 12.046875, 12.953125, 13.859375, 14.765625, 15.671875, 16.578125, 17.484375, 18.390625, 19.296875, 20.203125, 21.109375, 22.015625, 22.921875, 23.828125, 24.734375, 25.640625, 26.546875, 27.453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 10.0, 14.0, 24.0, 50.0, 99.0, 135.0, 175.0, 171.0, 108.0, 100.0, 48.0, 31.0, 13.0, 13.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.69384002685547, -91.04043579101562, -84.38702392578125, -77.7336196899414, -71.08020782470703, -64.42680358886719, -57.77339553833008, -51.11998748779297, -44.46657943725586, -37.81317138671875, -31.15976333618164, -24.506357192993164, -17.852949142456055, -11.199542999267578, -4.546134948730469, 2.1072731018066406, 8.76068115234375, 15.41408920288086, 22.06749725341797, 28.720903396606445, 35.37431335449219, 42.02771759033203, 48.68112564086914, 55.33453369140625, 61.98794174194336, 68.64134979248047, 75.29475402832031, 81.94816589355469, 88.60157012939453, 95.25497436523438, 101.90838623046875, 108.56179809570312, 115.21519470214844, 121.86859893798828, 128.52200317382812, 135.1754150390625, 141.82882690429688, 148.48223876953125, 155.13563537597656, 161.78904724121094, 168.4424591064453, 175.0958709716797, 181.749267578125, 188.40267944335938, 195.05609130859375, 201.70950317382812, 208.36289978027344, 215.0163116455078, 221.66970825195312, 228.3231201171875, 234.9765167236328, 241.6299285888672, 248.28334045410156, 254.93673706054688, 261.59014892578125, 268.2435607910156, 274.89697265625, 281.5503845214844, 288.20379638671875, 294.8572082519531, 301.5105895996094, 308.16400146484375, 314.8174133300781, 321.4708251953125, 328.1242370605469]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 3.0, 5.0, 11.0, 7.0, 10.0, 12.0, 19.0, 11.0, 20.0, 27.0, 22.0, 26.0, 35.0, 30.0, 48.0, 53.0, 46.0, 51.0, 52.0, 51.0, 50.0, 54.0, 52.0, 47.0, 36.0, 30.0, 40.0, 33.0, 21.0, 18.0, 21.0, 11.0, 10.0, 10.0, 11.0, 3.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-93.21646118164062, -90.42561340332031, -87.63475799560547, -84.84391021728516, -82.05305480957031, -79.26220703125, -76.47135162353516, -73.68050384521484, -70.8896484375, -68.09880065917969, -65.30794525146484, -62.517093658447266, -59.72624206542969, -56.93539047241211, -54.14453887939453, -51.35369110107422, -48.56283950805664, -45.77198791503906, -42.981136322021484, -40.190284729003906, -37.39943313598633, -34.60858154296875, -31.817731857299805, -29.026880264282227, -26.23602867126465, -23.44517707824707, -20.654325485229492, -17.863475799560547, -15.072623252868652, -12.281771659851074, -9.490921020507812, -6.700069427490234, -3.9092178344726562, -1.1183664798736572, 1.6724848747253418, 4.463335990905762, 7.25418758392334, 10.045039176940918, 12.83588981628418, 15.626741409301758, 18.417593002319336, 21.208444595336914, 23.999296188354492, 26.790145874023438, 29.580997467041016, 32.371849060058594, 35.16270065307617, 37.95355224609375, 40.74440383911133, 43.535255432128906, 46.326107025146484, 49.11695861816406, 51.90781021118164, 54.69866180419922, 57.48950958251953, 60.280364990234375, 63.07121276855469, 65.862060546875, 68.65291595458984, 71.44376373291016, 74.234619140625, 77.02546691894531, 79.81632232666016, 82.60717010498047, 85.39802551269531]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 10.0, 12.0, 18.0, 34.0, 40.0, 79.0, 121.0, 203.0, 396.0, 878.0, 2528.0, 9452.0, 55510.0, 521506.0, 403255.0, 43010.0, 7736.0, 2103.0, 817.0, 354.0, 200.0, 106.0, 75.0, 37.0, 23.0, 8.0, 8.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.765625, -25.927490234375, -25.08935546875, -24.251220703125, -23.4130859375, -22.574951171875, -21.73681640625, -20.898681640625, -20.060546875, -19.222412109375, -18.38427734375, -17.546142578125, -16.7080078125, -15.869873046875, -15.03173828125, -14.193603515625, -13.35546875, -12.517333984375, -11.67919921875, -10.841064453125, -10.0029296875, -9.164794921875, -8.32666015625, -7.488525390625, -6.650390625, -5.812255859375, -4.97412109375, -4.135986328125, -3.2978515625, -2.459716796875, -1.62158203125, -0.783447265625, 0.0546875, 0.892822265625, 1.73095703125, 2.569091796875, 3.4072265625, 4.245361328125, 5.08349609375, 5.921630859375, 6.759765625, 7.597900390625, 8.43603515625, 9.274169921875, 10.1123046875, 10.950439453125, 11.78857421875, 12.626708984375, 13.46484375, 14.302978515625, 15.14111328125, 15.979248046875, 16.8173828125, 17.655517578125, 18.49365234375, 19.331787109375, 20.169921875, 21.008056640625, 21.84619140625, 22.684326171875, 23.5224609375, 24.360595703125, 25.19873046875, 26.036865234375, 26.875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 11.0, 16.0, 12.0, 20.0, 24.0, 32.0, 46.0, 55.0, 63.0, 80.0, 75.0, 79.0, 68.0, 67.0, 72.0, 53.0, 47.0, 44.0, 29.0, 22.0, 24.0, 18.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.0234375, -11.5731201171875, -11.122802734375, -10.6724853515625, -10.22216796875, -9.7718505859375, -9.321533203125, -8.8712158203125, -8.4208984375, -7.9705810546875, -7.520263671875, -7.0699462890625, -6.61962890625, -6.1693115234375, -5.718994140625, -5.2686767578125, -4.818359375, -4.3680419921875, -3.917724609375, -3.4674072265625, -3.01708984375, -2.5667724609375, -2.116455078125, -1.6661376953125, -1.2158203125, -0.7655029296875, -0.315185546875, 0.1351318359375, 0.58544921875, 1.0357666015625, 1.486083984375, 1.9364013671875, 2.38671875, 2.8370361328125, 3.287353515625, 3.7376708984375, 4.18798828125, 4.6383056640625, 5.088623046875, 5.5389404296875, 5.9892578125, 6.4395751953125, 6.889892578125, 7.3402099609375, 7.79052734375, 8.2408447265625, 8.691162109375, 9.1414794921875, 9.591796875, 10.0421142578125, 10.492431640625, 10.9427490234375, 11.39306640625, 11.8433837890625, 12.293701171875, 12.7440185546875, 13.1943359375, 13.6446533203125, 14.094970703125, 14.5452880859375, 14.99560546875, 15.4459228515625, 15.896240234375, 16.3465576171875, 16.796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 18.0, 19.0, 40.0, 58.0, 102.0, 158.0, 277.0, 549.0, 1251.0, 3647.0, 14277.0, 93157.0, 778296.0, 131268.0, 18332.0, 4263.0, 1387.0, 610.0, 314.0, 193.0, 122.0, 74.0, 36.0, 30.0, 13.0, 12.0, 8.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-32.21875, -31.286865234375, -30.35498046875, -29.423095703125, -28.4912109375, -27.559326171875, -26.62744140625, -25.695556640625, -24.763671875, -23.831787109375, -22.89990234375, -21.968017578125, -21.0361328125, -20.104248046875, -19.17236328125, -18.240478515625, -17.30859375, -16.376708984375, -15.44482421875, -14.512939453125, -13.5810546875, -12.649169921875, -11.71728515625, -10.785400390625, -9.853515625, -8.921630859375, -7.98974609375, -7.057861328125, -6.1259765625, -5.194091796875, -4.26220703125, -3.330322265625, -2.3984375, -1.466552734375, -0.53466796875, 0.397216796875, 1.3291015625, 2.260986328125, 3.19287109375, 4.124755859375, 5.056640625, 5.988525390625, 6.92041015625, 7.852294921875, 8.7841796875, 9.716064453125, 10.64794921875, 11.579833984375, 12.51171875, 13.443603515625, 14.37548828125, 15.307373046875, 16.2392578125, 17.171142578125, 18.10302734375, 19.034912109375, 19.966796875, 20.898681640625, 21.83056640625, 22.762451171875, 23.6943359375, 24.626220703125, 25.55810546875, 26.489990234375, 27.421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 15.0, 11.0, 8.0, 8.0, 10.0, 9.0, 16.0, 32.0, 28.0, 30.0, 36.0, 45.0, 38.0, 47.0, 44.0, 40.0, 53.0, 55.0, 54.0, 52.0, 54.0, 43.0, 36.0, 36.0, 30.0, 24.0, 27.0, 24.0, 9.0, 15.0, 7.0, 13.0, 7.0, 4.0, 1.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.36181640625, -37.0673828125, -35.77294921875, -34.478515625, -33.18408203125, -31.8896484375, -30.59521484375, -29.30078125, -28.00634765625, -26.7119140625, -25.41748046875, -24.123046875, -22.82861328125, -21.5341796875, -20.23974609375, -18.9453125, -17.65087890625, -16.3564453125, -15.06201171875, -13.767578125, -12.47314453125, -11.1787109375, -9.88427734375, -8.58984375, -7.29541015625, -6.0009765625, -4.70654296875, -3.412109375, -2.11767578125, -0.8232421875, 0.47119140625, 1.765625, 3.06005859375, 4.3544921875, 5.64892578125, 6.943359375, 8.23779296875, 9.5322265625, 10.82666015625, 12.12109375, 13.41552734375, 14.7099609375, 16.00439453125, 17.298828125, 18.59326171875, 19.8876953125, 21.18212890625, 22.4765625, 23.77099609375, 25.0654296875, 26.35986328125, 27.654296875, 28.94873046875, 30.2431640625, 31.53759765625, 32.83203125, 34.12646484375, 35.4208984375, 36.71533203125, 38.009765625, 39.30419921875, 40.5986328125, 41.89306640625, 43.1875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 9.0, 12.0, 16.0, 22.0, 30.0, 33.0, 44.0, 68.0, 119.0, 207.0, 406.0, 759.0, 1730.0, 4103.0, 11456.0, 39091.0, 246939.0, 660375.0, 58147.0, 15368.0, 5313.0, 2155.0, 960.0, 532.0, 230.0, 141.0, 75.0, 51.0, 48.0, 19.0, 19.0, 19.0, 13.0, 7.0, 8.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.857177734375, -8.58154296875, -8.305908203125, -8.0302734375, -7.754638671875, -7.47900390625, -7.203369140625, -6.927734375, -6.652099609375, -6.37646484375, -6.100830078125, -5.8251953125, -5.549560546875, -5.27392578125, -4.998291015625, -4.72265625, -4.447021484375, -4.17138671875, -3.895751953125, -3.6201171875, -3.344482421875, -3.06884765625, -2.793212890625, -2.517578125, -2.241943359375, -1.96630859375, -1.690673828125, -1.4150390625, -1.139404296875, -0.86376953125, -0.588134765625, -0.3125, -0.036865234375, 0.23876953125, 0.514404296875, 0.7900390625, 1.065673828125, 1.34130859375, 1.616943359375, 1.892578125, 2.168212890625, 2.44384765625, 2.719482421875, 2.9951171875, 3.270751953125, 3.54638671875, 3.822021484375, 4.09765625, 4.373291015625, 4.64892578125, 4.924560546875, 5.2001953125, 5.475830078125, 5.75146484375, 6.027099609375, 6.302734375, 6.578369140625, 6.85400390625, 7.129638671875, 7.4052734375, 7.680908203125, 7.95654296875, 8.232177734375, 8.5078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 5.0, 12.0, 15.0, 32.0, 25.0, 41.0, 51.0, 104.0, 148.0, 148.0, 106.0, 78.0, 50.0, 26.0, 32.0, 22.0, 21.0, 9.0, 8.0, 7.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0025348663330078125, -0.0024645626544952393, -0.002394258975982666, -0.0023239552974700928, -0.0022536516189575195, -0.0021833479404449463, -0.002113044261932373, -0.0020427405834198, -0.0019724369049072266, -0.0019021332263946533, -0.00183182954788208, -0.0017615258693695068, -0.0016912221908569336, -0.0016209185123443604, -0.0015506148338317871, -0.0014803111553192139, -0.0014100074768066406, -0.0013397037982940674, -0.0012694001197814941, -0.001199096441268921, -0.0011287927627563477, -0.0010584890842437744, -0.0009881854057312012, -0.0009178817272186279, -0.0008475780487060547, -0.0007772743701934814, -0.0007069706916809082, -0.000636667013168335, -0.0005663633346557617, -0.0004960596561431885, -0.00042575597763061523, -0.000355452299118042, -0.00028514862060546875, -0.0002148449420928955, -0.00014454126358032227, -7.423758506774902e-05, -3.933906555175781e-06, 6.636977195739746e-05, 0.0001366734504699707, 0.00020697712898254395, 0.0002772808074951172, 0.00034758448600769043, 0.00041788816452026367, 0.0004881918430328369, 0.0005584955215454102, 0.0006287992000579834, 0.0006991028785705566, 0.0007694065570831299, 0.0008397102355957031, 0.0009100139141082764, 0.0009803175926208496, 0.0010506212711334229, 0.001120924949645996, 0.0011912286281585693, 0.0012615323066711426, 0.0013318359851837158, 0.001402139663696289, 0.0014724433422088623, 0.0015427470207214355, 0.0016130506992340088, 0.001683354377746582, 0.0017536580562591553, 0.0018239617347717285, 0.0018942654132843018, 0.001964569091796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 14.0, 19.0, 29.0, 51.0, 74.0, 117.0, 221.0, 350.0, 645.0, 1284.0, 2916.0, 7545.0, 25476.0, 134086.0, 757381.0, 88060.0, 19259.0, 6127.0, 2407.0, 1093.0, 556.0, 314.0, 192.0, 125.0, 75.0, 34.0, 34.0, 19.0, 12.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.765625, -9.4443359375, -9.123046875, -8.8017578125, -8.48046875, -8.1591796875, -7.837890625, -7.5166015625, -7.1953125, -6.8740234375, -6.552734375, -6.2314453125, -5.91015625, -5.5888671875, -5.267578125, -4.9462890625, -4.625, -4.3037109375, -3.982421875, -3.6611328125, -3.33984375, -3.0185546875, -2.697265625, -2.3759765625, -2.0546875, -1.7333984375, -1.412109375, -1.0908203125, -0.76953125, -0.4482421875, -0.126953125, 0.1943359375, 0.515625, 0.8369140625, 1.158203125, 1.4794921875, 1.80078125, 2.1220703125, 2.443359375, 2.7646484375, 3.0859375, 3.4072265625, 3.728515625, 4.0498046875, 4.37109375, 4.6923828125, 5.013671875, 5.3349609375, 5.65625, 5.9775390625, 6.298828125, 6.6201171875, 6.94140625, 7.2626953125, 7.583984375, 7.9052734375, 8.2265625, 8.5478515625, 8.869140625, 9.1904296875, 9.51171875, 9.8330078125, 10.154296875, 10.4755859375, 10.796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 3.0, 6.0, 11.0, 27.0, 16.0, 25.0, 30.0, 50.0, 79.0, 151.0, 190.0, 167.0, 60.0, 50.0, 28.0, 31.0, 19.0, 11.0, 15.0, 12.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.90625, -15.50341796875, -15.1005859375, -14.69775390625, -14.294921875, -13.89208984375, -13.4892578125, -13.08642578125, -12.68359375, -12.28076171875, -11.8779296875, -11.47509765625, -11.072265625, -10.66943359375, -10.2666015625, -9.86376953125, -9.4609375, -9.05810546875, -8.6552734375, -8.25244140625, -7.849609375, -7.44677734375, -7.0439453125, -6.64111328125, -6.23828125, -5.83544921875, -5.4326171875, -5.02978515625, -4.626953125, -4.22412109375, -3.8212890625, -3.41845703125, -3.015625, -2.61279296875, -2.2099609375, -1.80712890625, -1.404296875, -1.00146484375, -0.5986328125, -0.19580078125, 0.20703125, 0.60986328125, 1.0126953125, 1.41552734375, 1.818359375, 2.22119140625, 2.6240234375, 3.02685546875, 3.4296875, 3.83251953125, 4.2353515625, 4.63818359375, 5.041015625, 5.44384765625, 5.8466796875, 6.24951171875, 6.65234375, 7.05517578125, 7.4580078125, 7.86083984375, 8.263671875, 8.66650390625, 9.0693359375, 9.47216796875, 9.875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 18.0, 53.0, 243.0, 498.0, 133.0, 24.0, 12.0, 11.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-339.7746276855469, -324.47076416015625, -309.1669006347656, -293.863037109375, -278.5591735839844, -263.25531005859375, -247.95144653320312, -232.6475830078125, -217.34371948242188, -202.03985595703125, -186.73599243164062, -171.43212890625, -156.12826538085938, -140.82440185546875, -125.52053833007812, -110.2166748046875, -94.91281127929688, -79.60894775390625, -64.30508422851562, -49.001220703125, -33.697357177734375, -18.39349365234375, -3.089630126953125, 12.2142333984375, 27.518096923828125, 42.82196044921875, 58.125823974609375, 73.4296875, 88.73355102539062, 104.03741455078125, 119.34127807617188, 134.6451416015625, 149.948974609375, 165.25283813476562, 180.55670166015625, 195.86056518554688, 211.1644287109375, 226.46829223632812, 241.77215576171875, 257.0760192871094, 272.3798828125, 287.6837463378906, 302.98760986328125, 318.2914733886719, 333.5953369140625, 348.8992004394531, 364.20306396484375, 379.5069274902344, 394.810791015625, 410.1146545410156, 425.41851806640625, 440.7223815917969, 456.0262451171875, 471.3301086425781, 486.63397216796875, 501.9378356933594, 517.24169921875, 532.5455322265625, 547.8494262695312, 563.1533203125, 578.4571533203125, 593.760986328125, 609.0648803710938, 624.3687744140625, 639.672607421875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 4.0, 9.0, 12.0, 9.0, 8.0, 21.0, 13.0, 20.0, 10.0, 27.0, 29.0, 31.0, 37.0, 37.0, 56.0, 75.0, 92.0, 100.0, 72.0, 52.0, 38.0, 32.0, 25.0, 28.0, 29.0, 12.0, 18.0, 19.0, 12.0, 6.0, 11.0, 12.0, 8.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.70608520507812, -172.8904266357422, -167.07476806640625, -161.25912475585938, -155.44346618652344, -149.6278076171875, -143.81214904785156, -137.99649047851562, -132.18084716796875, -126.36518859863281, -120.5495376586914, -114.73387908935547, -108.91822814941406, -103.10256958007812, -97.28691101074219, -91.47125244140625, -85.65559387207031, -79.83993530273438, -74.02428436279297, -68.20862579345703, -62.39297103881836, -56.57731628417969, -50.76165771484375, -44.94600296020508, -39.130348205566406, -33.314693450927734, -27.49903678894043, -21.683380126953125, -15.867725372314453, -10.052070617675781, -4.236412048339844, 1.5792427062988281, 7.3948974609375, 13.210553169250488, 19.026208877563477, 24.84186553955078, 30.657520294189453, 36.473175048828125, 42.28883361816406, 48.104488372802734, 53.920143127441406, 59.73579788208008, 65.55145263671875, 71.36711120605469, 77.18276977539062, 82.99842071533203, 88.81407928466797, 94.62973022460938, 100.44538879394531, 106.26104736328125, 112.07669830322266, 117.8923568725586, 123.7080078125, 129.52366638183594, 135.33932495117188, 141.1549835205078, 146.97064208984375, 152.7863006591797, 158.60195922851562, 164.4176025390625, 170.23326110839844, 176.04891967773438, 181.8645782470703, 187.68023681640625, 193.49588012695312]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 8.0, 4.0, 8.0, 13.0, 21.0, 35.0, 33.0, 71.0, 179.0, 438.0, 1294.0, 4439.0, 24483.0, 838811.0, 3240212.0, 73649.0, 7989.0, 1750.0, 446.0, 161.0, 65.0, 40.0, 44.0, 22.0, 18.0, 14.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.421875, -23.524169921875, -22.62646484375, -21.728759765625, -20.8310546875, -19.933349609375, -19.03564453125, -18.137939453125, -17.240234375, -16.342529296875, -15.44482421875, -14.547119140625, -13.6494140625, -12.751708984375, -11.85400390625, -10.956298828125, -10.05859375, -9.160888671875, -8.26318359375, -7.365478515625, -6.4677734375, -5.570068359375, -4.67236328125, -3.774658203125, -2.876953125, -1.979248046875, -1.08154296875, -0.183837890625, 0.7138671875, 1.611572265625, 2.50927734375, 3.406982421875, 4.3046875, 5.202392578125, 6.10009765625, 6.997802734375, 7.8955078125, 8.793212890625, 9.69091796875, 10.588623046875, 11.486328125, 12.384033203125, 13.28173828125, 14.179443359375, 15.0771484375, 15.974853515625, 16.87255859375, 17.770263671875, 18.66796875, 19.565673828125, 20.46337890625, 21.361083984375, 22.2587890625, 23.156494140625, 24.05419921875, 24.951904296875, 25.849609375, 26.747314453125, 27.64501953125, 28.542724609375, 29.4404296875, 30.338134765625, 31.23583984375, 32.133544921875, 33.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 11.0, 16.0, 17.0, 17.0, 31.0, 34.0, 45.0, 51.0, 74.0, 83.0, 80.0, 71.0, 64.0, 74.0, 68.0, 56.0, 40.0, 38.0, 33.0, 26.0, 17.0, 20.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.75, -14.3111572265625, -13.872314453125, -13.4334716796875, -12.99462890625, -12.5557861328125, -12.116943359375, -11.6781005859375, -11.2392578125, -10.8004150390625, -10.361572265625, -9.9227294921875, -9.48388671875, -9.0450439453125, -8.606201171875, -8.1673583984375, -7.728515625, -7.2896728515625, -6.850830078125, -6.4119873046875, -5.97314453125, -5.5343017578125, -5.095458984375, -4.6566162109375, -4.2177734375, -3.7789306640625, -3.340087890625, -2.9012451171875, -2.46240234375, -2.0235595703125, -1.584716796875, -1.1458740234375, -0.70703125, -0.2681884765625, 0.170654296875, 0.6094970703125, 1.04833984375, 1.4871826171875, 1.926025390625, 2.3648681640625, 2.8037109375, 3.2425537109375, 3.681396484375, 4.1202392578125, 4.55908203125, 4.9979248046875, 5.436767578125, 5.8756103515625, 6.314453125, 6.7532958984375, 7.192138671875, 7.6309814453125, 8.06982421875, 8.5086669921875, 8.947509765625, 9.3863525390625, 9.8251953125, 10.2640380859375, 10.702880859375, 11.1417236328125, 11.58056640625, 12.0194091796875, 12.458251953125, 12.8970947265625, 13.3359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 13.0, 13.0, 27.0, 33.0, 60.0, 153.0, 353.0, 1038.0, 5427.0, 114164.0, 3999357.0, 67859.0, 4263.0, 891.0, 294.0, 137.0, 86.0, 47.0, 19.0, 20.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -45.365234375, -43.82421875, -42.283203125, -40.7421875, -39.201171875, -37.66015625, -36.119140625, -34.578125, -33.037109375, -31.49609375, -29.955078125, -28.4140625, -26.873046875, -25.33203125, -23.791015625, -22.25, -20.708984375, -19.16796875, -17.626953125, -16.0859375, -14.544921875, -13.00390625, -11.462890625, -9.921875, -8.380859375, -6.83984375, -5.298828125, -3.7578125, -2.216796875, -0.67578125, 0.865234375, 2.40625, 3.947265625, 5.48828125, 7.029296875, 8.5703125, 10.111328125, 11.65234375, 13.193359375, 14.734375, 16.275390625, 17.81640625, 19.357421875, 20.8984375, 22.439453125, 23.98046875, 25.521484375, 27.0625, 28.603515625, 30.14453125, 31.685546875, 33.2265625, 34.767578125, 36.30859375, 37.849609375, 39.390625, 40.931640625, 42.47265625, 44.013671875, 45.5546875, 47.095703125, 48.63671875, 50.177734375, 51.71875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 4.0, 13.0, 20.0, 26.0, 33.0, 44.0, 70.0, 127.0, 209.0, 420.0, 745.0, 883.0, 625.0, 361.0, 212.0, 101.0, 64.0, 30.0, 29.0, 15.0, 7.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.4375, -20.623291015625, -19.80908203125, -18.994873046875, -18.1806640625, -17.366455078125, -16.55224609375, -15.738037109375, -14.923828125, -14.109619140625, -13.29541015625, -12.481201171875, -11.6669921875, -10.852783203125, -10.03857421875, -9.224365234375, -8.41015625, -7.595947265625, -6.78173828125, -5.967529296875, -5.1533203125, -4.339111328125, -3.52490234375, -2.710693359375, -1.896484375, -1.082275390625, -0.26806640625, 0.546142578125, 1.3603515625, 2.174560546875, 2.98876953125, 3.802978515625, 4.6171875, 5.431396484375, 6.24560546875, 7.059814453125, 7.8740234375, 8.688232421875, 9.50244140625, 10.316650390625, 11.130859375, 11.945068359375, 12.75927734375, 13.573486328125, 14.3876953125, 15.201904296875, 16.01611328125, 16.830322265625, 17.64453125, 18.458740234375, 19.27294921875, 20.087158203125, 20.9013671875, 21.715576171875, 22.52978515625, 23.343994140625, 24.158203125, 24.972412109375, 25.78662109375, 26.600830078125, 27.4150390625, 28.229248046875, 29.04345703125, 29.857666015625, 30.671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 12.0, 16.0, 39.0, 67.0, 104.0, 141.0, 160.0, 161.0, 94.0, 91.0, 44.0, 23.0, 14.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-137.1199951171875, -131.57003784179688, -126.02008819580078, -120.47013854980469, -114.92018127441406, -109.37023162841797, -103.82028198242188, -98.27032470703125, -92.72036743164062, -87.17041778564453, -81.6204605102539, -76.07051086425781, -70.52055358886719, -64.9706039428711, -59.420650482177734, -53.870697021484375, -48.32074737548828, -42.77079391479492, -37.22084045410156, -31.670888900756836, -26.120935440063477, -20.570981979370117, -15.02103042602539, -9.471076965332031, -3.921123504638672, 1.6288294792175293, 7.1787824630737305, 12.728734970092773, 18.278688430786133, 23.828641891479492, 29.37859344482422, 34.92854690551758, 40.47850036621094, 46.0284538269043, 51.578407287597656, 57.12835693359375, 62.678314208984375, 68.22826385498047, 73.77821350097656, 79.32817077636719, 84.87812805175781, 90.4280776977539, 95.97803497314453, 101.52798461914062, 107.07794189453125, 112.62789154052734, 118.17784118652344, 123.72779846191406, 129.27774047851562, 134.82769775390625, 140.3776397705078, 145.92759704589844, 151.47755432128906, 157.0275115966797, 162.57745361328125, 168.12741088867188, 173.6773681640625, 179.22732543945312, 184.7772674560547, 190.3272247314453, 195.87718200683594, 201.42713928222656, 206.97708129882812, 212.52703857421875, 218.07699584960938]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 15.0, 12.0, 20.0, 20.0, 26.0, 24.0, 30.0, 39.0, 38.0, 65.0, 63.0, 48.0, 64.0, 53.0, 63.0, 53.0, 56.0, 44.0, 42.0, 43.0, 39.0, 23.0, 21.0, 14.0, 16.0, 10.0, 10.0, 15.0, 5.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.61149597167969, -110.34532165527344, -107.07914733886719, -103.81297302246094, -100.54679870605469, -97.28062438964844, -94.01445007324219, -90.74827575683594, -87.48210144042969, -84.21592712402344, -80.94975280761719, -77.68357849121094, -74.41740417480469, -71.15122985839844, -67.88505554199219, -64.61888122558594, -61.352699279785156, -58.086524963378906, -54.820350646972656, -51.554176330566406, -48.288002014160156, -45.021827697753906, -41.75564956665039, -38.48947525024414, -35.22330093383789, -31.95712661743164, -28.69095230102539, -25.424776077270508, -22.158601760864258, -18.892427444458008, -15.626251220703125, -12.360076904296875, -9.093910217285156, -5.827735424041748, -2.56156063079834, 0.7046146392822266, 3.9707889556884766, 7.236963272094727, 10.50313949584961, 13.76931381225586, 17.03548812866211, 20.30166244506836, 23.56783676147461, 26.834012985229492, 30.100187301635742, 33.366363525390625, 36.632537841796875, 39.898712158203125, 43.164886474609375, 46.431060791015625, 49.697235107421875, 52.963409423828125, 56.229583740234375, 59.495758056640625, 62.76193618774414, 66.02810668945312, 69.29428100585938, 72.56045532226562, 75.82662963867188, 79.09280395507812, 82.35897827148438, 85.62515258789062, 88.89132690429688, 92.15750122070312, 95.4236831665039]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 17.0, 14.0, 15.0, 40.0, 39.0, 69.0, 120.0, 179.0, 356.0, 804.0, 1836.0, 5163.0, 16270.0, 65178.0, 337753.0, 490173.0, 96204.0, 23137.0, 6836.0, 2291.0, 996.0, 435.0, 258.0, 134.0, 80.0, 39.0, 32.0, 22.0, 15.0, 10.0, 10.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.15625, -20.497802734375, -19.83935546875, -19.180908203125, -18.5224609375, -17.864013671875, -17.20556640625, -16.547119140625, -15.888671875, -15.230224609375, -14.57177734375, -13.913330078125, -13.2548828125, -12.596435546875, -11.93798828125, -11.279541015625, -10.62109375, -9.962646484375, -9.30419921875, -8.645751953125, -7.9873046875, -7.328857421875, -6.67041015625, -6.011962890625, -5.353515625, -4.695068359375, -4.03662109375, -3.378173828125, -2.7197265625, -2.061279296875, -1.40283203125, -0.744384765625, -0.0859375, 0.572509765625, 1.23095703125, 1.889404296875, 2.5478515625, 3.206298828125, 3.86474609375, 4.523193359375, 5.181640625, 5.840087890625, 6.49853515625, 7.156982421875, 7.8154296875, 8.473876953125, 9.13232421875, 9.790771484375, 10.44921875, 11.107666015625, 11.76611328125, 12.424560546875, 13.0830078125, 13.741455078125, 14.39990234375, 15.058349609375, 15.716796875, 16.375244140625, 17.03369140625, 17.692138671875, 18.3505859375, 19.009033203125, 19.66748046875, 20.325927734375, 20.984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 9.0, 11.0, 24.0, 31.0, 25.0, 49.0, 54.0, 46.0, 55.0, 59.0, 79.0, 89.0, 73.0, 79.0, 66.0, 53.0, 49.0, 34.0, 36.0, 27.0, 17.0, 12.0, 9.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.442138671875, -9.97802734375, -9.513916015625, -9.0498046875, -8.585693359375, -8.12158203125, -7.657470703125, -7.193359375, -6.729248046875, -6.26513671875, -5.801025390625, -5.3369140625, -4.872802734375, -4.40869140625, -3.944580078125, -3.48046875, -3.016357421875, -2.55224609375, -2.088134765625, -1.6240234375, -1.159912109375, -0.69580078125, -0.231689453125, 0.232421875, 0.696533203125, 1.16064453125, 1.624755859375, 2.0888671875, 2.552978515625, 3.01708984375, 3.481201171875, 3.9453125, 4.409423828125, 4.87353515625, 5.337646484375, 5.8017578125, 6.265869140625, 6.72998046875, 7.194091796875, 7.658203125, 8.122314453125, 8.58642578125, 9.050537109375, 9.5146484375, 9.978759765625, 10.44287109375, 10.906982421875, 11.37109375, 11.835205078125, 12.29931640625, 12.763427734375, 13.2275390625, 13.691650390625, 14.15576171875, 14.619873046875, 15.083984375, 15.548095703125, 16.01220703125, 16.476318359375, 16.9404296875, 17.404541015625, 17.86865234375, 18.332763671875, 18.796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 7.0, 12.0, 18.0, 23.0, 33.0, 49.0, 88.0, 112.0, 200.0, 357.0, 739.0, 1593.0, 4715.0, 23590.0, 319944.0, 660047.0, 28420.0, 5208.0, 1681.0, 723.0, 410.0, 208.0, 113.0, 82.0, 57.0, 37.0, 19.0, 18.0, 8.0, 13.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.46875, -40.349365234375, -39.22998046875, -38.110595703125, -36.9912109375, -35.871826171875, -34.75244140625, -33.633056640625, -32.513671875, -31.394287109375, -30.27490234375, -29.155517578125, -28.0361328125, -26.916748046875, -25.79736328125, -24.677978515625, -23.55859375, -22.439208984375, -21.31982421875, -20.200439453125, -19.0810546875, -17.961669921875, -16.84228515625, -15.722900390625, -14.603515625, -13.484130859375, -12.36474609375, -11.245361328125, -10.1259765625, -9.006591796875, -7.88720703125, -6.767822265625, -5.6484375, -4.529052734375, -3.40966796875, -2.290283203125, -1.1708984375, -0.051513671875, 1.06787109375, 2.187255859375, 3.306640625, 4.426025390625, 5.54541015625, 6.664794921875, 7.7841796875, 8.903564453125, 10.02294921875, 11.142333984375, 12.26171875, 13.381103515625, 14.50048828125, 15.619873046875, 16.7392578125, 17.858642578125, 18.97802734375, 20.097412109375, 21.216796875, 22.336181640625, 23.45556640625, 24.574951171875, 25.6943359375, 26.813720703125, 27.93310546875, 29.052490234375, 30.171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 8.0, 17.0, 21.0, 21.0, 21.0, 55.0, 46.0, 73.0, 80.0, 99.0, 122.0, 90.0, 96.0, 65.0, 53.0, 42.0, 34.0, 22.0, 6.0, 8.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.1875, -76.03369140625, -73.8798828125, -71.72607421875, -69.572265625, -67.41845703125, -65.2646484375, -63.11083984375, -60.95703125, -58.80322265625, -56.6494140625, -54.49560546875, -52.341796875, -50.18798828125, -48.0341796875, -45.88037109375, -43.7265625, -41.57275390625, -39.4189453125, -37.26513671875, -35.111328125, -32.95751953125, -30.8037109375, -28.64990234375, -26.49609375, -24.34228515625, -22.1884765625, -20.03466796875, -17.880859375, -15.72705078125, -13.5732421875, -11.41943359375, -9.265625, -7.11181640625, -4.9580078125, -2.80419921875, -0.650390625, 1.50341796875, 3.6572265625, 5.81103515625, 7.96484375, 10.11865234375, 12.2724609375, 14.42626953125, 16.580078125, 18.73388671875, 20.8876953125, 23.04150390625, 25.1953125, 27.34912109375, 29.5029296875, 31.65673828125, 33.810546875, 35.96435546875, 38.1181640625, 40.27197265625, 42.42578125, 44.57958984375, 46.7333984375, 48.88720703125, 51.041015625, 53.19482421875, 55.3486328125, 57.50244140625, 59.65625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 1.0, 5.0, 2.0, 7.0, 12.0, 12.0, 36.0, 43.0, 67.0, 133.0, 246.0, 548.0, 1609.0, 5696.0, 33119.0, 801009.0, 183635.0, 17015.0, 3532.0, 1045.0, 363.0, 195.0, 92.0, 60.0, 24.0, 14.0, 14.0, 7.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.191162109375, -17.60107421875, -17.010986328125, -16.4208984375, -15.830810546875, -15.24072265625, -14.650634765625, -14.060546875, -13.470458984375, -12.88037109375, -12.290283203125, -11.7001953125, -11.110107421875, -10.52001953125, -9.929931640625, -9.33984375, -8.749755859375, -8.15966796875, -7.569580078125, -6.9794921875, -6.389404296875, -5.79931640625, -5.209228515625, -4.619140625, -4.029052734375, -3.43896484375, -2.848876953125, -2.2587890625, -1.668701171875, -1.07861328125, -0.488525390625, 0.1015625, 0.691650390625, 1.28173828125, 1.871826171875, 2.4619140625, 3.052001953125, 3.64208984375, 4.232177734375, 4.822265625, 5.412353515625, 6.00244140625, 6.592529296875, 7.1826171875, 7.772705078125, 8.36279296875, 8.952880859375, 9.54296875, 10.133056640625, 10.72314453125, 11.313232421875, 11.9033203125, 12.493408203125, 13.08349609375, 13.673583984375, 14.263671875, 14.853759765625, 15.44384765625, 16.033935546875, 16.6240234375, 17.214111328125, 17.80419921875, 18.394287109375, 18.984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 9.0, 10.0, 21.0, 29.0, 45.0, 101.0, 175.0, 221.0, 138.0, 87.0, 37.0, 28.0, 20.0, 12.0, 10.0, 9.0, 7.0, 3.0, 6.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004230499267578125, -0.004075527191162109, -0.003920555114746094, -0.003765583038330078, -0.0036106109619140625, -0.003455638885498047, -0.0033006668090820312, -0.0031456947326660156, -0.00299072265625, -0.0028357505798339844, -0.0026807785034179688, -0.002525806427001953, -0.0023708343505859375, -0.002215862274169922, -0.0020608901977539062, -0.0019059181213378906, -0.001750946044921875, -0.0015959739685058594, -0.0014410018920898438, -0.0012860298156738281, -0.0011310577392578125, -0.0009760856628417969, -0.0008211135864257812, -0.0006661415100097656, -0.00051116943359375, -0.0003561973571777344, -0.00020122528076171875, -4.6253204345703125e-05, 0.0001087188720703125, 0.0002636909484863281, 0.00041866302490234375, 0.0005736351013183594, 0.000728607177734375, 0.0008835792541503906, 0.0010385513305664062, 0.0011935234069824219, 0.0013484954833984375, 0.0015034675598144531, 0.0016584396362304688, 0.0018134117126464844, 0.0019683837890625, 0.0021233558654785156, 0.0022783279418945312, 0.002433300018310547, 0.0025882720947265625, 0.002743244171142578, 0.0028982162475585938, 0.0030531883239746094, 0.003208160400390625, 0.0033631324768066406, 0.0035181045532226562, 0.003673076629638672, 0.0038280487060546875, 0.003983020782470703, 0.004137992858886719, 0.004292964935302734, 0.00444793701171875, 0.004602909088134766, 0.004757881164550781, 0.004912853240966797, 0.0050678253173828125, 0.005222797393798828, 0.005377769470214844, 0.005532741546630859, 0.005687713623046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 11.0, 9.0, 16.0, 28.0, 34.0, 69.0, 113.0, 224.0, 421.0, 990.0, 2774.0, 10157.0, 56963.0, 804121.0, 146354.0, 18847.0, 4607.0, 1543.0, 597.0, 278.0, 163.0, 82.0, 45.0, 29.0, 21.0, 12.0, 9.0, 4.0, 11.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.083251953125, -12.62744140625, -12.171630859375, -11.7158203125, -11.260009765625, -10.80419921875, -10.348388671875, -9.892578125, -9.436767578125, -8.98095703125, -8.525146484375, -8.0693359375, -7.613525390625, -7.15771484375, -6.701904296875, -6.24609375, -5.790283203125, -5.33447265625, -4.878662109375, -4.4228515625, -3.967041015625, -3.51123046875, -3.055419921875, -2.599609375, -2.143798828125, -1.68798828125, -1.232177734375, -0.7763671875, -0.320556640625, 0.13525390625, 0.591064453125, 1.046875, 1.502685546875, 1.95849609375, 2.414306640625, 2.8701171875, 3.325927734375, 3.78173828125, 4.237548828125, 4.693359375, 5.149169921875, 5.60498046875, 6.060791015625, 6.5166015625, 6.972412109375, 7.42822265625, 7.884033203125, 8.33984375, 8.795654296875, 9.25146484375, 9.707275390625, 10.1630859375, 10.618896484375, 11.07470703125, 11.530517578125, 11.986328125, 12.442138671875, 12.89794921875, 13.353759765625, 13.8095703125, 14.265380859375, 14.72119140625, 15.177001953125, 15.6328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 1.0, 8.0, 10.0, 11.0, 17.0, 21.0, 23.0, 25.0, 32.0, 46.0, 57.0, 61.0, 79.0, 109.0, 109.0, 52.0, 57.0, 37.0, 45.0, 21.0, 22.0, 23.0, 20.0, 15.0, 12.0, 9.0, 6.0, 12.0, 12.0, 8.0, 10.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.57421875, -7.3431396484375, -7.112060546875, -6.8809814453125, -6.64990234375, -6.4188232421875, -6.187744140625, -5.9566650390625, -5.7255859375, -5.4945068359375, -5.263427734375, -5.0323486328125, -4.80126953125, -4.5701904296875, -4.339111328125, -4.1080322265625, -3.876953125, -3.6458740234375, -3.414794921875, -3.1837158203125, -2.95263671875, -2.7215576171875, -2.490478515625, -2.2593994140625, -2.0283203125, -1.7972412109375, -1.566162109375, -1.3350830078125, -1.10400390625, -0.8729248046875, -0.641845703125, -0.4107666015625, -0.1796875, 0.0513916015625, 0.282470703125, 0.5135498046875, 0.74462890625, 0.9757080078125, 1.206787109375, 1.4378662109375, 1.6689453125, 1.9000244140625, 2.131103515625, 2.3621826171875, 2.59326171875, 2.8243408203125, 3.055419921875, 3.2864990234375, 3.517578125, 3.7486572265625, 3.979736328125, 4.2108154296875, 4.44189453125, 4.6729736328125, 4.904052734375, 5.1351318359375, 5.3662109375, 5.5972900390625, 5.828369140625, 6.0594482421875, 6.29052734375, 6.5216064453125, 6.752685546875, 6.9837646484375, 7.21484375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 7.0, 21.0, 51.0, 184.0, 544.0, 121.0, 39.0, 11.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-736.0587768554688, -717.9351196289062, -699.8115234375, -681.6878662109375, -663.564208984375, -645.4405517578125, -627.3169555664062, -609.1932983398438, -591.0697021484375, -572.946044921875, -554.8224487304688, -536.6987915039062, -518.5751342773438, -500.4515075683594, -482.327880859375, -464.2042236328125, -446.08056640625, -427.9569396972656, -409.8332824707031, -391.70965576171875, -373.58599853515625, -355.4623718261719, -337.3387451171875, -319.215087890625, -301.0914611816406, -282.96783447265625, -264.84417724609375, -246.72055053710938, -228.59690856933594, -210.4732666015625, -192.34963989257812, -174.2259979248047, -156.102294921875, -137.97865295410156, -119.85501861572266, -101.73138427734375, -83.60774230957031, -65.48410034179688, -47.36046600341797, -29.236831665039062, -11.113189697265625, 7.010448455810547, 25.13408660888672, 43.25772476196289, 61.38136291503906, 79.5050048828125, 97.6286392211914, 115.75227355957031, 133.87591552734375, 151.9995574951172, 170.12319946289062, 188.246826171875, 206.37046813964844, 224.49411010742188, 242.61773681640625, 260.74139404296875, 278.8650207519531, 296.9886474609375, 315.1123046875, 333.2359313964844, 351.35955810546875, 369.48321533203125, 387.6068420410156, 405.73046875, 423.8541259765625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 10.0, 11.0, 13.0, 25.0, 30.0, 30.0, 25.0, 49.0, 36.0, 38.0, 102.0, 200.0, 97.0, 63.0, 55.0, 33.0, 30.0, 26.0, 22.0, 25.0, 18.0, 6.0, 15.0, 7.0, 4.0, 4.0, 8.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.8546142578125, -265.7618713378906, -258.6691589355469, -251.57643127441406, -244.48370361328125, -237.39096069335938, -230.29823303222656, -223.20550537109375, -216.11277770996094, -209.02005004882812, -201.9273223876953, -194.8345947265625, -187.74185180664062, -180.64913940429688, -173.556396484375, -166.4636688232422, -159.37094116210938, -152.27821350097656, -145.18548583984375, -138.09275817871094, -131.00003051757812, -123.90729522705078, -116.81455993652344, -109.72183227539062, -102.62910461425781, -95.536376953125, -88.44364929199219, -81.35091400146484, -74.25818634033203, -67.16545867919922, -60.07272720336914, -52.97999572753906, -45.88728332519531, -38.7945556640625, -31.701824188232422, -24.609094619750977, -17.51636505126953, -10.423637390136719, -3.3309059143066406, 3.7618255615234375, 10.85455322265625, 17.947282791137695, 25.04001235961914, 32.13274383544922, 39.22547149658203, 46.318199157714844, 53.41093063354492, 60.503662109375, 67.59638977050781, 74.68911743164062, 81.78184509277344, 88.87458038330078, 95.9673080444336, 103.0600357055664, 110.15277099609375, 117.24549865722656, 124.33822631835938, 131.4309539794922, 138.523681640625, 145.6164093017578, 152.70913696289062, 159.8018798828125, 166.8946075439453, 173.98733520507812, 181.08006286621094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 13.0, 18.0, 36.0, 49.0, 74.0, 167.0, 368.0, 817.0, 2321.0, 9054.0, 73965.0, 2395832.0, 1648251.0, 51876.0, 7869.0, 2227.0, 724.0, 277.0, 146.0, 63.0, 47.0, 19.0, 7.0, 10.0, 9.0, 12.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-50.53125, -49.2333984375, -47.935546875, -46.6376953125, -45.33984375, -44.0419921875, -42.744140625, -41.4462890625, -40.1484375, -38.8505859375, -37.552734375, -36.2548828125, -34.95703125, -33.6591796875, -32.361328125, -31.0634765625, -29.765625, -28.4677734375, -27.169921875, -25.8720703125, -24.57421875, -23.2763671875, -21.978515625, -20.6806640625, -19.3828125, -18.0849609375, -16.787109375, -15.4892578125, -14.19140625, -12.8935546875, -11.595703125, -10.2978515625, -9.0, -7.7021484375, -6.404296875, -5.1064453125, -3.80859375, -2.5107421875, -1.212890625, 0.0849609375, 1.3828125, 2.6806640625, 3.978515625, 5.2763671875, 6.57421875, 7.8720703125, 9.169921875, 10.4677734375, 11.765625, 13.0634765625, 14.361328125, 15.6591796875, 16.95703125, 18.2548828125, 19.552734375, 20.8505859375, 22.1484375, 23.4462890625, 24.744140625, 26.0419921875, 27.33984375, 28.6376953125, 29.935546875, 31.2333984375, 32.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 16.0, 18.0, 28.0, 37.0, 66.0, 89.0, 104.0, 91.0, 96.0, 83.0, 91.0, 67.0, 73.0, 40.0, 38.0, 27.0, 19.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.78125, -28.163330078125, -27.54541015625, -26.927490234375, -26.3095703125, -25.691650390625, -25.07373046875, -24.455810546875, -23.837890625, -23.219970703125, -22.60205078125, -21.984130859375, -21.3662109375, -20.748291015625, -20.13037109375, -19.512451171875, -18.89453125, -18.276611328125, -17.65869140625, -17.040771484375, -16.4228515625, -15.804931640625, -15.18701171875, -14.569091796875, -13.951171875, -13.333251953125, -12.71533203125, -12.097412109375, -11.4794921875, -10.861572265625, -10.24365234375, -9.625732421875, -9.0078125, -8.389892578125, -7.77197265625, -7.154052734375, -6.5361328125, -5.918212890625, -5.30029296875, -4.682373046875, -4.064453125, -3.446533203125, -2.82861328125, -2.210693359375, -1.5927734375, -0.974853515625, -0.35693359375, 0.260986328125, 0.87890625, 1.496826171875, 2.11474609375, 2.732666015625, 3.3505859375, 3.968505859375, 4.58642578125, 5.204345703125, 5.822265625, 6.440185546875, 7.05810546875, 7.676025390625, 8.2939453125, 8.911865234375, 9.52978515625, 10.147705078125, 10.765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 10.0, 14.0, 33.0, 66.0, 175.0, 479.0, 2204.0, 815941.0, 3371952.0, 2639.0, 519.0, 139.0, 54.0, 16.0, 12.0, 11.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-209.5, -202.75, -196.0, -189.25, -182.5, -175.75, -169.0, -162.25, -155.5, -148.75, -142.0, -135.25, -128.5, -121.75, -115.0, -108.25, -101.5, -94.75, -88.0, -81.25, -74.5, -67.75, -61.0, -54.25, -47.5, -40.75, -34.0, -27.25, -20.5, -13.75, -7.0, -0.25, 6.5, 13.25, 20.0, 26.75, 33.5, 40.25, 47.0, 53.75, 60.5, 67.25, 74.0, 80.75, 87.5, 94.25, 101.0, 107.75, 114.5, 121.25, 128.0, 134.75, 141.5, 148.25, 155.0, 161.75, 168.5, 175.25, 182.0, 188.75, 195.5, 202.25, 209.0, 215.75, 222.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 9.0, 11.0, 40.0, 103.0, 286.0, 791.0, 1611.0, 820.0, 269.0, 88.0, 31.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.625, -138.294921875, -134.96484375, -131.634765625, -128.3046875, -124.974609375, -121.64453125, -118.314453125, -114.984375, -111.654296875, -108.32421875, -104.994140625, -101.6640625, -98.333984375, -95.00390625, -91.673828125, -88.34375, -85.013671875, -81.68359375, -78.353515625, -75.0234375, -71.693359375, -68.36328125, -65.033203125, -61.703125, -58.373046875, -55.04296875, -51.712890625, -48.3828125, -45.052734375, -41.72265625, -38.392578125, -35.0625, -31.732421875, -28.40234375, -25.072265625, -21.7421875, -18.412109375, -15.08203125, -11.751953125, -8.421875, -5.091796875, -1.76171875, 1.568359375, 4.8984375, 8.228515625, 11.55859375, 14.888671875, 18.21875, 21.548828125, 24.87890625, 28.208984375, 31.5390625, 34.869140625, 38.19921875, 41.529296875, 44.859375, 48.189453125, 51.51953125, 54.849609375, 58.1796875, 61.509765625, 64.83984375, 68.169921875, 71.5]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 1.0, 10.0, 19.0, 48.0, 181.0, 409.0, 227.0, 62.0, 26.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1769.67041015625, -1735.419189453125, -1701.16796875, -1666.916748046875, -1632.66552734375, -1598.414306640625, -1564.1630859375, -1529.911865234375, -1495.66064453125, -1461.409423828125, -1427.158203125, -1392.906982421875, -1358.65576171875, -1324.404541015625, -1290.1533203125, -1255.902099609375, -1221.65087890625, -1187.399658203125, -1153.1484375, -1118.897216796875, -1084.64599609375, -1050.394775390625, -1016.1435546875, -981.892333984375, -947.6412353515625, -913.3900146484375, -879.1387939453125, -844.8875732421875, -810.6363525390625, -776.3851318359375, -742.1339111328125, -707.8826904296875, -673.6314697265625, -639.3802490234375, -605.1290283203125, -570.8778076171875, -536.6265869140625, -502.3753662109375, -468.1241760253906, -433.8729553222656, -399.6217346191406, -365.3705139160156, -331.1192932128906, -296.86810302734375, -262.61688232421875, -228.3656463623047, -194.11444091796875, -159.86322021484375, -125.61199951171875, -91.36077880859375, -57.10956573486328, -22.858352661132812, 11.392868041992188, 45.64408874511719, 79.89529418945312, 114.14651489257812, 148.39773559570312, 182.64895629882812, 216.90017700195312, 251.15138244628906, 285.402587890625, 319.65380859375, 353.905029296875, 388.15625, 422.407470703125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 18.0, 17.0, 32.0, 38.0, 36.0, 58.0, 63.0, 73.0, 89.0, 90.0, 93.0, 70.0, 63.0, 45.0, 46.0, 32.0, 30.0, 12.0, 19.0, 8.0, 9.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-309.8646240234375, -297.5186767578125, -285.1727294921875, -272.8267822265625, -260.4808349609375, -248.1348876953125, -235.7889404296875, -223.4429931640625, -211.0970458984375, -198.7510986328125, -186.4051513671875, -174.0592041015625, -161.7132568359375, -149.3673095703125, -137.0213623046875, -124.67542266845703, -112.32948303222656, -99.98353576660156, -87.63758850097656, -75.29164123535156, -62.94569778442383, -50.59975051879883, -38.253807067871094, -25.907859802246094, -13.561912536621094, -1.2159662246704102, 11.129980087280273, 23.47592544555664, 35.82187271118164, 48.16781997680664, 60.513763427734375, 72.85971069335938, 85.20565795898438, 97.55160522460938, 109.89755249023438, 122.24349975585938, 134.58944702148438, 146.93539428710938, 159.28134155273438, 171.62728881835938, 183.97323608398438, 196.31918334960938, 208.66513061523438, 221.01107788085938, 233.35702514648438, 245.70297241210938, 258.0489196777344, 270.3948669433594, 282.74078369140625, 295.08673095703125, 307.43267822265625, 319.77862548828125, 332.12457275390625, 344.47052001953125, 356.81646728515625, 369.16241455078125, 381.50836181640625, 393.85430908203125, 406.20025634765625, 418.54620361328125, 430.89215087890625, 443.23809814453125, 455.58404541015625, 467.92999267578125, 480.27593994140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 15.0, 20.0, 24.0, 33.0, 45.0, 99.0, 181.0, 351.0, 856.0, 2114.0, 6524.0, 32829.0, 509082.0, 455510.0, 30907.0, 6336.0, 1979.0, 817.0, 355.0, 194.0, 118.0, 64.0, 30.0, 23.0, 12.0, 11.0, 11.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.953125, -29.761962890625, -28.57080078125, -27.379638671875, -26.1884765625, -24.997314453125, -23.80615234375, -22.614990234375, -21.423828125, -20.232666015625, -19.04150390625, -17.850341796875, -16.6591796875, -15.468017578125, -14.27685546875, -13.085693359375, -11.89453125, -10.703369140625, -9.51220703125, -8.321044921875, -7.1298828125, -5.938720703125, -4.74755859375, -3.556396484375, -2.365234375, -1.174072265625, 0.01708984375, 1.208251953125, 2.3994140625, 3.590576171875, 4.78173828125, 5.972900390625, 7.1640625, 8.355224609375, 9.54638671875, 10.737548828125, 11.9287109375, 13.119873046875, 14.31103515625, 15.502197265625, 16.693359375, 17.884521484375, 19.07568359375, 20.266845703125, 21.4580078125, 22.649169921875, 23.84033203125, 25.031494140625, 26.22265625, 27.413818359375, 28.60498046875, 29.796142578125, 30.9873046875, 32.178466796875, 33.36962890625, 34.560791015625, 35.751953125, 36.943115234375, 38.13427734375, 39.325439453125, 40.5166015625, 41.707763671875, 42.89892578125, 44.090087890625, 45.28125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 7.0, 10.0, 18.0, 22.0, 39.0, 42.0, 55.0, 74.0, 75.0, 78.0, 78.0, 82.0, 75.0, 63.0, 57.0, 50.0, 38.0, 34.0, 28.0, 14.0, 21.0, 3.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -18.958984375, -18.19921875, -17.439453125, -16.6796875, -15.919921875, -15.16015625, -14.400390625, -13.640625, -12.880859375, -12.12109375, -11.361328125, -10.6015625, -9.841796875, -9.08203125, -8.322265625, -7.5625, -6.802734375, -6.04296875, -5.283203125, -4.5234375, -3.763671875, -3.00390625, -2.244140625, -1.484375, -0.724609375, 0.03515625, 0.794921875, 1.5546875, 2.314453125, 3.07421875, 3.833984375, 4.59375, 5.353515625, 6.11328125, 6.873046875, 7.6328125, 8.392578125, 9.15234375, 9.912109375, 10.671875, 11.431640625, 12.19140625, 12.951171875, 13.7109375, 14.470703125, 15.23046875, 15.990234375, 16.75, 17.509765625, 18.26953125, 19.029296875, 19.7890625, 20.548828125, 21.30859375, 22.068359375, 22.828125, 23.587890625, 24.34765625, 25.107421875, 25.8671875, 26.626953125, 27.38671875, 28.146484375, 28.90625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 9.0, 8.0, 11.0, 11.0, 13.0, 13.0, 29.0, 38.0, 44.0, 70.0, 114.0, 173.0, 298.0, 576.0, 1208.0, 3192.0, 12858.0, 113010.0, 868179.0, 37852.0, 6566.0, 2027.0, 909.0, 456.0, 315.0, 154.0, 122.0, 78.0, 54.0, 39.0, 30.0, 17.0, 15.0, 11.0, 11.0, 5.0, 6.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.578125, -28.531982421875, -27.48583984375, -26.439697265625, -25.3935546875, -24.347412109375, -23.30126953125, -22.255126953125, -21.208984375, -20.162841796875, -19.11669921875, -18.070556640625, -17.0244140625, -15.978271484375, -14.93212890625, -13.885986328125, -12.83984375, -11.793701171875, -10.74755859375, -9.701416015625, -8.6552734375, -7.609130859375, -6.56298828125, -5.516845703125, -4.470703125, -3.424560546875, -2.37841796875, -1.332275390625, -0.2861328125, 0.760009765625, 1.80615234375, 2.852294921875, 3.8984375, 4.944580078125, 5.99072265625, 7.036865234375, 8.0830078125, 9.129150390625, 10.17529296875, 11.221435546875, 12.267578125, 13.313720703125, 14.35986328125, 15.406005859375, 16.4521484375, 17.498291015625, 18.54443359375, 19.590576171875, 20.63671875, 21.682861328125, 22.72900390625, 23.775146484375, 24.8212890625, 25.867431640625, 26.91357421875, 27.959716796875, 29.005859375, 30.052001953125, 31.09814453125, 32.144287109375, 33.1904296875, 34.236572265625, 35.28271484375, 36.328857421875, 37.375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 5.0, 8.0, 5.0, 9.0, 8.0, 13.0, 10.0, 14.0, 18.0, 14.0, 11.0, 17.0, 23.0, 32.0, 43.0, 43.0, 63.0, 73.0, 54.0, 75.0, 56.0, 59.0, 53.0, 35.0, 32.0, 22.0, 23.0, 33.0, 17.0, 18.0, 16.0, 11.0, 26.0, 15.0, 4.0, 6.0, 10.0, 8.0, 6.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-61.03125, -59.18505859375, -57.3388671875, -55.49267578125, -53.646484375, -51.80029296875, -49.9541015625, -48.10791015625, -46.26171875, -44.41552734375, -42.5693359375, -40.72314453125, -38.876953125, -37.03076171875, -35.1845703125, -33.33837890625, -31.4921875, -29.64599609375, -27.7998046875, -25.95361328125, -24.107421875, -22.26123046875, -20.4150390625, -18.56884765625, -16.72265625, -14.87646484375, -13.0302734375, -11.18408203125, -9.337890625, -7.49169921875, -5.6455078125, -3.79931640625, -1.953125, -0.10693359375, 1.7392578125, 3.58544921875, 5.431640625, 7.27783203125, 9.1240234375, 10.97021484375, 12.81640625, 14.66259765625, 16.5087890625, 18.35498046875, 20.201171875, 22.04736328125, 23.8935546875, 25.73974609375, 27.5859375, 29.43212890625, 31.2783203125, 33.12451171875, 34.970703125, 36.81689453125, 38.6630859375, 40.50927734375, 42.35546875, 44.20166015625, 46.0478515625, 47.89404296875, 49.740234375, 51.58642578125, 53.4326171875, 55.27880859375, 57.125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 3.0, 15.0, 8.0, 11.0, 19.0, 23.0, 38.0, 65.0, 78.0, 137.0, 267.0, 507.0, 1189.0, 3266.0, 12841.0, 102156.0, 882610.0, 34875.0, 6561.0, 2096.0, 835.0, 401.0, 163.0, 127.0, 73.0, 50.0, 33.0, 21.0, 16.0, 15.0, 11.0, 3.0, 6.0, 8.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.35919189453125, -6.1558837890625, -5.95257568359375, -5.749267578125, -5.54595947265625, -5.3426513671875, -5.13934326171875, -4.93603515625, -4.73272705078125, -4.5294189453125, -4.32611083984375, -4.122802734375, -3.91949462890625, -3.7161865234375, -3.51287841796875, -3.3095703125, -3.10626220703125, -2.9029541015625, -2.69964599609375, -2.496337890625, -2.29302978515625, -2.0897216796875, -1.88641357421875, -1.68310546875, -1.47979736328125, -1.2764892578125, -1.07318115234375, -0.869873046875, -0.66656494140625, -0.4632568359375, -0.25994873046875, -0.056640625, 0.14666748046875, 0.3499755859375, 0.55328369140625, 0.756591796875, 0.95989990234375, 1.1632080078125, 1.36651611328125, 1.56982421875, 1.77313232421875, 1.9764404296875, 2.17974853515625, 2.383056640625, 2.58636474609375, 2.7896728515625, 2.99298095703125, 3.1962890625, 3.39959716796875, 3.6029052734375, 3.80621337890625, 4.009521484375, 4.21282958984375, 4.4161376953125, 4.61944580078125, 4.82275390625, 5.02606201171875, 5.2293701171875, 5.43267822265625, 5.635986328125, 5.83929443359375, 6.0426025390625, 6.24591064453125, 6.44921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 7.0, 6.0, 12.0, 10.0, 12.0, 19.0, 32.0, 39.0, 66.0, 109.0, 158.0, 160.0, 113.0, 69.0, 41.0, 26.0, 17.0, 14.0, 15.0, 12.0, 6.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0017709732055664062, -0.001718863844871521, -0.0016667544841766357, -0.0016146451234817505, -0.0015625357627868652, -0.00151042640209198, -0.0014583170413970947, -0.0014062076807022095, -0.0013540983200073242, -0.001301988959312439, -0.0012498795986175537, -0.0011977702379226685, -0.0011456608772277832, -0.001093551516532898, -0.0010414421558380127, -0.0009893327951431274, -0.0009372234344482422, -0.0008851140737533569, -0.0008330047130584717, -0.0007808953523635864, -0.0007287859916687012, -0.0006766766309738159, -0.0006245672702789307, -0.0005724579095840454, -0.0005203485488891602, -0.0004682391881942749, -0.00041612982749938965, -0.0003640204668045044, -0.00031191110610961914, -0.0002598017454147339, -0.00020769238471984863, -0.00015558302402496338, -0.00010347366333007812, -5.136430263519287e-05, 7.450580596923828e-07, 5.285441875457764e-05, 0.00010496377944946289, 0.00015707314014434814, 0.0002091825008392334, 0.00026129186153411865, 0.0003134012222290039, 0.00036551058292388916, 0.0004176199436187744, 0.00046972930431365967, 0.0005218386650085449, 0.0005739480257034302, 0.0006260573863983154, 0.0006781667470932007, 0.0007302761077880859, 0.0007823854684829712, 0.0008344948291778564, 0.0008866041898727417, 0.000938713550567627, 0.0009908229112625122, 0.0010429322719573975, 0.0010950416326522827, 0.001147150993347168, 0.0011992603540420532, 0.0012513697147369385, 0.0013034790754318237, 0.001355588436126709, 0.0014076977968215942, 0.0014598071575164795, 0.0015119165182113647, 0.00156402587890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 9.0, 17.0, 11.0, 24.0, 48.0, 89.0, 146.0, 288.0, 574.0, 1359.0, 3511.0, 12433.0, 62961.0, 865041.0, 80491.0, 14521.0, 4118.0, 1546.0, 642.0, 323.0, 157.0, 95.0, 56.0, 23.0, 29.0, 16.0, 8.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.7109375, -5.52996826171875, -5.3489990234375, -5.16802978515625, -4.987060546875, -4.80609130859375, -4.6251220703125, -4.44415283203125, -4.26318359375, -4.08221435546875, -3.9012451171875, -3.72027587890625, -3.539306640625, -3.35833740234375, -3.1773681640625, -2.99639892578125, -2.8154296875, -2.63446044921875, -2.4534912109375, -2.27252197265625, -2.091552734375, -1.91058349609375, -1.7296142578125, -1.54864501953125, -1.36767578125, -1.18670654296875, -1.0057373046875, -0.82476806640625, -0.643798828125, -0.46282958984375, -0.2818603515625, -0.10089111328125, 0.080078125, 0.26104736328125, 0.4420166015625, 0.62298583984375, 0.803955078125, 0.98492431640625, 1.1658935546875, 1.34686279296875, 1.52783203125, 1.70880126953125, 1.8897705078125, 2.07073974609375, 2.251708984375, 2.43267822265625, 2.6136474609375, 2.79461669921875, 2.9755859375, 3.15655517578125, 3.3375244140625, 3.51849365234375, 3.699462890625, 3.88043212890625, 4.0614013671875, 4.24237060546875, 4.42333984375, 4.60430908203125, 4.7852783203125, 4.96624755859375, 5.147216796875, 5.32818603515625, 5.5091552734375, 5.69012451171875, 5.87109375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 12.0, 4.0, 7.0, 15.0, 9.0, 18.0, 25.0, 33.0, 42.0, 74.0, 134.0, 172.0, 120.0, 93.0, 58.0, 48.0, 25.0, 28.0, 14.0, 17.0, 14.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.4140625, -9.19329833984375, -8.9725341796875, -8.75177001953125, -8.531005859375, -8.31024169921875, -8.0894775390625, -7.86871337890625, -7.64794921875, -7.42718505859375, -7.2064208984375, -6.98565673828125, -6.764892578125, -6.54412841796875, -6.3233642578125, -6.10260009765625, -5.8818359375, -5.66107177734375, -5.4403076171875, -5.21954345703125, -4.998779296875, -4.77801513671875, -4.5572509765625, -4.33648681640625, -4.11572265625, -3.89495849609375, -3.6741943359375, -3.45343017578125, -3.232666015625, -3.01190185546875, -2.7911376953125, -2.57037353515625, -2.349609375, -2.12884521484375, -1.9080810546875, -1.68731689453125, -1.466552734375, -1.24578857421875, -1.0250244140625, -0.80426025390625, -0.58349609375, -0.36273193359375, -0.1419677734375, 0.07879638671875, 0.299560546875, 0.52032470703125, 0.7410888671875, 0.96185302734375, 1.1826171875, 1.40338134765625, 1.6241455078125, 1.84490966796875, 2.065673828125, 2.28643798828125, 2.5072021484375, 2.72796630859375, 2.94873046875, 3.16949462890625, 3.3902587890625, 3.61102294921875, 3.831787109375, 4.05255126953125, 4.2733154296875, 4.49407958984375, 4.71484375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 12.0, 15.0, 15.0, 55.0, 113.0, 485.0, 165.0, 62.0, 31.0, 20.0, 13.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.80047607421875, -338.10931396484375, -327.4181213378906, -316.7269592285156, -306.0357666015625, -295.3446044921875, -284.6534423828125, -273.9622497558594, -263.2710876464844, -252.5799102783203, -241.88873291015625, -231.19757080078125, -220.5063934326172, -209.81521606445312, -199.12403869628906, -188.432861328125, -177.74168395996094, -167.05050659179688, -156.3593292236328, -145.66815185546875, -134.97698974609375, -124.28581237792969, -113.59463500976562, -102.9034652709961, -92.21228790283203, -81.52111053466797, -70.82994079589844, -60.138763427734375, -49.44758987426758, -38.75641632080078, -28.06523895263672, -17.374069213867188, -6.682891845703125, 4.008282661437988, 14.699457168579102, 25.39063262939453, 36.08180618286133, 46.772979736328125, 57.46415710449219, 68.15532684326172, 78.84650421142578, 89.53768157958984, 100.22885131835938, 110.92002868652344, 121.6112060546875, 132.3023681640625, 142.99356079101562, 153.68472290039062, 164.3759002685547, 175.06707763671875, 185.7582550048828, 196.44943237304688, 207.14059448242188, 217.83177185058594, 228.52294921875, 239.214111328125, 249.90530395507812, 260.5964660644531, 271.28765869140625, 281.97882080078125, 292.6700134277344, 303.3611755371094, 314.0523681640625, 324.7435302734375, 335.4346923828125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 12.0, 9.0, 14.0, 16.0, 9.0, 33.0, 27.0, 28.0, 41.0, 144.0, 181.0, 222.0, 72.0, 32.0, 35.0, 35.0, 14.0, 18.0, 13.0, 15.0, 6.0, 9.0, 6.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-447.53302001953125, -437.53424072265625, -427.53546142578125, -417.53668212890625, -407.53790283203125, -397.5391540527344, -387.5403747558594, -377.5415954589844, -367.5428161621094, -357.5440368652344, -347.5452575683594, -337.5464782714844, -327.5477294921875, -317.5489501953125, -307.5501708984375, -297.5513916015625, -287.5526123046875, -277.5538330078125, -267.5550537109375, -257.5562744140625, -247.55751037597656, -237.55873107910156, -227.55996704101562, -217.56118774414062, -207.56240844726562, -197.56362915039062, -187.56484985351562, -177.5660858154297, -167.5673065185547, -157.5685272216797, -147.56976318359375, -137.57098388671875, -127.57220458984375, -117.57342529296875, -107.57465362548828, -97.57588195800781, -87.57710266113281, -77.57832336425781, -67.57955169677734, -57.580780029296875, -47.582000732421875, -37.58322525024414, -27.584449768066406, -17.585674285888672, -7.5868988037109375, 2.411876678466797, 12.410652160644531, 22.409423828125, 32.408203125, 42.406978607177734, 52.40575408935547, 62.4045295715332, 72.40330505371094, 82.40208435058594, 92.4008560180664, 102.39962768554688, 112.39840698242188, 122.39718627929688, 132.39596557617188, 142.3947296142578, 152.3935089111328, 162.3922882080078, 172.39105224609375, 182.38983154296875, 192.38861083984375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 2.0, 10.0, 12.0, 11.0, 9.0, 17.0, 18.0, 25.0, 24.0, 22.0, 45.0, 51.0, 51.0, 181.0, 155.0, 62.0, 38.0, 30.0, 28.0, 33.0, 21.0, 24.0, 11.0, 22.0, 12.0, 9.0, 10.0, 11.0, 7.0, 7.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.3934326171875, -14.896240234375, -14.3990478515625, -13.90185546875, -13.4046630859375, -12.907470703125, -12.4102783203125, -11.9130859375, -11.4158935546875, -10.918701171875, -10.4215087890625, -9.92431640625, -9.4271240234375, -8.929931640625, -8.4327392578125, -7.935546875, -7.4383544921875, -6.941162109375, -6.4439697265625, -5.94677734375, -5.4495849609375, -4.952392578125, -4.4552001953125, -3.9580078125, -3.4608154296875, -2.963623046875, -2.4664306640625, -1.96923828125, -1.4720458984375, -0.974853515625, -0.4776611328125, 0.01953125, 0.5167236328125, 1.013916015625, 1.5111083984375, 2.00830078125, 2.5054931640625, 3.002685546875, 3.4998779296875, 3.9970703125, 4.4942626953125, 4.991455078125, 5.4886474609375, 5.98583984375, 6.4830322265625, 6.980224609375, 7.4774169921875, 7.974609375, 8.4718017578125, 8.968994140625, 9.4661865234375, 9.96337890625, 10.4605712890625, 10.957763671875, 11.4549560546875, 11.9521484375, 12.4493408203125, 12.946533203125, 13.4437255859375, 13.94091796875, 14.4381103515625, 14.935302734375, 15.4324951171875, 15.9296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 6.0, 2.0, 8.0, 17.0, 16.0, 21.0, 32.0, 41.0, 61.0, 117.0, 227.0, 570.0, 2390.0, 32767.0, 8344527.0, 6082.0, 1013.0, 296.0, 139.0, 72.0, 42.0, 30.0, 31.0, 15.0, 4.0, 15.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-169.83935546875, -164.02932739257812, -158.21929931640625, -152.40927124023438, -146.5992431640625, -140.78921508789062, -134.97918701171875, -129.16915893554688, -123.35912322998047, -117.5490951538086, -111.73906707763672, -105.92903137207031, -100.11900329589844, -94.30897521972656, -88.49894714355469, -82.68891906738281, -76.87889099121094, -71.06886291503906, -65.25883483886719, -59.44880294799805, -53.63877487182617, -47.8287467956543, -42.018714904785156, -36.20868682861328, -30.398658752441406, -24.58863067626953, -18.778600692749023, -12.968570709228516, -7.158542633056641, -1.3485145568847656, 4.461517333984375, 10.27154541015625, 16.081573486328125, 21.8916015625, 27.701631546020508, 33.511661529541016, 39.32168960571289, 45.131717681884766, 50.941749572753906, 56.75177764892578, 62.561805725097656, 68.37183380126953, 74.1818618774414, 79.99189758300781, 85.80192565917969, 91.61195373535156, 97.42198181152344, 103.23200988769531, 109.04203796386719, 114.85206604003906, 120.66209411621094, 126.47212219238281, 132.2821502685547, 138.09217834472656, 143.9022216796875, 149.71224975585938, 155.52227783203125, 161.33230590820312, 167.142333984375, 172.95236206054688, 178.76239013671875, 184.57241821289062, 190.3824462890625, 196.19247436523438, 202.00250244140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 6.0, 6.0, 2.0, 8.0, 2.0, 5.0, 3.0, 6.0, 4.0, 1.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-191.10089111328125, -184.21043395996094, -177.31996154785156, -170.42950439453125, -163.53903198242188, -156.64857482910156, -149.75811767578125, -142.86764526367188, -135.97718811035156, -129.08673095703125, -122.19625854492188, -115.30580139160156, -108.41533660888672, -101.52487182617188, -94.63441467285156, -87.74394989013672, -80.85348510742188, -73.96302032470703, -67.07255554199219, -60.182098388671875, -53.29163360595703, -46.40116882324219, -39.51070785522461, -32.62024688720703, -25.729782104492188, -18.839319229125977, -11.948856353759766, -5.058393478393555, 1.8320693969726562, 8.7225341796875, 15.612995147705078, 22.503456115722656, 29.393905639648438, 36.28437042236328, 43.17483139038086, 50.06529235839844, 56.95575714111328, 63.846221923828125, 70.73667907714844, 77.62714385986328, 84.51760864257812, 91.40807342529297, 98.29853820800781, 105.18899536132812, 112.07946014404297, 118.96992492675781, 125.86038208007812, 132.7508544921875, 139.6413116455078, 146.53176879882812, 153.4222412109375, 160.3126983642578, 167.20315551757812, 174.0936279296875, 180.9840850830078, 187.87454223632812, 194.7650146484375, 201.6554718017578, 208.5459442138672, 215.4364013671875, 222.32687377929688, 229.2173309326172, 236.1077880859375, 242.99826049804688, 249.8887176513672]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 6.0, 5.0, 6.0, 14.0, 14.0, 22.0, 10.0, 33.0, 25.0, 33.0, 31.0, 39.0, 58.0, 55.0, 64.0, 73.0, 62.0, 58.0, 68.0, 51.0, 52.0, 42.0, 38.0, 20.0, 33.0, 16.0, 16.0, 16.0, 9.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8671875, -9.5693359375, -9.271484375, -8.9736328125, -8.67578125, -8.3779296875, -8.080078125, -7.7822265625, -7.484375, -7.1865234375, -6.888671875, -6.5908203125, -6.29296875, -5.9951171875, -5.697265625, -5.3994140625, -5.1015625, -4.8037109375, -4.505859375, -4.2080078125, -3.91015625, -3.6123046875, -3.314453125, -3.0166015625, -2.71875, -2.4208984375, -2.123046875, -1.8251953125, -1.52734375, -1.2294921875, -0.931640625, -0.6337890625, -0.3359375, -0.0380859375, 0.259765625, 0.5576171875, 0.85546875, 1.1533203125, 1.451171875, 1.7490234375, 2.046875, 2.3447265625, 2.642578125, 2.9404296875, 3.23828125, 3.5361328125, 3.833984375, 4.1318359375, 4.4296875, 4.7275390625, 5.025390625, 5.3232421875, 5.62109375, 5.9189453125, 6.216796875, 6.5146484375, 6.8125, 7.1103515625, 7.408203125, 7.7060546875, 8.00390625, 8.3017578125, 8.599609375, 8.8974609375, 9.1953125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 12.0, 9.0, 13.0, 10.0, 20.0, 34.0, 43.0, 62.0, 115.0, 196.0, 318.0, 590.0, 1187.0, 2520.0, 6541.0, 18652.0, 61304.0, 189941.0, 165410.0, 51164.0, 15762.0, 5700.0, 2269.0, 1073.0, 571.0, 275.0, 162.0, 115.0, 63.0, 50.0, 25.0, 23.0, 13.0, 8.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-113.75, -110.4931640625, -107.236328125, -103.9794921875, -100.72265625, -97.4658203125, -94.208984375, -90.9521484375, -87.6953125, -84.4384765625, -81.181640625, -77.9248046875, -74.66796875, -71.4111328125, -68.154296875, -64.8974609375, -61.640625, -58.3837890625, -55.126953125, -51.8701171875, -48.61328125, -45.3564453125, -42.099609375, -38.8427734375, -35.5859375, -32.3291015625, -29.072265625, -25.8154296875, -22.55859375, -19.3017578125, -16.044921875, -12.7880859375, -9.53125, -6.2744140625, -3.017578125, 0.2392578125, 3.49609375, 6.7529296875, 10.009765625, 13.2666015625, 16.5234375, 19.7802734375, 23.037109375, 26.2939453125, 29.55078125, 32.8076171875, 36.064453125, 39.3212890625, 42.578125, 45.8349609375, 49.091796875, 52.3486328125, 55.60546875, 58.8623046875, 62.119140625, 65.3759765625, 68.6328125, 71.8896484375, 75.146484375, 78.4033203125, 81.66015625, 84.9169921875, 88.173828125, 91.4306640625, 94.6875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 7.0, 8.0, 10.0, 15.0, 15.0, 15.0, 26.0, 24.0, 38.0, 43.0, 58.0, 55.0, 76.0, 66.0, 86.0, 73.0, 58.0, 45.0, 62.0, 31.0, 33.0, 22.0, 24.0, 19.0, 16.0, 8.0, 12.0, 10.0, 7.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -13.98583984375, -13.4560546875, -12.92626953125, -12.396484375, -11.86669921875, -11.3369140625, -10.80712890625, -10.27734375, -9.74755859375, -9.2177734375, -8.68798828125, -8.158203125, -7.62841796875, -7.0986328125, -6.56884765625, -6.0390625, -5.50927734375, -4.9794921875, -4.44970703125, -3.919921875, -3.39013671875, -2.8603515625, -2.33056640625, -1.80078125, -1.27099609375, -0.7412109375, -0.21142578125, 0.318359375, 0.84814453125, 1.3779296875, 1.90771484375, 2.4375, 2.96728515625, 3.4970703125, 4.02685546875, 4.556640625, 5.08642578125, 5.6162109375, 6.14599609375, 6.67578125, 7.20556640625, 7.7353515625, 8.26513671875, 8.794921875, 9.32470703125, 9.8544921875, 10.38427734375, 10.9140625, 11.44384765625, 11.9736328125, 12.50341796875, 13.033203125, 13.56298828125, 14.0927734375, 14.62255859375, 15.15234375, 15.68212890625, 16.2119140625, 16.74169921875, 17.271484375, 17.80126953125, 18.3310546875, 18.86083984375, 19.390625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 5.0, 13.0, 12.0, 15.0, 20.0, 40.0, 40.0, 64.0, 69.0, 54.0, 37.0, 24.0, 19.0, 11.0, 9.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-83.76661682128906, -81.0662612915039, -78.36590576171875, -75.6655502319336, -72.96519470214844, -70.26483917236328, -67.56448364257812, -64.8641357421875, -62.16377639770508, -59.46342086791992, -56.763065338134766, -54.062713623046875, -51.36235809326172, -48.66200256347656, -45.961647033691406, -43.26129150390625, -40.560935974121094, -37.86058044433594, -35.16022491455078, -32.459869384765625, -29.7595157623291, -27.059160232543945, -24.358806610107422, -21.658451080322266, -18.95809555053711, -16.257740020751953, -13.557385444641113, -10.857030868530273, -8.156675338745117, -5.456319808959961, -2.7559661865234375, -0.05561065673828125, 2.6447525024414062, 5.345107555389404, 8.045462608337402, 10.745817184448242, 13.446172714233398, 16.146528244018555, 18.846881866455078, 21.547237396240234, 24.24759292602539, 26.947948455810547, 29.648303985595703, 32.348655700683594, 35.04901123046875, 37.749366760253906, 40.44972229003906, 43.15007781982422, 45.850433349609375, 48.55078887939453, 51.25114440917969, 53.951499938964844, 56.65185546875, 59.352210998535156, 62.05256271362305, 64.75291442871094, 67.45327758789062, 70.15363311767578, 72.85398864746094, 75.5543441772461, 78.25469970703125, 80.9550552368164, 83.65541076660156, 86.35575866699219, 89.05611419677734]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 9.0, 6.0, 15.0, 20.0, 35.0, 42.0, 63.0, 63.0, 49.0, 43.0, 29.0, 13.0, 15.0, 12.0, 9.0, 7.0, 3.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-81.45079803466797, -78.36444091796875, -75.27808380126953, -72.19172668457031, -69.1053695678711, -66.01901245117188, -62.932655334472656, -59.84629821777344, -56.75994110107422, -53.673583984375, -50.58722686767578, -47.50086975097656, -44.414512634277344, -41.328155517578125, -38.241798400878906, -35.15544128417969, -32.06908416748047, -28.98272705078125, -25.89636993408203, -22.810012817382812, -19.723655700683594, -16.637298583984375, -13.550941467285156, -10.464584350585938, -7.378227233886719, -4.2918701171875, -1.2055130004882812, 1.8808441162109375, 4.967201232910156, 8.053558349609375, 11.139915466308594, 14.226272583007812, 17.31262969970703, 20.39898681640625, 23.48534393310547, 26.571701049804688, 29.658058166503906, 32.744415283203125, 35.830772399902344, 38.91712951660156, 42.00348663330078, 45.08984375, 48.17620086669922, 51.26255798339844, 54.348915100097656, 57.435272216796875, 60.521629333496094, 63.60798645019531, 66.69434356689453, 69.78070068359375, 72.86705780029297, 75.95341491699219, 79.0397720336914, 82.12612915039062, 85.21248626708984, 88.29884338378906, 91.38520050048828, 94.4715576171875, 97.55791473388672, 100.64427185058594, 103.73062896728516, 106.81698608398438, 109.9033432006836, 112.98970031738281, 116.07605743408203]}, "eval/loss": 5.471095085144043, "eval/wer": 1.5604323681078938, "eval/runtime": 668.0797, "eval/samples_per_second": 3.955, "eval/steps_per_second": 0.495} \ No newline at end of file