diff --git "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 6.1467, "train/learning_rate": 2.9295774647887323e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 8792, "_timestamp": 1648150136, "_step": 1500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 12.0, 5.0, 14.0, 11.0, 15.0, 19.0, 21.0, 35.0, 31.0, 30.0, 31.0, 34.0, 44.0, 50.0, 46.0, 50.0, 59.0, 52.0, 44.0, 49.0, 53.0, 34.0, 43.0, 26.0, 34.0, 30.0, 22.0, 28.0, 12.0, 11.0, 18.0, 10.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-76.76399993896484, -74.40105438232422, -72.0381088256836, -69.6751708984375, -67.31222534179688, -64.94927978515625, -62.586334228515625, -60.223392486572266, -57.860450744628906, -55.49750518798828, -53.13456344604492, -50.7716178894043, -48.40867614746094, -46.04573059082031, -43.68278503417969, -41.31984329223633, -38.9568977355957, -36.59395217895508, -34.23101043701172, -31.868064880371094, -29.505123138427734, -27.14217758178711, -24.779233932495117, -22.416290283203125, -20.053346633911133, -17.69040298461914, -15.327459335327148, -12.96451473236084, -10.601571083068848, -8.238627433776855, -5.875682830810547, -3.5127391815185547, -1.1497955322265625, 1.2131483554840088, 3.57609224319458, 5.9390363693237305, 8.301980018615723, 10.664923667907715, 13.027868270874023, 15.390811920166016, 17.753755569458008, 20.11669921875, 22.479642868041992, 24.842586517333984, 27.20553207397461, 29.56847381591797, 31.931419372558594, 34.29436492919922, 36.65730667114258, 39.0202522277832, 41.38319396972656, 43.74613952636719, 46.10908126831055, 48.47202682495117, 50.83496856689453, 53.197914123535156, 55.56085968017578, 57.923805236816406, 60.286746978759766, 62.64969253540039, 65.01263427734375, 67.37557983398438, 69.738525390625, 72.10147094726562, 74.46440887451172]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 10.0, 7.0, 11.0, 15.0, 12.0, 12.0, 13.0, 21.0, 23.0, 43.0, 36.0, 23.0, 29.0, 41.0, 44.0, 32.0, 35.0, 35.0, 43.0, 44.0, 40.0, 45.0, 33.0, 41.0, 45.0, 39.0, 39.0, 37.0, 32.0, 16.0, 20.0, 18.0, 11.0, 10.0, 11.0, 7.0, 4.0, 6.0, 5.0, 7.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.36962890625, -73.99669647216797, -71.62376403808594, -69.25082397460938, -66.87789154052734, -64.50495910644531, -62.132022857666016, -59.75908660888672, -57.38615417480469, -55.013221740722656, -52.64028549194336, -50.26734924316406, -47.89441680908203, -45.521484375, -43.1485481262207, -40.775611877441406, -38.402679443359375, -36.029747009277344, -33.65681076049805, -31.283876419067383, -28.91094207763672, -26.538007736206055, -24.16507339477539, -21.792139053344727, -19.419204711914062, -17.0462703704834, -14.673336029052734, -12.30040168762207, -9.927467346191406, -7.554533004760742, -5.181598663330078, -2.808664321899414, -0.43572235107421875, 1.9372119903564453, 4.310146331787109, 6.683080673217773, 9.056015014648438, 11.428949356079102, 13.801883697509766, 16.17481803894043, 18.547752380371094, 20.920686721801758, 23.293621063232422, 25.666555404663086, 28.03948974609375, 30.412424087524414, 32.78535842895508, 35.158294677734375, 37.531227111816406, 39.90415954589844, 42.277095794677734, 44.65003204345703, 47.02296447753906, 49.395896911621094, 51.76883316040039, 54.14176940917969, 56.51470184326172, 58.88763427734375, 61.26057052612305, 63.633506774902344, 66.00643920898438, 68.3793716430664, 70.75230407714844, 73.125244140625, 75.49817657470703]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 6.0, 9.0, 14.0, 27.0, 35.0, 46.0, 82.0, 127.0, 171.0, 257.0, 425.0, 728.0, 1040.0, 1733.0, 2959.0, 5107.0, 8602.0, 15147.0, 26827.0, 49759.0, 98897.0, 213474.0, 466717.0, 845852.0, 1003888.0, 738701.0, 371978.0, 166536.0, 80016.0, 41160.0, 22709.0, 12576.0, 7309.0, 4294.0, 2614.0, 1636.0, 994.0, 615.0, 448.0, 262.0, 190.0, 104.0, 79.0, 51.0, 33.0, 20.0, 10.0, 6.0, 2.0, 9.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-58.78125, -56.96435546875, -55.1474609375, -53.33056640625, -51.513671875, -49.69677734375, -47.8798828125, -46.06298828125, -44.24609375, -42.42919921875, -40.6123046875, -38.79541015625, -36.978515625, -35.16162109375, -33.3447265625, -31.52783203125, -29.7109375, -27.89404296875, -26.0771484375, -24.26025390625, -22.443359375, -20.62646484375, -18.8095703125, -16.99267578125, -15.17578125, -13.35888671875, -11.5419921875, -9.72509765625, -7.908203125, -6.09130859375, -4.2744140625, -2.45751953125, -0.640625, 1.17626953125, 2.9931640625, 4.81005859375, 6.626953125, 8.44384765625, 10.2607421875, 12.07763671875, 13.89453125, 15.71142578125, 17.5283203125, 19.34521484375, 21.162109375, 22.97900390625, 24.7958984375, 26.61279296875, 28.4296875, 30.24658203125, 32.0634765625, 33.88037109375, 35.697265625, 37.51416015625, 39.3310546875, 41.14794921875, 42.96484375, 44.78173828125, 46.5986328125, 48.41552734375, 50.232421875, 52.04931640625, 53.8662109375, 55.68310546875, 57.5]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 4.0, 8.0, 9.0, 11.0, 21.0, 15.0, 16.0, 30.0, 26.0, 27.0, 40.0, 31.0, 36.0, 34.0, 25.0, 45.0, 38.0, 34.0, 47.0, 34.0, 34.0, 38.0, 36.0, 41.0, 42.0, 44.0, 29.0, 30.0, 21.0, 30.0, 13.0, 20.0, 17.0, 12.0, 12.0, 9.0, 8.0, 3.0, 6.0, 3.0, 1.0, 6.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-51.1875, -49.6796875, -48.171875, -46.6640625, -45.15625, -43.6484375, -42.140625, -40.6328125, -39.125, -37.6171875, -36.109375, -34.6015625, -33.09375, -31.5859375, -30.078125, -28.5703125, -27.0625, -25.5546875, -24.046875, -22.5390625, -21.03125, -19.5234375, -18.015625, -16.5078125, -15.0, -13.4921875, -11.984375, -10.4765625, -8.96875, -7.4609375, -5.953125, -4.4453125, -2.9375, -1.4296875, 0.078125, 1.5859375, 3.09375, 4.6015625, 6.109375, 7.6171875, 9.125, 10.6328125, 12.140625, 13.6484375, 15.15625, 16.6640625, 18.171875, 19.6796875, 21.1875, 22.6953125, 24.203125, 25.7109375, 27.21875, 28.7265625, 30.234375, 31.7421875, 33.25, 34.7578125, 36.265625, 37.7734375, 39.28125, 40.7890625, 42.296875, 43.8046875, 45.3125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 5.0, 2.0, 18.0, 19.0, 28.0, 39.0, 76.0, 126.0, 218.0, 302.0, 441.0, 721.0, 1171.0, 1840.0, 2899.0, 4451.0, 6985.0, 10857.0, 16873.0, 25684.0, 40440.0, 62593.0, 96444.0, 149259.0, 230161.0, 350462.0, 523388.0, 694209.0, 648769.0, 458932.0, 303585.0, 198958.0, 129110.0, 84110.0, 53490.0, 35039.0, 22238.0, 14390.0, 9427.0, 5936.0, 3773.0, 2490.0, 1639.0, 998.0, 636.0, 375.0, 253.0, 169.0, 112.0, 58.0, 34.0, 26.0, 14.0, 9.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.0654296875, -37.755859375, -36.4462890625, -35.13671875, -33.8271484375, -32.517578125, -31.2080078125, -29.8984375, -28.5888671875, -27.279296875, -25.9697265625, -24.66015625, -23.3505859375, -22.041015625, -20.7314453125, -19.421875, -18.1123046875, -16.802734375, -15.4931640625, -14.18359375, -12.8740234375, -11.564453125, -10.2548828125, -8.9453125, -7.6357421875, -6.326171875, -5.0166015625, -3.70703125, -2.3974609375, -1.087890625, 0.2216796875, 1.53125, 2.8408203125, 4.150390625, 5.4599609375, 6.76953125, 8.0791015625, 9.388671875, 10.6982421875, 12.0078125, 13.3173828125, 14.626953125, 15.9365234375, 17.24609375, 18.5556640625, 19.865234375, 21.1748046875, 22.484375, 23.7939453125, 25.103515625, 26.4130859375, 27.72265625, 29.0322265625, 30.341796875, 31.6513671875, 32.9609375, 34.2705078125, 35.580078125, 36.8896484375, 38.19921875, 39.5087890625, 40.818359375, 42.1279296875, 43.4375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 6.0, 7.0, 11.0, 16.0, 11.0, 13.0, 20.0, 32.0, 32.0, 45.0, 49.0, 64.0, 79.0, 108.0, 105.0, 135.0, 154.0, 189.0, 252.0, 291.0, 334.0, 311.0, 337.0, 302.0, 217.0, 181.0, 171.0, 129.0, 111.0, 81.0, 49.0, 60.0, 43.0, 33.0, 25.0, 18.0, 19.0, 4.0, 8.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -20.9765625, -20.265625, -19.5546875, -18.84375, -18.1328125, -17.421875, -16.7109375, -16.0, -15.2890625, -14.578125, -13.8671875, -13.15625, -12.4453125, -11.734375, -11.0234375, -10.3125, -9.6015625, -8.890625, -8.1796875, -7.46875, -6.7578125, -6.046875, -5.3359375, -4.625, -3.9140625, -3.203125, -2.4921875, -1.78125, -1.0703125, -0.359375, 0.3515625, 1.0625, 1.7734375, 2.484375, 3.1953125, 3.90625, 4.6171875, 5.328125, 6.0390625, 6.75, 7.4609375, 8.171875, 8.8828125, 9.59375, 10.3046875, 11.015625, 11.7265625, 12.4375, 13.1484375, 13.859375, 14.5703125, 15.28125, 15.9921875, 16.703125, 17.4140625, 18.125, 18.8359375, 19.546875, 20.2578125, 20.96875, 21.6796875, 22.390625, 23.1015625, 23.8125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [6.0, 2.0, 1.0, 3.0, 8.0, 1.0, 2.0, 8.0, 9.0, 6.0, 12.0, 5.0, 11.0, 14.0, 15.0, 23.0, 27.0, 19.0, 33.0, 32.0, 38.0, 28.0, 48.0, 34.0, 50.0, 42.0, 41.0, 45.0, 23.0, 44.0, 47.0, 34.0, 37.0, 41.0, 35.0, 31.0, 22.0, 26.0, 17.0, 16.0, 9.0, 16.0, 8.0, 7.0, 12.0, 5.0, 4.0, 4.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.57273864746094, -36.1736946105957, -34.77465057373047, -33.37560272216797, -31.976558685302734, -30.5775146484375, -29.178468704223633, -27.779422760009766, -26.38037872314453, -24.981334686279297, -23.58228874206543, -22.183242797851562, -20.784198760986328, -19.385154724121094, -17.986108779907227, -16.58706283569336, -15.188018798828125, -13.788973808288574, -12.389928817749023, -10.990883827209473, -9.591838836669922, -8.192793846130371, -6.79374885559082, -5.3947038650512695, -3.9956588745117188, -2.596613883972168, -1.1975688934326172, 0.2014760971069336, 1.6005210876464844, 2.999566078186035, 4.398611068725586, 5.797656059265137, 7.1967010498046875, 8.595746040344238, 9.994791030883789, 11.39383602142334, 12.79288101196289, 14.191926002502441, 15.590970993041992, 16.99001693725586, 18.389060974121094, 19.788105010986328, 21.187150955200195, 22.586196899414062, 23.985240936279297, 25.38428497314453, 26.7833309173584, 28.182376861572266, 29.5814208984375, 30.980464935302734, 32.37950897216797, 33.77855682373047, 35.1776008605957, 36.57664489746094, 37.97569274902344, 39.37473678588867, 40.773780822753906, 42.17282485961914, 43.571868896484375, 44.970916748046875, 46.36996078491211, 47.769004821777344, 49.168052673339844, 50.56709671020508, 51.96614074707031]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 14.0, 12.0, 22.0, 15.0, 13.0, 22.0, 25.0, 25.0, 36.0, 39.0, 31.0, 43.0, 30.0, 44.0, 36.0, 48.0, 45.0, 41.0, 40.0, 46.0, 45.0, 34.0, 36.0, 27.0, 34.0, 21.0, 38.0, 31.0, 18.0, 15.0, 12.0, 15.0, 13.0, 5.0, 10.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.23810958862305, -50.60106658935547, -48.964027404785156, -47.326988220214844, -45.689945220947266, -44.05290222167969, -42.415863037109375, -40.77882385253906, -39.141780853271484, -37.504737854003906, -35.867698669433594, -34.23065948486328, -32.5936164855957, -30.956575393676758, -29.319534301757812, -27.682493209838867, -26.045452117919922, -24.408411026000977, -22.77136993408203, -21.134328842163086, -19.49728775024414, -17.860246658325195, -16.22320556640625, -14.586164474487305, -12.94912338256836, -11.312082290649414, -9.675041198730469, -8.038000106811523, -6.400959014892578, -4.763917922973633, -3.1268768310546875, -1.4898357391357422, 0.14720916748046875, 1.784250259399414, 3.4212913513183594, 5.058332443237305, 6.69537353515625, 8.332414627075195, 9.96945571899414, 11.606496810913086, 13.243537902832031, 14.880578994750977, 16.517620086669922, 18.154661178588867, 19.791702270507812, 21.428743362426758, 23.065784454345703, 24.70282554626465, 26.339866638183594, 27.97690773010254, 29.613948822021484, 31.25098991394043, 32.888031005859375, 34.52507019042969, 36.162113189697266, 37.799156188964844, 39.436195373535156, 41.07323455810547, 42.71027755737305, 44.347320556640625, 45.98435974121094, 47.62139892578125, 49.25844192504883, 50.895484924316406, 52.53252410888672]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 8.0, 10.0, 14.0, 24.0, 22.0, 52.0, 61.0, 72.0, 134.0, 163.0, 217.0, 310.0, 465.0, 673.0, 921.0, 1326.0, 1938.0, 2735.0, 4152.0, 6321.0, 9412.0, 14956.0, 23222.0, 37404.0, 61517.0, 104184.0, 171522.0, 217572.0, 151798.0, 90522.0, 54027.0, 32978.0, 20683.0, 13218.0, 8351.0, 5557.0, 3764.0, 2514.0, 1701.0, 1203.0, 829.0, 591.0, 420.0, 284.0, 205.0, 152.0, 107.0, 62.0, 57.0, 52.0, 22.0, 20.0, 16.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.2421875, -13.773193359375, -13.30419921875, -12.835205078125, -12.3662109375, -11.897216796875, -11.42822265625, -10.959228515625, -10.490234375, -10.021240234375, -9.55224609375, -9.083251953125, -8.6142578125, -8.145263671875, -7.67626953125, -7.207275390625, -6.73828125, -6.269287109375, -5.80029296875, -5.331298828125, -4.8623046875, -4.393310546875, -3.92431640625, -3.455322265625, -2.986328125, -2.517333984375, -2.04833984375, -1.579345703125, -1.1103515625, -0.641357421875, -0.17236328125, 0.296630859375, 0.765625, 1.234619140625, 1.70361328125, 2.172607421875, 2.6416015625, 3.110595703125, 3.57958984375, 4.048583984375, 4.517578125, 4.986572265625, 5.45556640625, 5.924560546875, 6.3935546875, 6.862548828125, 7.33154296875, 7.800537109375, 8.26953125, 8.738525390625, 9.20751953125, 9.676513671875, 10.1455078125, 10.614501953125, 11.08349609375, 11.552490234375, 12.021484375, 12.490478515625, 12.95947265625, 13.428466796875, 13.8974609375, 14.366455078125, 14.83544921875, 15.304443359375, 15.7734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 4.0, 10.0, 11.0, 15.0, 10.0, 17.0, 20.0, 18.0, 31.0, 34.0, 29.0, 32.0, 46.0, 33.0, 39.0, 31.0, 53.0, 36.0, 38.0, 42.0, 52.0, 53.0, 38.0, 38.0, 35.0, 37.0, 24.0, 34.0, 22.0, 27.0, 23.0, 15.0, 12.0, 18.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.75, -49.13232421875, -47.5146484375, -45.89697265625, -44.279296875, -42.66162109375, -41.0439453125, -39.42626953125, -37.80859375, -36.19091796875, -34.5732421875, -32.95556640625, -31.337890625, -29.72021484375, -28.1025390625, -26.48486328125, -24.8671875, -23.24951171875, -21.6318359375, -20.01416015625, -18.396484375, -16.77880859375, -15.1611328125, -13.54345703125, -11.92578125, -10.30810546875, -8.6904296875, -7.07275390625, -5.455078125, -3.83740234375, -2.2197265625, -0.60205078125, 1.015625, 2.63330078125, 4.2509765625, 5.86865234375, 7.486328125, 9.10400390625, 10.7216796875, 12.33935546875, 13.95703125, 15.57470703125, 17.1923828125, 18.81005859375, 20.427734375, 22.04541015625, 23.6630859375, 25.28076171875, 26.8984375, 28.51611328125, 30.1337890625, 31.75146484375, 33.369140625, 34.98681640625, 36.6044921875, 38.22216796875, 39.83984375, 41.45751953125, 43.0751953125, 44.69287109375, 46.310546875, 47.92822265625, 49.5458984375, 51.16357421875, 52.78125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 7.0, 11.0, 20.0, 17.0, 30.0, 33.0, 50.0, 61.0, 90.0, 131.0, 154.0, 228.0, 305.0, 413.0, 561.0, 712.0, 1045.0, 1466.0, 2129.0, 3173.0, 4653.0, 7034.0, 10973.0, 17562.0, 29559.0, 51494.0, 95468.0, 174625.0, 249152.0, 173201.0, 93555.0, 51044.0, 29480.0, 17488.0, 10599.0, 6943.0, 4602.0, 3084.0, 2083.0, 1518.0, 1029.0, 726.0, 533.0, 397.0, 290.0, 226.0, 168.0, 110.0, 110.0, 74.0, 46.0, 26.0, 28.0, 24.0, 12.0, 5.0, 6.0, 1.0, 4.0, 1.0], "bins": [-9.34375, -9.05615234375, -8.7685546875, -8.48095703125, -8.193359375, -7.90576171875, -7.6181640625, -7.33056640625, -7.04296875, -6.75537109375, -6.4677734375, -6.18017578125, -5.892578125, -5.60498046875, -5.3173828125, -5.02978515625, -4.7421875, -4.45458984375, -4.1669921875, -3.87939453125, -3.591796875, -3.30419921875, -3.0166015625, -2.72900390625, -2.44140625, -2.15380859375, -1.8662109375, -1.57861328125, -1.291015625, -1.00341796875, -0.7158203125, -0.42822265625, -0.140625, 0.14697265625, 0.4345703125, 0.72216796875, 1.009765625, 1.29736328125, 1.5849609375, 1.87255859375, 2.16015625, 2.44775390625, 2.7353515625, 3.02294921875, 3.310546875, 3.59814453125, 3.8857421875, 4.17333984375, 4.4609375, 4.74853515625, 5.0361328125, 5.32373046875, 5.611328125, 5.89892578125, 6.1865234375, 6.47412109375, 6.76171875, 7.04931640625, 7.3369140625, 7.62451171875, 7.912109375, 8.19970703125, 8.4873046875, 8.77490234375, 9.0625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 2.0, 7.0, 10.0, 12.0, 14.0, 13.0, 28.0, 28.0, 23.0, 24.0, 31.0, 30.0, 29.0, 31.0, 37.0, 33.0, 29.0, 39.0, 30.0, 44.0, 50.0, 39.0, 52.0, 38.0, 32.0, 26.0, 34.0, 35.0, 28.0, 24.0, 28.0, 22.0, 11.0, 13.0, 12.0, 12.0, 5.0, 10.0, 3.0, 0.0, 7.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-32.78125, -31.740234375, -30.69921875, -29.658203125, -28.6171875, -27.576171875, -26.53515625, -25.494140625, -24.453125, -23.412109375, -22.37109375, -21.330078125, -20.2890625, -19.248046875, -18.20703125, -17.166015625, -16.125, -15.083984375, -14.04296875, -13.001953125, -11.9609375, -10.919921875, -9.87890625, -8.837890625, -7.796875, -6.755859375, -5.71484375, -4.673828125, -3.6328125, -2.591796875, -1.55078125, -0.509765625, 0.53125, 1.572265625, 2.61328125, 3.654296875, 4.6953125, 5.736328125, 6.77734375, 7.818359375, 8.859375, 9.900390625, 10.94140625, 11.982421875, 13.0234375, 14.064453125, 15.10546875, 16.146484375, 17.1875, 18.228515625, 19.26953125, 20.310546875, 21.3515625, 22.392578125, 23.43359375, 24.474609375, 25.515625, 26.556640625, 27.59765625, 28.638671875, 29.6796875, 30.720703125, 31.76171875, 32.802734375, 33.84375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 16.0, 14.0, 12.0, 26.0, 43.0, 59.0, 70.0, 91.0, 125.0, 163.0, 239.0, 291.0, 388.0, 474.0, 609.0, 735.0, 1003.0, 1468.0, 2039.0, 3189.0, 5626.0, 12499.0, 34069.0, 119452.0, 485091.0, 270299.0, 67033.0, 21133.0, 8524.0, 4172.0, 2546.0, 1763.0, 1282.0, 962.0, 740.0, 561.0, 418.0, 296.0, 243.0, 162.0, 150.0, 122.0, 91.0, 86.0, 56.0, 46.0, 24.0, 13.0, 16.0, 9.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.314453125, -2.2392578125, -2.1640625, -2.0888671875, -2.013671875, -1.9384765625, -1.86328125, -1.7880859375, -1.712890625, -1.6376953125, -1.5625, -1.4873046875, -1.412109375, -1.3369140625, -1.26171875, -1.1865234375, -1.111328125, -1.0361328125, -0.9609375, -0.8857421875, -0.810546875, -0.7353515625, -0.66015625, -0.5849609375, -0.509765625, -0.4345703125, -0.359375, -0.2841796875, -0.208984375, -0.1337890625, -0.05859375, 0.0166015625, 0.091796875, 0.1669921875, 0.2421875, 0.3173828125, 0.392578125, 0.4677734375, 0.54296875, 0.6181640625, 0.693359375, 0.7685546875, 0.84375, 0.9189453125, 0.994140625, 1.0693359375, 1.14453125, 1.2197265625, 1.294921875, 1.3701171875, 1.4453125, 1.5205078125, 1.595703125, 1.6708984375, 1.74609375, 1.8212890625, 1.896484375, 1.9716796875, 2.046875, 2.1220703125, 2.197265625, 2.2724609375, 2.34765625, 2.4228515625, 2.498046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 7.0, 12.0, 14.0, 7.0, 25.0, 18.0, 39.0, 52.0, 72.0, 91.0, 109.0, 98.0, 91.0, 66.0, 67.0, 45.0, 31.0, 20.0, 21.0, 7.0, 13.0, 10.0, 13.0, 7.0, 4.0, 9.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003771781921386719, -0.0003664456307888031, -0.0003557130694389343, -0.00034498050808906555, -0.0003342479467391968, -0.000323515385389328, -0.00031278282403945923, -0.00030205026268959045, -0.0002913177013397217, -0.0002805851399898529, -0.00026985257863998413, -0.00025912001729011536, -0.0002483874559402466, -0.0002376548945903778, -0.00022692233324050903, -0.00021618977189064026, -0.00020545721054077148, -0.0001947246491909027, -0.00018399208784103394, -0.00017325952649116516, -0.0001625269651412964, -0.0001517944037914276, -0.00014106184244155884, -0.00013032928109169006, -0.00011959671974182129, -0.00010886415839195251, -9.813159704208374e-05, -8.739903569221497e-05, -7.666647434234619e-05, -6.593391299247742e-05, -5.520135164260864e-05, -4.446879029273987e-05, -3.3736228942871094e-05, -2.300366759300232e-05, -1.2271106243133545e-05, -1.5385448932647705e-06, 9.194016456604004e-06, 1.992657780647278e-05, 3.065913915634155e-05, 4.139170050621033e-05, 5.21242618560791e-05, 6.285682320594788e-05, 7.358938455581665e-05, 8.432194590568542e-05, 9.50545072555542e-05, 0.00010578706860542297, 0.00011651962995529175, 0.00012725219130516052, 0.0001379847526550293, 0.00014871731400489807, 0.00015944987535476685, 0.00017018243670463562, 0.0001809149980545044, 0.00019164755940437317, 0.00020238012075424194, 0.00021311268210411072, 0.0002238452434539795, 0.00023457780480384827, 0.00024531036615371704, 0.0002560429275035858, 0.0002667754888534546, 0.00027750805020332336, 0.00028824061155319214, 0.0002989731729030609, 0.0003097057342529297]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 4.0, 7.0, 18.0, 11.0, 21.0, 34.0, 49.0, 71.0, 73.0, 114.0, 155.0, 210.0, 312.0, 391.0, 613.0, 892.0, 1284.0, 1834.0, 2899.0, 4784.0, 7962.0, 14832.0, 27926.0, 52817.0, 101789.0, 205569.0, 302036.0, 152431.0, 77731.0, 40768.0, 21520.0, 11644.0, 6433.0, 3860.0, 2346.0, 1511.0, 986.0, 764.0, 497.0, 344.0, 283.0, 204.0, 144.0, 87.0, 99.0, 52.0, 44.0, 25.0, 26.0, 18.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8330078125, -1.7779541015625, -1.722900390625, -1.6678466796875, -1.61279296875, -1.5577392578125, -1.502685546875, -1.4476318359375, -1.392578125, -1.3375244140625, -1.282470703125, -1.2274169921875, -1.17236328125, -1.1173095703125, -1.062255859375, -1.0072021484375, -0.9521484375, -0.8970947265625, -0.842041015625, -0.7869873046875, -0.73193359375, -0.6768798828125, -0.621826171875, -0.5667724609375, -0.51171875, -0.4566650390625, -0.401611328125, -0.3465576171875, -0.29150390625, -0.2364501953125, -0.181396484375, -0.1263427734375, -0.0712890625, -0.0162353515625, 0.038818359375, 0.0938720703125, 0.14892578125, 0.2039794921875, 0.259033203125, 0.3140869140625, 0.369140625, 0.4241943359375, 0.479248046875, 0.5343017578125, 0.58935546875, 0.6444091796875, 0.699462890625, 0.7545166015625, 0.8095703125, 0.8646240234375, 0.919677734375, 0.9747314453125, 1.02978515625, 1.0848388671875, 1.139892578125, 1.1949462890625, 1.25, 1.3050537109375, 1.360107421875, 1.4151611328125, 1.47021484375, 1.5252685546875, 1.580322265625, 1.6353759765625, 1.6904296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 5.0, 17.0, 12.0, 25.0, 40.0, 39.0, 64.0, 84.0, 105.0, 127.0, 125.0, 100.0, 68.0, 50.0, 31.0, 23.0, 22.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7948226928710938, -0.7698211669921875, -0.7448196411132812, -0.719818115234375, -0.6948165893554688, -0.6698150634765625, -0.6448135375976562, -0.61981201171875, -0.5948104858398438, -0.5698089599609375, -0.5448074340820312, -0.519805908203125, -0.49480438232421875, -0.4698028564453125, -0.44480133056640625, -0.4197998046875, -0.39479827880859375, -0.3697967529296875, -0.34479522705078125, -0.319793701171875, -0.29479217529296875, -0.2697906494140625, -0.24478912353515625, -0.21978759765625, -0.19478607177734375, -0.1697845458984375, -0.14478302001953125, -0.119781494140625, -0.09477996826171875, -0.0697784423828125, -0.04477691650390625, -0.019775390625, 0.00522613525390625, 0.0302276611328125, 0.05522918701171875, 0.080230712890625, 0.10523223876953125, 0.1302337646484375, 0.15523529052734375, 0.18023681640625, 0.20523834228515625, 0.2302398681640625, 0.25524139404296875, 0.280242919921875, 0.30524444580078125, 0.3302459716796875, 0.35524749755859375, 0.3802490234375, 0.40525054931640625, 0.4302520751953125, 0.45525360107421875, 0.480255126953125, 0.5052566528320312, 0.5302581787109375, 0.5552597045898438, 0.58026123046875, 0.6052627563476562, 0.6302642822265625, 0.6552658081054688, 0.680267333984375, 0.7052688598632812, 0.7302703857421875, 0.7552719116210938, 0.7802734375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 4.0, 8.0, 3.0, 5.0, 8.0, 6.0, 10.0, 9.0, 11.0, 19.0, 18.0, 17.0, 21.0, 22.0, 28.0, 37.0, 40.0, 42.0, 37.0, 43.0, 43.0, 39.0, 40.0, 41.0, 32.0, 38.0, 58.0, 33.0, 32.0, 34.0, 37.0, 34.0, 22.0, 26.0, 18.0, 9.0, 17.0, 10.0, 9.0, 8.0, 8.0, 7.0, 3.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75106430053711, -34.4222297668457, -33.0933952331543, -31.76456069946289, -30.435726165771484, -29.106891632080078, -27.77805519104004, -26.449220657348633, -25.120386123657227, -23.79155158996582, -22.462717056274414, -21.133882522583008, -19.80504608154297, -18.476211547851562, -17.147377014160156, -15.81854248046875, -14.489707946777344, -13.160873413085938, -11.832038879394531, -10.503203392028809, -9.174368858337402, -7.845534324645996, -6.516699314117432, -5.187864303588867, -3.859029769897461, -2.5301949977874756, -1.2013602256774902, 0.12747454643249512, 1.4563093185424805, 2.7851438522338867, 4.113978862762451, 5.442813873291016, 6.771648406982422, 8.100482940673828, 9.429317474365234, 10.758152961730957, 12.086987495422363, 13.41582202911377, 14.744657516479492, 16.0734920501709, 17.402326583862305, 18.73116111755371, 20.059995651245117, 21.388830184936523, 22.717666625976562, 24.04650115966797, 25.375335693359375, 26.70417022705078, 28.033004760742188, 29.361839294433594, 30.690673828125, 32.019508361816406, 33.34834289550781, 34.67717742919922, 36.006011962890625, 37.33484649658203, 38.66368103027344, 39.992515563964844, 41.32135009765625, 42.650184631347656, 43.97901916503906, 45.30785369873047, 46.636688232421875, 47.96552276611328, 49.29436111450195]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 13.0, 18.0, 17.0, 13.0, 22.0, 18.0, 24.0, 34.0, 38.0, 34.0, 33.0, 41.0, 34.0, 42.0, 38.0, 43.0, 47.0, 42.0, 50.0, 40.0, 36.0, 41.0, 26.0, 31.0, 30.0, 29.0, 40.0, 21.0, 14.0, 19.0, 13.0, 9.0, 15.0, 6.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.53192901611328, -46.9837646484375, -45.435604095458984, -43.8874397277832, -42.33927917480469, -40.791114807128906, -39.242950439453125, -37.69478988647461, -36.14662551879883, -34.59846115112305, -33.05030059814453, -31.50213623046875, -29.9539737701416, -28.405811309814453, -26.857648849487305, -25.309486389160156, -23.761323928833008, -22.21316146850586, -20.66499900817871, -19.116836547851562, -17.56867218017578, -16.020509719848633, -14.472347259521484, -12.92418384552002, -11.376021385192871, -9.827858924865723, -8.279695510864258, -6.731533050537109, -5.183370113372803, -3.635207176208496, -2.0870447158813477, -0.5388813018798828, 1.0092811584472656, 2.5574440956115723, 4.105607032775879, 5.653769493103027, 7.201932430267334, 8.75009536743164, 10.298257827758789, 11.846421241760254, 13.394583702087402, 14.94274616241455, 16.490909576416016, 18.039072036743164, 19.587234497070312, 21.135398864746094, 22.68355941772461, 24.23172378540039, 25.77988624572754, 27.328048706054688, 28.876211166381836, 30.424373626708984, 31.972537994384766, 33.52069854736328, 35.06886291503906, 36.617027282714844, 38.16518783569336, 39.71335220336914, 41.261512756347656, 42.80967712402344, 44.35783767700195, 45.906002044677734, 47.45416259765625, 49.00232696533203, 50.55049133300781]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 14.0, 19.0, 34.0, 34.0, 65.0, 88.0, 156.0, 237.0, 367.0, 694.0, 1083.0, 1770.0, 3008.0, 5093.0, 9000.0, 15690.0, 27925.0, 48449.0, 80961.0, 124227.0, 163614.0, 173269.0, 144431.0, 100625.0, 62438.0, 36619.0, 20665.0, 11604.0, 6768.0, 3864.0, 2235.0, 1359.0, 802.0, 489.0, 313.0, 203.0, 98.0, 77.0, 56.0, 34.0, 30.0, 11.0, 8.0, 6.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0], "bins": [-56.46875, -54.8662109375, -53.263671875, -51.6611328125, -50.05859375, -48.4560546875, -46.853515625, -45.2509765625, -43.6484375, -42.0458984375, -40.443359375, -38.8408203125, -37.23828125, -35.6357421875, -34.033203125, -32.4306640625, -30.828125, -29.2255859375, -27.623046875, -26.0205078125, -24.41796875, -22.8154296875, -21.212890625, -19.6103515625, -18.0078125, -16.4052734375, -14.802734375, -13.2001953125, -11.59765625, -9.9951171875, -8.392578125, -6.7900390625, -5.1875, -3.5849609375, -1.982421875, -0.3798828125, 1.22265625, 2.8251953125, 4.427734375, 6.0302734375, 7.6328125, 9.2353515625, 10.837890625, 12.4404296875, 14.04296875, 15.6455078125, 17.248046875, 18.8505859375, 20.453125, 22.0556640625, 23.658203125, 25.2607421875, 26.86328125, 28.4658203125, 30.068359375, 31.6708984375, 33.2734375, 34.8759765625, 36.478515625, 38.0810546875, 39.68359375, 41.2861328125, 42.888671875, 44.4912109375, 46.09375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 3.0, 13.0, 9.0, 15.0, 14.0, 23.0, 16.0, 26.0, 30.0, 32.0, 29.0, 40.0, 43.0, 34.0, 44.0, 32.0, 35.0, 32.0, 57.0, 31.0, 47.0, 39.0, 28.0, 44.0, 28.0, 42.0, 24.0, 25.0, 27.0, 15.0, 25.0, 19.0, 14.0, 15.0, 8.0, 6.0, 2.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-41.6875, -40.388671875, -39.08984375, -37.791015625, -36.4921875, -35.193359375, -33.89453125, -32.595703125, -31.296875, -29.998046875, -28.69921875, -27.400390625, -26.1015625, -24.802734375, -23.50390625, -22.205078125, -20.90625, -19.607421875, -18.30859375, -17.009765625, -15.7109375, -14.412109375, -13.11328125, -11.814453125, -10.515625, -9.216796875, -7.91796875, -6.619140625, -5.3203125, -4.021484375, -2.72265625, -1.423828125, -0.125, 1.173828125, 2.47265625, 3.771484375, 5.0703125, 6.369140625, 7.66796875, 8.966796875, 10.265625, 11.564453125, 12.86328125, 14.162109375, 15.4609375, 16.759765625, 18.05859375, 19.357421875, 20.65625, 21.955078125, 23.25390625, 24.552734375, 25.8515625, 27.150390625, 28.44921875, 29.748046875, 31.046875, 32.345703125, 33.64453125, 34.943359375, 36.2421875, 37.541015625, 38.83984375, 40.138671875, 41.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 12.0, 15.0, 29.0, 52.0, 61.0, 107.0, 155.0, 266.0, 324.0, 531.0, 844.0, 1243.0, 1771.0, 2653.0, 3804.0, 5529.0, 8156.0, 11468.0, 16253.0, 22623.0, 31352.0, 42234.0, 55734.0, 70818.0, 85547.0, 97684.0, 103224.0, 100233.0, 89133.0, 74539.0, 59448.0, 45309.0, 33851.0, 24842.0, 17851.0, 12555.0, 8914.0, 6168.0, 4297.0, 3019.0, 1938.0, 1332.0, 893.0, 581.0, 412.0, 267.0, 165.0, 105.0, 82.0, 40.0, 40.0, 24.0, 16.0, 8.0, 4.0, 4.0, 0.0, 1.0], "bins": [-33.96875, -32.927734375, -31.88671875, -30.845703125, -29.8046875, -28.763671875, -27.72265625, -26.681640625, -25.640625, -24.599609375, -23.55859375, -22.517578125, -21.4765625, -20.435546875, -19.39453125, -18.353515625, -17.3125, -16.271484375, -15.23046875, -14.189453125, -13.1484375, -12.107421875, -11.06640625, -10.025390625, -8.984375, -7.943359375, -6.90234375, -5.861328125, -4.8203125, -3.779296875, -2.73828125, -1.697265625, -0.65625, 0.384765625, 1.42578125, 2.466796875, 3.5078125, 4.548828125, 5.58984375, 6.630859375, 7.671875, 8.712890625, 9.75390625, 10.794921875, 11.8359375, 12.876953125, 13.91796875, 14.958984375, 16.0, 17.041015625, 18.08203125, 19.123046875, 20.1640625, 21.205078125, 22.24609375, 23.287109375, 24.328125, 25.369140625, 26.41015625, 27.451171875, 28.4921875, 29.533203125, 30.57421875, 31.615234375, 32.65625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 14.0, 14.0, 23.0, 14.0, 16.0, 16.0, 22.0, 23.0, 33.0, 27.0, 36.0, 36.0, 36.0, 33.0, 35.0, 30.0, 40.0, 50.0, 38.0, 38.0, 35.0, 31.0, 48.0, 36.0, 32.0, 24.0, 30.0, 22.0, 19.0, 30.0, 16.0, 15.0, 16.0, 9.0, 10.0, 7.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.578125, -28.71826171875, -27.8583984375, -26.99853515625, -26.138671875, -25.27880859375, -24.4189453125, -23.55908203125, -22.69921875, -21.83935546875, -20.9794921875, -20.11962890625, -19.259765625, -18.39990234375, -17.5400390625, -16.68017578125, -15.8203125, -14.96044921875, -14.1005859375, -13.24072265625, -12.380859375, -11.52099609375, -10.6611328125, -9.80126953125, -8.94140625, -8.08154296875, -7.2216796875, -6.36181640625, -5.501953125, -4.64208984375, -3.7822265625, -2.92236328125, -2.0625, -1.20263671875, -0.3427734375, 0.51708984375, 1.376953125, 2.23681640625, 3.0966796875, 3.95654296875, 4.81640625, 5.67626953125, 6.5361328125, 7.39599609375, 8.255859375, 9.11572265625, 9.9755859375, 10.83544921875, 11.6953125, 12.55517578125, 13.4150390625, 14.27490234375, 15.134765625, 15.99462890625, 16.8544921875, 17.71435546875, 18.57421875, 19.43408203125, 20.2939453125, 21.15380859375, 22.013671875, 22.87353515625, 23.7333984375, 24.59326171875, 25.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 10.0, 13.0, 17.0, 32.0, 47.0, 76.0, 82.0, 156.0, 250.0, 408.0, 610.0, 1019.0, 1644.0, 2726.0, 4698.0, 8139.0, 13733.0, 23702.0, 39669.0, 65343.0, 101249.0, 139405.0, 161635.0, 154019.0, 120027.0, 82849.0, 51580.0, 30871.0, 18477.0, 10728.0, 6053.0, 3626.0, 2219.0, 1247.0, 800.0, 474.0, 342.0, 207.0, 149.0, 83.0, 48.0, 40.0, 20.0, 11.0, 12.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.84521484375, -8.5576171875, -8.27001953125, -7.982421875, -7.69482421875, -7.4072265625, -7.11962890625, -6.83203125, -6.54443359375, -6.2568359375, -5.96923828125, -5.681640625, -5.39404296875, -5.1064453125, -4.81884765625, -4.53125, -4.24365234375, -3.9560546875, -3.66845703125, -3.380859375, -3.09326171875, -2.8056640625, -2.51806640625, -2.23046875, -1.94287109375, -1.6552734375, -1.36767578125, -1.080078125, -0.79248046875, -0.5048828125, -0.21728515625, 0.0703125, 0.35791015625, 0.6455078125, 0.93310546875, 1.220703125, 1.50830078125, 1.7958984375, 2.08349609375, 2.37109375, 2.65869140625, 2.9462890625, 3.23388671875, 3.521484375, 3.80908203125, 4.0966796875, 4.38427734375, 4.671875, 4.95947265625, 5.2470703125, 5.53466796875, 5.822265625, 6.10986328125, 6.3974609375, 6.68505859375, 6.97265625, 7.26025390625, 7.5478515625, 7.83544921875, 8.123046875, 8.41064453125, 8.6982421875, 8.98583984375, 9.2734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 5.0, 12.0, 6.0, 10.0, 22.0, 24.0, 20.0, 40.0, 29.0, 43.0, 31.0, 54.0, 63.0, 50.0, 50.0, 64.0, 69.0, 61.0, 57.0, 55.0, 36.0, 25.0, 36.0, 30.0, 19.0, 16.0, 13.0, 19.0, 12.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0010442733764648438, -0.0010155066847801208, -0.000986739993095398, -0.000957973301410675, -0.0009292066097259521, -0.0009004399180412292, -0.0008716732263565063, -0.0008429065346717834, -0.0008141398429870605, -0.0007853731513023376, -0.0007566064596176147, -0.0007278397679328918, -0.0006990730762481689, -0.000670306384563446, -0.0006415396928787231, -0.0006127730011940002, -0.0005840063095092773, -0.0005552396178245544, -0.0005264729261398315, -0.0004977062344551086, -0.00046893954277038574, -0.00044017285108566284, -0.00041140615940093994, -0.00038263946771621704, -0.00035387277603149414, -0.00032510608434677124, -0.00029633939266204834, -0.00026757270097732544, -0.00023880600929260254, -0.00021003931760787964, -0.00018127262592315674, -0.00015250593423843384, -0.00012373924255371094, -9.497255086898804e-05, -6.620585918426514e-05, -3.7439167499542236e-05, -8.672475814819336e-06, 2.0094215869903564e-05, 4.8860907554626465e-05, 7.762759923934937e-05, 0.00010639429092407227, 0.00013516098260879517, 0.00016392767429351807, 0.00019269436597824097, 0.00022146105766296387, 0.00025022774934768677, 0.00027899444103240967, 0.00030776113271713257, 0.00033652782440185547, 0.00036529451608657837, 0.00039406120777130127, 0.00042282789945602417, 0.00045159459114074707, 0.00048036128282546997, 0.0005091279745101929, 0.0005378946661949158, 0.0005666613578796387, 0.0005954280495643616, 0.0006241947412490845, 0.0006529614329338074, 0.0006817281246185303, 0.0007104948163032532, 0.0007392615079879761, 0.000768028199672699, 0.0007967948913574219]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 10.0, 5.0, 11.0, 18.0, 31.0, 44.0, 66.0, 84.0, 160.0, 230.0, 366.0, 534.0, 838.0, 1271.0, 1955.0, 2828.0, 4604.0, 6809.0, 10267.0, 15653.0, 23464.0, 35101.0, 49693.0, 69651.0, 90727.0, 111006.0, 122430.0, 119602.0, 103771.0, 83126.0, 61383.0, 43579.0, 29917.0, 20103.0, 13434.0, 8836.0, 5822.0, 3754.0, 2566.0, 1582.0, 1109.0, 721.0, 480.0, 304.0, 202.0, 147.0, 90.0, 57.0, 44.0, 24.0, 22.0, 9.0, 10.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.455322265625, -6.23876953125, -6.022216796875, -5.8056640625, -5.589111328125, -5.37255859375, -5.156005859375, -4.939453125, -4.722900390625, -4.50634765625, -4.289794921875, -4.0732421875, -3.856689453125, -3.64013671875, -3.423583984375, -3.20703125, -2.990478515625, -2.77392578125, -2.557373046875, -2.3408203125, -2.124267578125, -1.90771484375, -1.691162109375, -1.474609375, -1.258056640625, -1.04150390625, -0.824951171875, -0.6083984375, -0.391845703125, -0.17529296875, 0.041259765625, 0.2578125, 0.474365234375, 0.69091796875, 0.907470703125, 1.1240234375, 1.340576171875, 1.55712890625, 1.773681640625, 1.990234375, 2.206787109375, 2.42333984375, 2.639892578125, 2.8564453125, 3.072998046875, 3.28955078125, 3.506103515625, 3.72265625, 3.939208984375, 4.15576171875, 4.372314453125, 4.5888671875, 4.805419921875, 5.02197265625, 5.238525390625, 5.455078125, 5.671630859375, 5.88818359375, 6.104736328125, 6.3212890625, 6.537841796875, 6.75439453125, 6.970947265625, 7.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 10.0, 5.0, 6.0, 12.0, 10.0, 16.0, 16.0, 25.0, 21.0, 25.0, 26.0, 28.0, 41.0, 29.0, 56.0, 54.0, 53.0, 37.0, 33.0, 39.0, 34.0, 54.0, 44.0, 43.0, 30.0, 33.0, 31.0, 27.0, 20.0, 24.0, 16.0, 18.0, 12.0, 15.0, 9.0, 9.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.478515625, -3.377655029296875, -3.27679443359375, -3.175933837890625, -3.0750732421875, -2.974212646484375, -2.87335205078125, -2.772491455078125, -2.671630859375, -2.570770263671875, -2.46990966796875, -2.369049072265625, -2.2681884765625, -2.167327880859375, -2.06646728515625, -1.965606689453125, -1.86474609375, -1.763885498046875, -1.66302490234375, -1.562164306640625, -1.4613037109375, -1.360443115234375, -1.25958251953125, -1.158721923828125, -1.057861328125, -0.957000732421875, -0.85614013671875, -0.755279541015625, -0.6544189453125, -0.553558349609375, -0.45269775390625, -0.351837158203125, -0.2509765625, -0.150115966796875, -0.04925537109375, 0.051605224609375, 0.1524658203125, 0.253326416015625, 0.35418701171875, 0.455047607421875, 0.555908203125, 0.656768798828125, 0.75762939453125, 0.858489990234375, 0.9593505859375, 1.060211181640625, 1.16107177734375, 1.261932373046875, 1.36279296875, 1.463653564453125, 1.56451416015625, 1.665374755859375, 1.7662353515625, 1.867095947265625, 1.96795654296875, 2.068817138671875, 2.169677734375, 2.270538330078125, 2.37139892578125, 2.472259521484375, 2.5731201171875, 2.673980712890625, 2.77484130859375, 2.875701904296875, 2.9765625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 10.0, 7.0, 7.0, 10.0, 10.0, 14.0, 18.0, 18.0, 20.0, 38.0, 33.0, 43.0, 40.0, 43.0, 42.0, 44.0, 51.0, 45.0, 42.0, 38.0, 46.0, 47.0, 51.0, 38.0, 52.0, 21.0, 28.0, 17.0, 25.0, 17.0, 17.0, 11.0, 8.0, 12.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.775482177734375, -34.43992233276367, -33.10436248779297, -31.7688045501709, -30.433244705200195, -29.097684860229492, -27.762126922607422, -26.42656707763672, -25.091007232666016, -23.755447387695312, -22.41988754272461, -21.08432960510254, -19.748769760131836, -18.413209915161133, -17.077651977539062, -15.74209213256836, -14.406532287597656, -13.070972442626953, -11.735413551330566, -10.39985466003418, -9.064294815063477, -7.728735446929932, -6.393176078796387, -5.0576171875, -3.722057342529297, -2.386497974395752, -1.050938606262207, 0.2846207618713379, 1.6201801300048828, 2.9557394981384277, 4.291298866271973, 5.626857757568359, 6.962421417236328, 8.297981262207031, 9.633540153503418, 10.969099044799805, 12.304658889770508, 13.640218734741211, 14.975777626037598, 16.311336517333984, 17.646896362304688, 18.98245620727539, 20.318016052246094, 21.653573989868164, 22.989133834838867, 24.32469367980957, 25.66025161743164, 26.995811462402344, 28.331371307373047, 29.66693115234375, 31.002490997314453, 32.338050842285156, 33.673606872558594, 35.0091667175293, 36.3447265625, 37.6802864074707, 39.015846252441406, 40.35140609741211, 41.68696594238281, 43.022525787353516, 44.35808563232422, 45.693641662597656, 47.02920150756836, 48.36476135253906, 49.700321197509766]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 9.0, 12.0, 8.0, 10.0, 6.0, 13.0, 17.0, 13.0, 19.0, 23.0, 25.0, 24.0, 28.0, 30.0, 28.0, 38.0, 38.0, 26.0, 35.0, 36.0, 35.0, 42.0, 36.0, 42.0, 40.0, 36.0, 35.0, 25.0, 42.0, 24.0, 27.0, 24.0, 24.0, 20.0, 14.0, 18.0, 10.0, 12.0, 5.0, 8.0, 8.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-42.815799713134766, -41.51879119873047, -40.22178268432617, -38.924774169921875, -37.627769470214844, -36.33076095581055, -35.03375244140625, -33.73674392700195, -32.439735412597656, -31.14272689819336, -29.845718383789062, -28.5487117767334, -27.2517032623291, -25.954694747924805, -24.65768814086914, -23.360679626464844, -22.063671112060547, -20.76666259765625, -19.469654083251953, -18.17264747619629, -16.875638961791992, -15.578630447387695, -14.281622886657715, -12.984615325927734, -11.687606811523438, -10.39059829711914, -9.09359073638916, -7.7965826988220215, -6.499574661254883, -5.202566623687744, -3.9055585861206055, -2.608551025390625, -1.3115386962890625, -0.014530658721923828, 1.2824773788452148, 2.5794854164123535, 3.876493453979492, 5.173501491546631, 6.4705095291137695, 7.76751708984375, 9.064525604248047, 10.361534118652344, 11.658541679382324, 12.955549240112305, 14.252557754516602, 15.549566268920898, 16.846572875976562, 18.14358139038086, 19.440589904785156, 20.737598419189453, 22.03460693359375, 23.331613540649414, 24.62862205505371, 25.925630569458008, 27.222637176513672, 28.51964569091797, 29.816654205322266, 31.113662719726562, 32.41067123413086, 33.707679748535156, 35.00468444824219, 36.301692962646484, 37.59870147705078, 38.89570999145508, 40.192718505859375]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 8.0, 1.0, 9.0, 13.0, 16.0, 28.0, 51.0, 80.0, 126.0, 210.0, 350.0, 537.0, 963.0, 1618.0, 2866.0, 4832.0, 8682.0, 15577.0, 27837.0, 51138.0, 93677.0, 172073.0, 312669.0, 530886.0, 749148.0, 785362.0, 604804.0, 374983.0, 209391.0, 113314.0, 60885.0, 32608.0, 17926.0, 9750.0, 5282.0, 2959.0, 1606.0, 899.0, 478.0, 261.0, 153.0, 104.0, 55.0, 33.0, 25.0, 10.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.875, -35.65185546875, -34.4287109375, -33.20556640625, -31.982421875, -30.75927734375, -29.5361328125, -28.31298828125, -27.08984375, -25.86669921875, -24.6435546875, -23.42041015625, -22.197265625, -20.97412109375, -19.7509765625, -18.52783203125, -17.3046875, -16.08154296875, -14.8583984375, -13.63525390625, -12.412109375, -11.18896484375, -9.9658203125, -8.74267578125, -7.51953125, -6.29638671875, -5.0732421875, -3.85009765625, -2.626953125, -1.40380859375, -0.1806640625, 1.04248046875, 2.265625, 3.48876953125, 4.7119140625, 5.93505859375, 7.158203125, 8.38134765625, 9.6044921875, 10.82763671875, 12.05078125, 13.27392578125, 14.4970703125, 15.72021484375, 16.943359375, 18.16650390625, 19.3896484375, 20.61279296875, 21.8359375, 23.05908203125, 24.2822265625, 25.50537109375, 26.728515625, 27.95166015625, 29.1748046875, 30.39794921875, 31.62109375, 32.84423828125, 34.0673828125, 35.29052734375, 36.513671875, 37.73681640625, 38.9599609375, 40.18310546875, 41.40625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 6.0, 4.0, 14.0, 15.0, 11.0, 13.0, 15.0, 22.0, 20.0, 23.0, 28.0, 32.0, 39.0, 22.0, 29.0, 38.0, 34.0, 29.0, 31.0, 50.0, 34.0, 37.0, 38.0, 41.0, 45.0, 38.0, 20.0, 41.0, 30.0, 26.0, 23.0, 23.0, 19.0, 10.0, 22.0, 12.0, 7.0, 7.0, 7.0, 10.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-29.65625, -28.754150390625, -27.85205078125, -26.949951171875, -26.0478515625, -25.145751953125, -24.24365234375, -23.341552734375, -22.439453125, -21.537353515625, -20.63525390625, -19.733154296875, -18.8310546875, -17.928955078125, -17.02685546875, -16.124755859375, -15.22265625, -14.320556640625, -13.41845703125, -12.516357421875, -11.6142578125, -10.712158203125, -9.81005859375, -8.907958984375, -8.005859375, -7.103759765625, -6.20166015625, -5.299560546875, -4.3974609375, -3.495361328125, -2.59326171875, -1.691162109375, -0.7890625, 0.113037109375, 1.01513671875, 1.917236328125, 2.8193359375, 3.721435546875, 4.62353515625, 5.525634765625, 6.427734375, 7.329833984375, 8.23193359375, 9.134033203125, 10.0361328125, 10.938232421875, 11.84033203125, 12.742431640625, 13.64453125, 14.546630859375, 15.44873046875, 16.350830078125, 17.2529296875, 18.155029296875, 19.05712890625, 19.959228515625, 20.861328125, 21.763427734375, 22.66552734375, 23.567626953125, 24.4697265625, 25.371826171875, 26.27392578125, 27.176025390625, 28.078125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 18.0, 22.0, 45.0, 80.0, 104.0, 173.0, 323.0, 566.0, 904.0, 1587.0, 2745.0, 4749.0, 8539.0, 15419.0, 26822.0, 47246.0, 81289.0, 136823.0, 223031.0, 341555.0, 479969.0, 594881.0, 618156.0, 533476.0, 399456.0, 267673.0, 169155.0, 101378.0, 59523.0, 33956.0, 19152.0, 10982.0, 6254.0, 3540.0, 1959.0, 1146.0, 605.0, 384.0, 223.0, 138.0, 88.0, 45.0, 30.0, 27.0, 9.0, 14.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-34.25, -33.248779296875, -32.24755859375, -31.246337890625, -30.2451171875, -29.243896484375, -28.24267578125, -27.241455078125, -26.240234375, -25.239013671875, -24.23779296875, -23.236572265625, -22.2353515625, -21.234130859375, -20.23291015625, -19.231689453125, -18.23046875, -17.229248046875, -16.22802734375, -15.226806640625, -14.2255859375, -13.224365234375, -12.22314453125, -11.221923828125, -10.220703125, -9.219482421875, -8.21826171875, -7.217041015625, -6.2158203125, -5.214599609375, -4.21337890625, -3.212158203125, -2.2109375, -1.209716796875, -0.20849609375, 0.792724609375, 1.7939453125, 2.795166015625, 3.79638671875, 4.797607421875, 5.798828125, 6.800048828125, 7.80126953125, 8.802490234375, 9.8037109375, 10.804931640625, 11.80615234375, 12.807373046875, 13.80859375, 14.809814453125, 15.81103515625, 16.812255859375, 17.8134765625, 18.814697265625, 19.81591796875, 20.817138671875, 21.818359375, 22.819580078125, 23.82080078125, 24.822021484375, 25.8232421875, 26.824462890625, 27.82568359375, 28.826904296875, 29.828125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 6.0, 5.0, 6.0, 1.0, 9.0, 9.0, 14.0, 15.0, 14.0, 22.0, 42.0, 48.0, 43.0, 66.0, 72.0, 91.0, 116.0, 134.0, 156.0, 179.0, 190.0, 223.0, 235.0, 258.0, 266.0, 244.0, 239.0, 210.0, 188.0, 204.0, 146.0, 142.0, 88.0, 98.0, 73.0, 56.0, 37.0, 43.0, 36.0, 12.0, 18.0, 14.0, 6.0, 6.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5390625, -14.0382080078125, -13.537353515625, -13.0364990234375, -12.53564453125, -12.0347900390625, -11.533935546875, -11.0330810546875, -10.5322265625, -10.0313720703125, -9.530517578125, -9.0296630859375, -8.52880859375, -8.0279541015625, -7.527099609375, -7.0262451171875, -6.525390625, -6.0245361328125, -5.523681640625, -5.0228271484375, -4.52197265625, -4.0211181640625, -3.520263671875, -3.0194091796875, -2.5185546875, -2.0177001953125, -1.516845703125, -1.0159912109375, -0.51513671875, -0.0142822265625, 0.486572265625, 0.9874267578125, 1.48828125, 1.9891357421875, 2.489990234375, 2.9908447265625, 3.49169921875, 3.9925537109375, 4.493408203125, 4.9942626953125, 5.4951171875, 5.9959716796875, 6.496826171875, 6.9976806640625, 7.49853515625, 7.9993896484375, 8.500244140625, 9.0010986328125, 9.501953125, 10.0028076171875, 10.503662109375, 11.0045166015625, 11.50537109375, 12.0062255859375, 12.507080078125, 13.0079345703125, 13.5087890625, 14.0096435546875, 14.510498046875, 15.0113525390625, 15.51220703125, 16.0130615234375, 16.513916015625, 17.0147705078125, 17.515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 6.0, 8.0, 4.0, 5.0, 5.0, 12.0, 13.0, 5.0, 16.0, 24.0, 30.0, 32.0, 28.0, 33.0, 34.0, 33.0, 32.0, 31.0, 27.0, 46.0, 50.0, 42.0, 42.0, 39.0, 42.0, 26.0, 32.0, 31.0, 30.0, 26.0, 36.0, 22.0, 23.0, 10.0, 19.0, 20.0, 12.0, 9.0, 11.0, 10.0, 13.0, 2.0, 6.0, 3.0, 2.0, 4.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-26.792695999145508, -25.934385299682617, -25.07607650756836, -24.21776580810547, -23.359455108642578, -22.50114631652832, -21.64283561706543, -20.784526824951172, -19.92621612548828, -19.06790542602539, -18.209596633911133, -17.351285934448242, -16.492977142333984, -15.634666442871094, -14.776355743408203, -13.918045997619629, -13.059736251831055, -12.20142650604248, -11.343116760253906, -10.484806060791016, -9.626496315002441, -8.768186569213867, -7.909876346588135, -7.051566123962402, -6.193256378173828, -5.334946632385254, -4.4766364097595215, -3.618326425552368, -2.760016441345215, -1.9017066955566406, -1.0433964729309082, -0.18508625030517578, 0.6732215881347656, 1.531531572341919, 2.3898415565490723, 3.2481515407562256, 4.106461524963379, 4.964771270751953, 5.8230814933776855, 6.681391716003418, 7.539701461791992, 8.398011207580566, 9.25632095336914, 10.114631652832031, 10.972941398620605, 11.83125114440918, 12.68956184387207, 13.547871589660645, 14.406181335449219, 15.264491081237793, 16.122800827026367, 16.981111526489258, 17.839420318603516, 18.697731018066406, 19.556041717529297, 20.414352416992188, 21.272661209106445, 22.130971908569336, 22.989280700683594, 23.847591400146484, 24.705902099609375, 25.564210891723633, 26.422521591186523, 27.28083038330078, 28.139141082763672]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 9.0, 10.0, 7.0, 16.0, 15.0, 17.0, 18.0, 17.0, 21.0, 21.0, 19.0, 32.0, 33.0, 32.0, 36.0, 34.0, 27.0, 33.0, 43.0, 41.0, 27.0, 36.0, 41.0, 36.0, 40.0, 47.0, 32.0, 34.0, 31.0, 34.0, 22.0, 21.0, 17.0, 14.0, 16.0, 11.0, 11.0, 14.0, 3.0, 6.0, 7.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-37.08106231689453, -36.048091888427734, -35.01512145996094, -33.98215103149414, -32.949180603027344, -31.91621208190918, -30.883241653442383, -29.850271224975586, -28.817302703857422, -27.784332275390625, -26.751361846923828, -25.71839141845703, -24.685422897338867, -23.65245246887207, -22.619482040405273, -21.586511611938477, -20.55354118347168, -19.520570755004883, -18.487600326538086, -17.454631805419922, -16.421661376953125, -15.388690948486328, -14.355720520019531, -13.322750091552734, -12.289780616760254, -11.256810188293457, -10.223840713500977, -9.19087028503418, -8.157899856567383, -7.124930381774902, -6.0919599533081055, -5.058990001678467, -4.026020050048828, -2.9930500984191895, -1.9600799083709717, -0.9271097183227539, 0.10586023330688477, 1.1388301849365234, 2.1718006134033203, 3.204770565032959, 4.237740516662598, 5.270710468292236, 6.303680419921875, 7.336650848388672, 8.369621276855469, 9.40259075164795, 10.435561180114746, 11.468530654907227, 12.501501083374023, 13.53447151184082, 14.5674409866333, 15.600411415100098, 16.633380889892578, 17.666351318359375, 18.699321746826172, 19.73229217529297, 20.765262603759766, 21.798233032226562, 22.83120346069336, 23.864173889160156, 24.89714241027832, 25.930112838745117, 26.963083267211914, 27.99605369567871, 29.029022216796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 9.0, 17.0, 20.0, 25.0, 46.0, 68.0, 82.0, 166.0, 231.0, 390.0, 643.0, 1234.0, 2080.0, 3606.0, 6607.0, 12110.0, 22856.0, 45175.0, 94152.0, 196177.0, 291995.0, 188593.0, 90129.0, 43534.0, 22096.0, 11901.0, 6363.0, 3476.0, 1930.0, 1154.0, 626.0, 413.0, 213.0, 146.0, 89.0, 68.0, 35.0, 34.0, 17.0, 10.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.8798828125, -8.556640625, -8.2333984375, -7.91015625, -7.5869140625, -7.263671875, -6.9404296875, -6.6171875, -6.2939453125, -5.970703125, -5.6474609375, -5.32421875, -5.0009765625, -4.677734375, -4.3544921875, -4.03125, -3.7080078125, -3.384765625, -3.0615234375, -2.73828125, -2.4150390625, -2.091796875, -1.7685546875, -1.4453125, -1.1220703125, -0.798828125, -0.4755859375, -0.15234375, 0.1708984375, 0.494140625, 0.8173828125, 1.140625, 1.4638671875, 1.787109375, 2.1103515625, 2.43359375, 2.7568359375, 3.080078125, 3.4033203125, 3.7265625, 4.0498046875, 4.373046875, 4.6962890625, 5.01953125, 5.3427734375, 5.666015625, 5.9892578125, 6.3125, 6.6357421875, 6.958984375, 7.2822265625, 7.60546875, 7.9287109375, 8.251953125, 8.5751953125, 8.8984375, 9.2216796875, 9.544921875, 9.8681640625, 10.19140625, 10.5146484375, 10.837890625, 11.1611328125, 11.484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 7.0, 6.0, 5.0, 9.0, 14.0, 18.0, 19.0, 21.0, 21.0, 24.0, 29.0, 31.0, 27.0, 39.0, 30.0, 21.0, 37.0, 36.0, 38.0, 41.0, 29.0, 46.0, 41.0, 34.0, 37.0, 46.0, 35.0, 35.0, 35.0, 22.0, 24.0, 28.0, 20.0, 14.0, 11.0, 8.0, 11.0, 8.0, 5.0, 11.0, 0.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.25, -33.20751953125, -32.1650390625, -31.12255859375, -30.080078125, -29.03759765625, -27.9951171875, -26.95263671875, -25.91015625, -24.86767578125, -23.8251953125, -22.78271484375, -21.740234375, -20.69775390625, -19.6552734375, -18.61279296875, -17.5703125, -16.52783203125, -15.4853515625, -14.44287109375, -13.400390625, -12.35791015625, -11.3154296875, -10.27294921875, -9.23046875, -8.18798828125, -7.1455078125, -6.10302734375, -5.060546875, -4.01806640625, -2.9755859375, -1.93310546875, -0.890625, 0.15185546875, 1.1943359375, 2.23681640625, 3.279296875, 4.32177734375, 5.3642578125, 6.40673828125, 7.44921875, 8.49169921875, 9.5341796875, 10.57666015625, 11.619140625, 12.66162109375, 13.7041015625, 14.74658203125, 15.7890625, 16.83154296875, 17.8740234375, 18.91650390625, 19.958984375, 21.00146484375, 22.0439453125, 23.08642578125, 24.12890625, 25.17138671875, 26.2138671875, 27.25634765625, 28.298828125, 29.34130859375, 30.3837890625, 31.42626953125, 32.46875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 11.0, 13.0, 26.0, 21.0, 35.0, 33.0, 53.0, 71.0, 105.0, 133.0, 211.0, 289.0, 467.0, 701.0, 1070.0, 1614.0, 2515.0, 4100.0, 6781.0, 11509.0, 19923.0, 35324.0, 63773.0, 114875.0, 191636.0, 231154.0, 156184.0, 89662.0, 49101.0, 27335.0, 15497.0, 9265.0, 5627.0, 3369.0, 2053.0, 1296.0, 825.0, 603.0, 381.0, 255.0, 205.0, 122.0, 89.0, 72.0, 48.0, 28.0, 22.0, 22.0, 20.0, 6.0, 3.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-5.9765625, -5.79144287109375, -5.6063232421875, -5.42120361328125, -5.236083984375, -5.05096435546875, -4.8658447265625, -4.68072509765625, -4.49560546875, -4.31048583984375, -4.1253662109375, -3.94024658203125, -3.755126953125, -3.57000732421875, -3.3848876953125, -3.19976806640625, -3.0146484375, -2.82952880859375, -2.6444091796875, -2.45928955078125, -2.274169921875, -2.08905029296875, -1.9039306640625, -1.71881103515625, -1.53369140625, -1.34857177734375, -1.1634521484375, -0.97833251953125, -0.793212890625, -0.60809326171875, -0.4229736328125, -0.23785400390625, -0.052734375, 0.13238525390625, 0.3175048828125, 0.50262451171875, 0.687744140625, 0.87286376953125, 1.0579833984375, 1.24310302734375, 1.42822265625, 1.61334228515625, 1.7984619140625, 1.98358154296875, 2.168701171875, 2.35382080078125, 2.5389404296875, 2.72406005859375, 2.9091796875, 3.09429931640625, 3.2794189453125, 3.46453857421875, 3.649658203125, 3.83477783203125, 4.0198974609375, 4.20501708984375, 4.39013671875, 4.57525634765625, 4.7603759765625, 4.94549560546875, 5.130615234375, 5.31573486328125, 5.5008544921875, 5.68597412109375, 5.87109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 10.0, 5.0, 9.0, 15.0, 24.0, 14.0, 14.0, 18.0, 21.0, 29.0, 27.0, 31.0, 26.0, 26.0, 26.0, 46.0, 38.0, 43.0, 31.0, 29.0, 33.0, 41.0, 46.0, 34.0, 36.0, 33.0, 28.0, 30.0, 26.0, 20.0, 26.0, 26.0, 22.0, 10.0, 19.0, 14.0, 11.0, 16.0, 5.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.890625, -24.128662109375, -23.36669921875, -22.604736328125, -21.8427734375, -21.080810546875, -20.31884765625, -19.556884765625, -18.794921875, -18.032958984375, -17.27099609375, -16.509033203125, -15.7470703125, -14.985107421875, -14.22314453125, -13.461181640625, -12.69921875, -11.937255859375, -11.17529296875, -10.413330078125, -9.6513671875, -8.889404296875, -8.12744140625, -7.365478515625, -6.603515625, -5.841552734375, -5.07958984375, -4.317626953125, -3.5556640625, -2.793701171875, -2.03173828125, -1.269775390625, -0.5078125, 0.254150390625, 1.01611328125, 1.778076171875, 2.5400390625, 3.302001953125, 4.06396484375, 4.825927734375, 5.587890625, 6.349853515625, 7.11181640625, 7.873779296875, 8.6357421875, 9.397705078125, 10.15966796875, 10.921630859375, 11.68359375, 12.445556640625, 13.20751953125, 13.969482421875, 14.7314453125, 15.493408203125, 16.25537109375, 17.017333984375, 17.779296875, 18.541259765625, 19.30322265625, 20.065185546875, 20.8271484375, 21.589111328125, 22.35107421875, 23.113037109375, 23.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 2.0, 5.0, 5.0, 12.0, 17.0, 23.0, 41.0, 65.0, 90.0, 147.0, 215.0, 321.0, 464.0, 712.0, 1049.0, 1636.0, 2597.0, 4381.0, 7449.0, 13190.0, 25049.0, 51079.0, 112902.0, 292708.0, 305728.0, 117507.0, 52355.0, 25641.0, 13472.0, 7696.0, 4474.0, 2675.0, 1678.0, 1043.0, 681.0, 471.0, 326.0, 210.0, 156.0, 93.0, 67.0, 43.0, 36.0, 18.0, 7.0, 4.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.642578125, -0.6218643188476562, -0.6011505126953125, -0.5804367065429688, -0.559722900390625, -0.5390090942382812, -0.5182952880859375, -0.49758148193359375, -0.47686767578125, -0.45615386962890625, -0.4354400634765625, -0.41472625732421875, -0.394012451171875, -0.37329864501953125, -0.3525848388671875, -0.33187103271484375, -0.3111572265625, -0.29044342041015625, -0.2697296142578125, -0.24901580810546875, -0.228302001953125, -0.20758819580078125, -0.1868743896484375, -0.16616058349609375, -0.14544677734375, -0.12473297119140625, -0.1040191650390625, -0.08330535888671875, -0.062591552734375, -0.04187774658203125, -0.0211639404296875, -0.00045013427734375, 0.020263671875, 0.04097747802734375, 0.0616912841796875, 0.08240509033203125, 0.103118896484375, 0.12383270263671875, 0.1445465087890625, 0.16526031494140625, 0.18597412109375, 0.20668792724609375, 0.2274017333984375, 0.24811553955078125, 0.268829345703125, 0.28954315185546875, 0.3102569580078125, 0.33097076416015625, 0.3516845703125, 0.37239837646484375, 0.3931121826171875, 0.41382598876953125, 0.434539794921875, 0.45525360107421875, 0.4759674072265625, 0.49668121337890625, 0.51739501953125, 0.5381088256835938, 0.5588226318359375, 0.5795364379882812, 0.600250244140625, 0.6209640502929688, 0.6416778564453125, 0.6623916625976562, 0.68310546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 5.0, 4.0, 9.0, 9.0, 11.0, 9.0, 26.0, 31.0, 41.0, 47.0, 78.0, 67.0, 85.0, 98.0, 83.0, 93.0, 75.0, 68.0, 44.0, 25.0, 25.0, 17.0, 17.0, 11.0, 4.0, 2.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013875961303710938, -0.00013453513383865356, -0.00013031065464019775, -0.00012608617544174194, -0.00012186169624328613, -0.00011763721704483032, -0.00011341273784637451, -0.0001091882586479187, -0.00010496377944946289, -0.00010073930025100708, -9.651482105255127e-05, -9.229034185409546e-05, -8.806586265563965e-05, -8.384138345718384e-05, -7.961690425872803e-05, -7.539242506027222e-05, -7.11679458618164e-05, -6.69434666633606e-05, -6.271898746490479e-05, -5.8494508266448975e-05, -5.4270029067993164e-05, -5.0045549869537354e-05, -4.582107067108154e-05, -4.159659147262573e-05, -3.737211227416992e-05, -3.314763307571411e-05, -2.89231538772583e-05, -2.469867467880249e-05, -2.047419548034668e-05, -1.624971628189087e-05, -1.2025237083435059e-05, -7.800757884979248e-06, -3.5762786865234375e-06, 6.48200511932373e-07, 4.872679710388184e-06, 9.097158908843994e-06, 1.3321638107299805e-05, 1.7546117305755615e-05, 2.1770596504211426e-05, 2.5995075702667236e-05, 3.0219554901123047e-05, 3.444403409957886e-05, 3.866851329803467e-05, 4.289299249649048e-05, 4.711747169494629e-05, 5.13419508934021e-05, 5.556643009185791e-05, 5.979090929031372e-05, 6.401538848876953e-05, 6.823986768722534e-05, 7.246434688568115e-05, 7.668882608413696e-05, 8.091330528259277e-05, 8.513778448104858e-05, 8.93622636795044e-05, 9.35867428779602e-05, 9.781122207641602e-05, 0.00010203570127487183, 0.00010626018047332764, 0.00011048465967178345, 0.00011470913887023926, 0.00011893361806869507, 0.00012315809726715088, 0.0001273825764656067, 0.0001316070556640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 14.0, 13.0, 26.0, 37.0, 64.0, 75.0, 148.0, 229.0, 309.0, 460.0, 720.0, 1164.0, 1596.0, 2425.0, 3783.0, 5639.0, 8214.0, 12556.0, 18439.0, 27743.0, 43322.0, 67580.0, 113405.0, 225121.0, 215368.0, 110426.0, 65864.0, 41577.0, 27561.0, 18191.0, 12057.0, 8014.0, 5526.0, 3687.0, 2398.0, 1587.0, 1186.0, 725.0, 453.0, 300.0, 194.0, 120.0, 76.0, 60.0, 31.0, 26.0, 9.0, 13.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.1015625, -1.067108154296875, -1.03265380859375, -0.998199462890625, -0.9637451171875, -0.929290771484375, -0.89483642578125, -0.860382080078125, -0.825927734375, -0.791473388671875, -0.75701904296875, -0.722564697265625, -0.6881103515625, -0.653656005859375, -0.61920166015625, -0.584747314453125, -0.55029296875, -0.515838623046875, -0.48138427734375, -0.446929931640625, -0.4124755859375, -0.378021240234375, -0.34356689453125, -0.309112548828125, -0.274658203125, -0.240203857421875, -0.20574951171875, -0.171295166015625, -0.1368408203125, -0.102386474609375, -0.06793212890625, -0.033477783203125, 0.0009765625, 0.035430908203125, 0.06988525390625, 0.104339599609375, 0.1387939453125, 0.173248291015625, 0.20770263671875, 0.242156982421875, 0.276611328125, 0.311065673828125, 0.34552001953125, 0.379974365234375, 0.4144287109375, 0.448883056640625, 0.48333740234375, 0.517791748046875, 0.55224609375, 0.586700439453125, 0.62115478515625, 0.655609130859375, 0.6900634765625, 0.724517822265625, 0.75897216796875, 0.793426513671875, 0.827880859375, 0.862335205078125, 0.89678955078125, 0.931243896484375, 0.9656982421875, 1.000152587890625, 1.03460693359375, 1.069061279296875, 1.103515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 2.0, 9.0, 7.0, 5.0, 6.0, 15.0, 13.0, 9.0, 16.0, 17.0, 15.0, 20.0, 40.0, 23.0, 22.0, 41.0, 40.0, 39.0, 41.0, 39.0, 53.0, 37.0, 44.0, 49.0, 33.0, 45.0, 47.0, 29.0, 30.0, 22.0, 26.0, 17.0, 21.0, 16.0, 18.0, 16.0, 11.0, 12.0, 6.0, 12.0, 9.0, 5.0, 7.0, 5.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51513671875, -0.49884033203125, -0.4825439453125, -0.46624755859375, -0.449951171875, -0.43365478515625, -0.4173583984375, -0.40106201171875, -0.384765625, -0.36846923828125, -0.3521728515625, -0.33587646484375, -0.319580078125, -0.30328369140625, -0.2869873046875, -0.27069091796875, -0.25439453125, -0.23809814453125, -0.2218017578125, -0.20550537109375, -0.189208984375, -0.17291259765625, -0.1566162109375, -0.14031982421875, -0.1240234375, -0.10772705078125, -0.0914306640625, -0.07513427734375, -0.058837890625, -0.04254150390625, -0.0262451171875, -0.00994873046875, 0.00634765625, 0.02264404296875, 0.0389404296875, 0.05523681640625, 0.071533203125, 0.08782958984375, 0.1041259765625, 0.12042236328125, 0.13671875, 0.15301513671875, 0.1693115234375, 0.18560791015625, 0.201904296875, 0.21820068359375, 0.2344970703125, 0.25079345703125, 0.26708984375, 0.28338623046875, 0.2996826171875, 0.31597900390625, 0.332275390625, 0.34857177734375, 0.3648681640625, 0.38116455078125, 0.3974609375, 0.41375732421875, 0.4300537109375, 0.44635009765625, 0.462646484375, 0.47894287109375, 0.4952392578125, 0.51153564453125, 0.52783203125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 5.0, 8.0, 5.0, 5.0, 4.0, 5.0, 13.0, 12.0, 7.0, 19.0, 21.0, 32.0, 37.0, 24.0, 32.0, 28.0, 34.0, 30.0, 33.0, 32.0, 41.0, 46.0, 43.0, 49.0, 39.0, 35.0, 34.0, 33.0, 30.0, 30.0, 29.0, 20.0, 26.0, 24.0, 19.0, 13.0, 18.0, 11.0, 10.0, 15.0, 9.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.985017776489258, -24.15036964416504, -23.315719604492188, -22.48107147216797, -21.64642333984375, -20.81177520751953, -19.977127075195312, -19.14247703552246, -18.307828903198242, -17.473180770874023, -16.638530731201172, -15.803882598876953, -14.969234466552734, -14.134586334228516, -13.29993724822998, -12.465288162231445, -11.630640029907227, -10.795991897583008, -9.961342811584473, -9.126693725585938, -8.292045593261719, -7.457396984100342, -6.622748374938965, -5.788099765777588, -4.953451156616211, -4.118802547454834, -3.284153938293457, -2.44950532913208, -1.6148567199707031, -0.7802081108093262, 0.05444049835205078, 0.8890891075134277, 1.7237358093261719, 2.558384418487549, 3.393033027648926, 4.227681636810303, 5.06233024597168, 5.896978855133057, 6.731627464294434, 7.5662760734558105, 8.400924682617188, 9.235572814941406, 10.070221900939941, 10.904870986938477, 11.739519119262695, 12.574167251586914, 13.40881633758545, 14.243465423583984, 15.078113555908203, 15.912761688232422, 16.74740982055664, 17.582059860229492, 18.41670799255371, 19.25135612487793, 20.08600616455078, 20.920654296875, 21.75530242919922, 22.589950561523438, 23.424598693847656, 24.259248733520508, 25.093896865844727, 25.928544998168945, 26.763195037841797, 27.597843170166016, 28.432491302490234]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 8.0, 6.0, 11.0, 8.0, 20.0, 13.0, 16.0, 18.0, 23.0, 19.0, 20.0, 21.0, 30.0, 36.0, 31.0, 36.0, 32.0, 25.0, 38.0, 44.0, 38.0, 28.0, 36.0, 43.0, 36.0, 44.0, 39.0, 39.0, 33.0, 31.0, 29.0, 20.0, 20.0, 16.0, 16.0, 13.0, 15.0, 12.0, 10.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-36.0355110168457, -35.02525329589844, -34.01499938964844, -33.00474166870117, -31.99448585510254, -30.984230041503906, -29.97397232055664, -28.963716506958008, -27.953460693359375, -26.943204879760742, -25.93294906616211, -24.922691345214844, -23.91243553161621, -22.902179718017578, -21.891921997070312, -20.88166618347168, -19.871410369873047, -18.861154556274414, -17.85089874267578, -16.840641021728516, -15.830385208129883, -14.82012939453125, -13.8098726272583, -12.799615859985352, -11.789360046386719, -10.779104232788086, -9.768847465515137, -8.758590698242188, -7.748334884643555, -6.738078594207764, -5.727822303771973, -4.717566013336182, -3.7073116302490234, -2.6970553398132324, -1.6867990493774414, -0.6765427589416504, 0.3337135314941406, 1.3439698219299316, 2.3542261123657227, 3.3644824028015137, 4.374738693237305, 5.384994983673096, 6.395251274108887, 7.405507564544678, 8.415763854980469, 9.426019668579102, 10.43627643585205, 11.446533203125, 12.456789016723633, 13.467044830322266, 14.477301597595215, 15.487558364868164, 16.497814178466797, 17.50806999206543, 18.518325805664062, 19.528583526611328, 20.53883934020996, 21.549095153808594, 22.55935287475586, 23.569608688354492, 24.579864501953125, 25.590120315551758, 26.60037612915039, 27.610633850097656, 28.62088966369629]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 18.0, 25.0, 33.0, 59.0, 75.0, 135.0, 216.0, 336.0, 499.0, 806.0, 1220.0, 1895.0, 3004.0, 4638.0, 7107.0, 11272.0, 16655.0, 26070.0, 37936.0, 54132.0, 73634.0, 93420.0, 110857.0, 119017.0, 115028.0, 100234.0, 80725.0, 60672.0, 43070.0, 29446.0, 19709.0, 12975.0, 8470.0, 5513.0, 3430.0, 2231.0, 1457.0, 902.0, 562.0, 356.0, 253.0, 152.0, 102.0, 77.0, 44.0, 38.0, 20.0, 8.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.3125, -24.560791015625, -23.80908203125, -23.057373046875, -22.3056640625, -21.553955078125, -20.80224609375, -20.050537109375, -19.298828125, -18.547119140625, -17.79541015625, -17.043701171875, -16.2919921875, -15.540283203125, -14.78857421875, -14.036865234375, -13.28515625, -12.533447265625, -11.78173828125, -11.030029296875, -10.2783203125, -9.526611328125, -8.77490234375, -8.023193359375, -7.271484375, -6.519775390625, -5.76806640625, -5.016357421875, -4.2646484375, -3.512939453125, -2.76123046875, -2.009521484375, -1.2578125, -0.506103515625, 0.24560546875, 0.997314453125, 1.7490234375, 2.500732421875, 3.25244140625, 4.004150390625, 4.755859375, 5.507568359375, 6.25927734375, 7.010986328125, 7.7626953125, 8.514404296875, 9.26611328125, 10.017822265625, 10.76953125, 11.521240234375, 12.27294921875, 13.024658203125, 13.7763671875, 14.528076171875, 15.27978515625, 16.031494140625, 16.783203125, 17.534912109375, 18.28662109375, 19.038330078125, 19.7900390625, 20.541748046875, 21.29345703125, 22.045166015625, 22.796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 9.0, 8.0, 12.0, 7.0, 8.0, 10.0, 19.0, 27.0, 13.0, 19.0, 34.0, 23.0, 26.0, 36.0, 31.0, 28.0, 45.0, 43.0, 31.0, 24.0, 32.0, 44.0, 31.0, 39.0, 45.0, 37.0, 38.0, 44.0, 23.0, 27.0, 26.0, 18.0, 20.0, 19.0, 14.0, 11.0, 12.0, 9.0, 13.0, 7.0, 10.0, 6.0, 8.0, 1.0, 3.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.953125, -31.007080078125, -30.06103515625, -29.114990234375, -28.1689453125, -27.222900390625, -26.27685546875, -25.330810546875, -24.384765625, -23.438720703125, -22.49267578125, -21.546630859375, -20.6005859375, -19.654541015625, -18.70849609375, -17.762451171875, -16.81640625, -15.870361328125, -14.92431640625, -13.978271484375, -13.0322265625, -12.086181640625, -11.14013671875, -10.194091796875, -9.248046875, -8.302001953125, -7.35595703125, -6.409912109375, -5.4638671875, -4.517822265625, -3.57177734375, -2.625732421875, -1.6796875, -0.733642578125, 0.21240234375, 1.158447265625, 2.1044921875, 3.050537109375, 3.99658203125, 4.942626953125, 5.888671875, 6.834716796875, 7.78076171875, 8.726806640625, 9.6728515625, 10.618896484375, 11.56494140625, 12.510986328125, 13.45703125, 14.403076171875, 15.34912109375, 16.295166015625, 17.2412109375, 18.187255859375, 19.13330078125, 20.079345703125, 21.025390625, 21.971435546875, 22.91748046875, 23.863525390625, 24.8095703125, 25.755615234375, 26.70166015625, 27.647705078125, 28.59375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 11.0, 10.0, 14.0, 38.0, 52.0, 86.0, 117.0, 199.0, 301.0, 471.0, 758.0, 1179.0, 1893.0, 2936.0, 4710.0, 7352.0, 11558.0, 17986.0, 27315.0, 41302.0, 59787.0, 83020.0, 105926.0, 123196.0, 126494.0, 116638.0, 95008.0, 72064.0, 50858.0, 34281.0, 22643.0, 14670.0, 9339.0, 6009.0, 3716.0, 2471.0, 1499.0, 955.0, 603.0, 405.0, 254.0, 162.0, 97.0, 54.0, 39.0, 28.0, 20.0, 16.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.40625, -25.561767578125, -24.71728515625, -23.872802734375, -23.0283203125, -22.183837890625, -21.33935546875, -20.494873046875, -19.650390625, -18.805908203125, -17.96142578125, -17.116943359375, -16.2724609375, -15.427978515625, -14.58349609375, -13.739013671875, -12.89453125, -12.050048828125, -11.20556640625, -10.361083984375, -9.5166015625, -8.672119140625, -7.82763671875, -6.983154296875, -6.138671875, -5.294189453125, -4.44970703125, -3.605224609375, -2.7607421875, -1.916259765625, -1.07177734375, -0.227294921875, 0.6171875, 1.461669921875, 2.30615234375, 3.150634765625, 3.9951171875, 4.839599609375, 5.68408203125, 6.528564453125, 7.373046875, 8.217529296875, 9.06201171875, 9.906494140625, 10.7509765625, 11.595458984375, 12.43994140625, 13.284423828125, 14.12890625, 14.973388671875, 15.81787109375, 16.662353515625, 17.5068359375, 18.351318359375, 19.19580078125, 20.040283203125, 20.884765625, 21.729248046875, 22.57373046875, 23.418212890625, 24.2626953125, 25.107177734375, 25.95166015625, 26.796142578125, 27.640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 5.0, 6.0, 10.0, 14.0, 9.0, 19.0, 14.0, 19.0, 16.0, 24.0, 26.0, 23.0, 35.0, 38.0, 46.0, 34.0, 47.0, 39.0, 39.0, 45.0, 34.0, 47.0, 44.0, 35.0, 38.0, 35.0, 29.0, 38.0, 26.0, 27.0, 22.0, 13.0, 20.0, 12.0, 5.0, 11.0, 11.0, 8.0, 6.0, 6.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.66552734375, -18.0029296875, -17.34033203125, -16.677734375, -16.01513671875, -15.3525390625, -14.68994140625, -14.02734375, -13.36474609375, -12.7021484375, -12.03955078125, -11.376953125, -10.71435546875, -10.0517578125, -9.38916015625, -8.7265625, -8.06396484375, -7.4013671875, -6.73876953125, -6.076171875, -5.41357421875, -4.7509765625, -4.08837890625, -3.42578125, -2.76318359375, -2.1005859375, -1.43798828125, -0.775390625, -0.11279296875, 0.5498046875, 1.21240234375, 1.875, 2.53759765625, 3.2001953125, 3.86279296875, 4.525390625, 5.18798828125, 5.8505859375, 6.51318359375, 7.17578125, 7.83837890625, 8.5009765625, 9.16357421875, 9.826171875, 10.48876953125, 11.1513671875, 11.81396484375, 12.4765625, 13.13916015625, 13.8017578125, 14.46435546875, 15.126953125, 15.78955078125, 16.4521484375, 17.11474609375, 17.77734375, 18.43994140625, 19.1025390625, 19.76513671875, 20.427734375, 21.09033203125, 21.7529296875, 22.41552734375, 23.078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 10.0, 12.0, 10.0, 21.0, 36.0, 61.0, 104.0, 162.0, 287.0, 461.0, 723.0, 1212.0, 2166.0, 3869.0, 6845.0, 12007.0, 21242.0, 36080.0, 61034.0, 94711.0, 131739.0, 158696.0, 157202.0, 129108.0, 91212.0, 58018.0, 34815.0, 20048.0, 11341.0, 6521.0, 3607.0, 2146.0, 1238.0, 710.0, 394.0, 253.0, 162.0, 88.0, 53.0, 42.0, 24.0, 29.0, 7.0, 7.0, 7.0, 9.0, 6.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.5546875, -7.302490234375, -7.05029296875, -6.798095703125, -6.5458984375, -6.293701171875, -6.04150390625, -5.789306640625, -5.537109375, -5.284912109375, -5.03271484375, -4.780517578125, -4.5283203125, -4.276123046875, -4.02392578125, -3.771728515625, -3.51953125, -3.267333984375, -3.01513671875, -2.762939453125, -2.5107421875, -2.258544921875, -2.00634765625, -1.754150390625, -1.501953125, -1.249755859375, -0.99755859375, -0.745361328125, -0.4931640625, -0.240966796875, 0.01123046875, 0.263427734375, 0.515625, 0.767822265625, 1.02001953125, 1.272216796875, 1.5244140625, 1.776611328125, 2.02880859375, 2.281005859375, 2.533203125, 2.785400390625, 3.03759765625, 3.289794921875, 3.5419921875, 3.794189453125, 4.04638671875, 4.298583984375, 4.55078125, 4.802978515625, 5.05517578125, 5.307373046875, 5.5595703125, 5.811767578125, 6.06396484375, 6.316162109375, 6.568359375, 6.820556640625, 7.07275390625, 7.324951171875, 7.5771484375, 7.829345703125, 8.08154296875, 8.333740234375, 8.5859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 8.0, 5.0, 14.0, 4.0, 19.0, 15.0, 15.0, 22.0, 24.0, 27.0, 35.0, 29.0, 37.0, 39.0, 43.0, 41.0, 48.0, 43.0, 52.0, 45.0, 44.0, 53.0, 39.0, 38.0, 33.0, 31.0, 30.0, 34.0, 22.0, 19.0, 18.0, 16.0, 9.0, 3.0, 4.0, 4.0, 11.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006666183471679688, -0.000645853579044342, -0.0006250888109207153, -0.0006043240427970886, -0.0005835592746734619, -0.0005627945065498352, -0.0005420297384262085, -0.0005212649703025818, -0.0005005002021789551, -0.00047973543405532837, -0.00045897066593170166, -0.00043820589780807495, -0.00041744112968444824, -0.00039667636156082153, -0.0003759115934371948, -0.0003551468253135681, -0.0003343820571899414, -0.0003136172890663147, -0.000292852520942688, -0.0002720877528190613, -0.00025132298469543457, -0.00023055821657180786, -0.00020979344844818115, -0.00018902868032455444, -0.00016826391220092773, -0.00014749914407730103, -0.00012673437595367432, -0.00010596960783004761, -8.52048397064209e-05, -6.444007158279419e-05, -4.367530345916748e-05, -2.291053533554077e-05, -2.1457672119140625e-06, 1.8619000911712646e-05, 3.9383769035339355e-05, 6.0148537158966064e-05, 8.091330528259277e-05, 0.00010167807340621948, 0.0001224428415298462, 0.0001432076096534729, 0.0001639723777770996, 0.00018473714590072632, 0.00020550191402435303, 0.00022626668214797974, 0.00024703145027160645, 0.00026779621839523315, 0.00028856098651885986, 0.00030932575464248657, 0.0003300905227661133, 0.00035085529088974, 0.0003716200590133667, 0.0003923848271369934, 0.0004131495952606201, 0.0004339143633842468, 0.00045467913150787354, 0.00047544389963150024, 0.000496208667755127, 0.0005169734358787537, 0.0005377382040023804, 0.0005585029721260071, 0.0005792677402496338, 0.0006000325083732605, 0.0006207972764968872, 0.0006415620446205139, 0.0006623268127441406]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 6.0, 5.0, 7.0, 11.0, 11.0, 17.0, 35.0, 70.0, 86.0, 122.0, 194.0, 296.0, 442.0, 639.0, 1054.0, 1599.0, 2462.0, 3604.0, 5780.0, 8853.0, 13682.0, 20424.0, 30360.0, 44378.0, 62751.0, 83193.0, 103048.0, 117263.0, 119380.0, 110422.0, 91763.0, 70352.0, 51416.0, 35401.0, 24139.0, 15735.0, 10151.0, 6721.0, 4436.0, 2902.0, 1764.0, 1244.0, 783.0, 517.0, 374.0, 214.0, 158.0, 119.0, 75.0, 45.0, 20.0, 13.0, 12.0, 9.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-5.9453125, -5.7484130859375, -5.551513671875, -5.3546142578125, -5.15771484375, -4.9608154296875, -4.763916015625, -4.5670166015625, -4.3701171875, -4.1732177734375, -3.976318359375, -3.7794189453125, -3.58251953125, -3.3856201171875, -3.188720703125, -2.9918212890625, -2.794921875, -2.5980224609375, -2.401123046875, -2.2042236328125, -2.00732421875, -1.8104248046875, -1.613525390625, -1.4166259765625, -1.2197265625, -1.0228271484375, -0.825927734375, -0.6290283203125, -0.43212890625, -0.2352294921875, -0.038330078125, 0.1585693359375, 0.35546875, 0.5523681640625, 0.749267578125, 0.9461669921875, 1.14306640625, 1.3399658203125, 1.536865234375, 1.7337646484375, 1.9306640625, 2.1275634765625, 2.324462890625, 2.5213623046875, 2.71826171875, 2.9151611328125, 3.112060546875, 3.3089599609375, 3.505859375, 3.7027587890625, 3.899658203125, 4.0965576171875, 4.29345703125, 4.4903564453125, 4.687255859375, 4.8841552734375, 5.0810546875, 5.2779541015625, 5.474853515625, 5.6717529296875, 5.86865234375, 6.0655517578125, 6.262451171875, 6.4593505859375, 6.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 12.0, 6.0, 10.0, 7.0, 15.0, 21.0, 19.0, 22.0, 23.0, 21.0, 25.0, 42.0, 37.0, 37.0, 40.0, 51.0, 40.0, 46.0, 48.0, 46.0, 40.0, 35.0, 41.0, 45.0, 31.0, 39.0, 29.0, 29.0, 27.0, 19.0, 16.0, 18.0, 14.0, 16.0, 9.0, 9.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12109375, -2.04443359375, -1.9677734375, -1.89111328125, -1.814453125, -1.73779296875, -1.6611328125, -1.58447265625, -1.5078125, -1.43115234375, -1.3544921875, -1.27783203125, -1.201171875, -1.12451171875, -1.0478515625, -0.97119140625, -0.89453125, -0.81787109375, -0.7412109375, -0.66455078125, -0.587890625, -0.51123046875, -0.4345703125, -0.35791015625, -0.28125, -0.20458984375, -0.1279296875, -0.05126953125, 0.025390625, 0.10205078125, 0.1787109375, 0.25537109375, 0.33203125, 0.40869140625, 0.4853515625, 0.56201171875, 0.638671875, 0.71533203125, 0.7919921875, 0.86865234375, 0.9453125, 1.02197265625, 1.0986328125, 1.17529296875, 1.251953125, 1.32861328125, 1.4052734375, 1.48193359375, 1.55859375, 1.63525390625, 1.7119140625, 1.78857421875, 1.865234375, 1.94189453125, 2.0185546875, 2.09521484375, 2.171875, 2.24853515625, 2.3251953125, 2.40185546875, 2.478515625, 2.55517578125, 2.6318359375, 2.70849609375, 2.78515625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 3.0, 6.0, 10.0, 10.0, 10.0, 14.0, 17.0, 18.0, 24.0, 25.0, 29.0, 25.0, 30.0, 36.0, 38.0, 29.0, 33.0, 40.0, 32.0, 58.0, 43.0, 36.0, 35.0, 32.0, 38.0, 31.0, 38.0, 28.0, 24.0, 32.0, 23.0, 22.0, 15.0, 14.0, 15.0, 17.0, 12.0, 12.0, 7.0, 7.0, 8.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-26.03148078918457, -25.20361328125, -24.37574577331543, -23.54787826538086, -22.720012664794922, -21.89214324951172, -21.06427764892578, -20.23641014099121, -19.40854263305664, -18.58067512512207, -17.7528076171875, -16.92494010925293, -16.09707260131836, -15.269206047058105, -14.441339492797852, -13.613471984863281, -12.785604476928711, -11.95773696899414, -11.12986946105957, -10.302002906799316, -9.474135398864746, -8.646267890930176, -7.818400859832764, -6.990533828735352, -6.162666320800781, -5.334798812866211, -4.506931781768799, -3.6790645122528076, -2.8511972427368164, -2.023329734802246, -1.195462703704834, -0.3675956726074219, 0.46027374267578125, 1.2881410121917725, 2.1160082817077637, 2.943875551223755, 3.771742820739746, 4.599610328674316, 5.4274773597717285, 6.255344390869141, 7.083211898803711, 7.911079406738281, 8.738946914672852, 9.566813468933105, 10.394680976867676, 11.222548484802246, 12.0504150390625, 12.87828254699707, 13.70615005493164, 14.534017562866211, 15.361885070800781, 16.18975257873535, 17.017620086669922, 17.84548568725586, 18.67335319519043, 19.501220703125, 20.32908821105957, 21.15695571899414, 21.98482322692871, 22.81269073486328, 23.64055633544922, 24.468425750732422, 25.29629135131836, 26.12415885925293, 26.9520263671875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 2.0, 9.0, 11.0, 11.0, 12.0, 20.0, 7.0, 23.0, 26.0, 19.0, 26.0, 32.0, 34.0, 35.0, 31.0, 29.0, 40.0, 45.0, 46.0, 46.0, 50.0, 41.0, 45.0, 37.0, 38.0, 41.0, 35.0, 29.0, 25.0, 15.0, 24.0, 14.0, 17.0, 15.0, 16.0, 10.0, 4.0, 7.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.694969177246094, -37.5576286315918, -36.4202880859375, -35.2829475402832, -34.145606994628906, -33.00826644897461, -31.870925903320312, -30.733585357666016, -29.59624481201172, -28.458904266357422, -27.321563720703125, -26.184223175048828, -25.04688262939453, -23.909542083740234, -22.772201538085938, -21.63486099243164, -20.497520446777344, -19.360179901123047, -18.22283935546875, -17.085498809814453, -15.948158264160156, -14.81081771850586, -13.673477172851562, -12.536136627197266, -11.398796081542969, -10.261455535888672, -9.124114990234375, -7.986774444580078, -6.849433898925781, -5.712093353271484, -4.5747528076171875, -3.4374122619628906, -2.300067901611328, -1.1627273559570312, -0.025386810302734375, 1.1119537353515625, 2.2492942810058594, 3.3866348266601562, 4.523975372314453, 5.66131591796875, 6.798656463623047, 7.935997009277344, 9.07333755493164, 10.210678100585938, 11.348018646240234, 12.485359191894531, 13.622699737548828, 14.760040283203125, 15.897380828857422, 17.03472137451172, 18.172061920166016, 19.309402465820312, 20.44674301147461, 21.584083557128906, 22.721424102783203, 23.8587646484375, 24.996105194091797, 26.133445739746094, 27.27078628540039, 28.408126831054688, 29.545467376708984, 30.68280792236328, 31.820148468017578, 32.957489013671875, 34.09482955932617]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 8.0, 11.0, 20.0, 38.0, 52.0, 76.0, 119.0, 190.0, 292.0, 539.0, 793.0, 1246.0, 2062.0, 3357.0, 5557.0, 9295.0, 15438.0, 25912.0, 42749.0, 72071.0, 118019.0, 192117.0, 298676.0, 434699.0, 561954.0, 617314.0, 564054.0, 438563.0, 301935.0, 194043.0, 118567.0, 71150.0, 42292.0, 25314.0, 14523.0, 8700.0, 5033.0, 2947.0, 1788.0, 1027.0, 678.0, 418.0, 236.0, 145.0, 83.0, 78.0, 31.0, 23.0, 19.0, 17.0, 3.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.6875, -24.89697265625, -24.1064453125, -23.31591796875, -22.525390625, -21.73486328125, -20.9443359375, -20.15380859375, -19.36328125, -18.57275390625, -17.7822265625, -16.99169921875, -16.201171875, -15.41064453125, -14.6201171875, -13.82958984375, -13.0390625, -12.24853515625, -11.4580078125, -10.66748046875, -9.876953125, -9.08642578125, -8.2958984375, -7.50537109375, -6.71484375, -5.92431640625, -5.1337890625, -4.34326171875, -3.552734375, -2.76220703125, -1.9716796875, -1.18115234375, -0.390625, 0.39990234375, 1.1904296875, 1.98095703125, 2.771484375, 3.56201171875, 4.3525390625, 5.14306640625, 5.93359375, 6.72412109375, 7.5146484375, 8.30517578125, 9.095703125, 9.88623046875, 10.6767578125, 11.46728515625, 12.2578125, 13.04833984375, 13.8388671875, 14.62939453125, 15.419921875, 16.21044921875, 17.0009765625, 17.79150390625, 18.58203125, 19.37255859375, 20.1630859375, 20.95361328125, 21.744140625, 22.53466796875, 23.3251953125, 24.11572265625, 24.90625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 4.0, 7.0, 6.0, 9.0, 10.0, 15.0, 17.0, 19.0, 16.0, 21.0, 40.0, 28.0, 27.0, 35.0, 25.0, 32.0, 38.0, 34.0, 47.0, 52.0, 47.0, 42.0, 44.0, 44.0, 45.0, 42.0, 38.0, 32.0, 30.0, 20.0, 18.0, 14.0, 17.0, 12.0, 13.0, 13.0, 6.0, 9.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.625, -24.8134765625, -24.001953125, -23.1904296875, -22.37890625, -21.5673828125, -20.755859375, -19.9443359375, -19.1328125, -18.3212890625, -17.509765625, -16.6982421875, -15.88671875, -15.0751953125, -14.263671875, -13.4521484375, -12.640625, -11.8291015625, -11.017578125, -10.2060546875, -9.39453125, -8.5830078125, -7.771484375, -6.9599609375, -6.1484375, -5.3369140625, -4.525390625, -3.7138671875, -2.90234375, -2.0908203125, -1.279296875, -0.4677734375, 0.34375, 1.1552734375, 1.966796875, 2.7783203125, 3.58984375, 4.4013671875, 5.212890625, 6.0244140625, 6.8359375, 7.6474609375, 8.458984375, 9.2705078125, 10.08203125, 10.8935546875, 11.705078125, 12.5166015625, 13.328125, 14.1396484375, 14.951171875, 15.7626953125, 16.57421875, 17.3857421875, 18.197265625, 19.0087890625, 19.8203125, 20.6318359375, 21.443359375, 22.2548828125, 23.06640625, 23.8779296875, 24.689453125, 25.5009765625, 26.3125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 9.0, 17.0, 17.0, 21.0, 35.0, 56.0, 91.0, 146.0, 236.0, 340.0, 655.0, 950.0, 1692.0, 2852.0, 4745.0, 8020.0, 13380.0, 22244.0, 36098.0, 57711.0, 90912.0, 139418.0, 203197.0, 282004.0, 367576.0, 442338.0, 482714.0, 475844.0, 425993.0, 345635.0, 263620.0, 185393.0, 126242.0, 82282.0, 51021.0, 31837.0, 19567.0, 11857.0, 6911.0, 4241.0, 2466.0, 1529.0, 980.0, 514.0, 308.0, 223.0, 126.0, 88.0, 57.0, 36.0, 17.0, 11.0, 13.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.765625, -19.12548828125, -18.4853515625, -17.84521484375, -17.205078125, -16.56494140625, -15.9248046875, -15.28466796875, -14.64453125, -14.00439453125, -13.3642578125, -12.72412109375, -12.083984375, -11.44384765625, -10.8037109375, -10.16357421875, -9.5234375, -8.88330078125, -8.2431640625, -7.60302734375, -6.962890625, -6.32275390625, -5.6826171875, -5.04248046875, -4.40234375, -3.76220703125, -3.1220703125, -2.48193359375, -1.841796875, -1.20166015625, -0.5615234375, 0.07861328125, 0.71875, 1.35888671875, 1.9990234375, 2.63916015625, 3.279296875, 3.91943359375, 4.5595703125, 5.19970703125, 5.83984375, 6.47998046875, 7.1201171875, 7.76025390625, 8.400390625, 9.04052734375, 9.6806640625, 10.32080078125, 10.9609375, 11.60107421875, 12.2412109375, 12.88134765625, 13.521484375, 14.16162109375, 14.8017578125, 15.44189453125, 16.08203125, 16.72216796875, 17.3623046875, 18.00244140625, 18.642578125, 19.28271484375, 19.9228515625, 20.56298828125, 21.203125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 10.0, 5.0, 5.0, 5.0, 22.0, 21.0, 29.0, 45.0, 47.0, 62.0, 74.0, 104.0, 120.0, 147.0, 185.0, 187.0, 210.0, 213.0, 247.0, 249.0, 268.0, 200.0, 241.0, 234.0, 191.0, 197.0, 172.0, 121.0, 104.0, 96.0, 74.0, 58.0, 34.0, 30.0, 20.0, 19.0, 12.0, 8.0, 4.0, 6.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.5859375, -13.1600341796875, -12.734130859375, -12.3082275390625, -11.88232421875, -11.4564208984375, -11.030517578125, -10.6046142578125, -10.1787109375, -9.7528076171875, -9.326904296875, -8.9010009765625, -8.47509765625, -8.0491943359375, -7.623291015625, -7.1973876953125, -6.771484375, -6.3455810546875, -5.919677734375, -5.4937744140625, -5.06787109375, -4.6419677734375, -4.216064453125, -3.7901611328125, -3.3642578125, -2.9383544921875, -2.512451171875, -2.0865478515625, -1.66064453125, -1.2347412109375, -0.808837890625, -0.3829345703125, 0.04296875, 0.4688720703125, 0.894775390625, 1.3206787109375, 1.74658203125, 2.1724853515625, 2.598388671875, 3.0242919921875, 3.4501953125, 3.8760986328125, 4.302001953125, 4.7279052734375, 5.15380859375, 5.5797119140625, 6.005615234375, 6.4315185546875, 6.857421875, 7.2833251953125, 7.709228515625, 8.1351318359375, 8.56103515625, 8.9869384765625, 9.412841796875, 9.8387451171875, 10.2646484375, 10.6905517578125, 11.116455078125, 11.5423583984375, 11.96826171875, 12.3941650390625, 12.820068359375, 13.2459716796875, 13.671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 4.0, 10.0, 11.0, 19.0, 17.0, 21.0, 27.0, 27.0, 28.0, 32.0, 27.0, 38.0, 48.0, 29.0, 52.0, 44.0, 47.0, 38.0, 41.0, 33.0, 46.0, 35.0, 30.0, 35.0, 37.0, 24.0, 19.0, 12.0, 23.0, 22.0, 21.0, 17.0, 13.0, 7.0, 8.0, 7.0, 3.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-22.566545486450195, -21.856828689575195, -21.147111892700195, -20.437395095825195, -19.727680206298828, -19.017963409423828, -18.308246612548828, -17.598529815673828, -16.888813018798828, -16.179096221923828, -15.469379425048828, -14.759663581848145, -14.049946784973145, -13.340229988098145, -12.630514144897461, -11.920797348022461, -11.211080551147461, -10.501363754272461, -9.791646957397461, -9.081931114196777, -8.372214317321777, -7.662497520446777, -6.9527812004089355, -6.243064880371094, -5.533348083496094, -4.823631286621094, -4.113914966583252, -3.404198408126831, -2.69448184967041, -1.9847652912139893, -1.2750487327575684, -0.5653324127197266, 0.14438438415527344, 0.8541009426116943, 1.5638175010681152, 2.273534059524536, 2.983250617980957, 3.692967176437378, 4.402683734893799, 5.112400054931641, 5.822116851806641, 6.531833648681641, 7.241549968719482, 7.951266288757324, 8.660983085632324, 9.370699882507324, 10.080415725708008, 10.790132522583008, 11.499849319458008, 12.209566116333008, 12.919282913208008, 13.628998756408691, 14.338715553283691, 15.048432350158691, 15.758148193359375, 16.467864990234375, 17.177581787109375, 17.887298583984375, 18.597015380859375, 19.306732177734375, 20.016448974609375, 20.726163864135742, 21.435880661010742, 22.145597457885742, 22.855314254760742]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 10.0, 13.0, 10.0, 17.0, 20.0, 18.0, 17.0, 20.0, 18.0, 34.0, 34.0, 30.0, 40.0, 46.0, 42.0, 36.0, 45.0, 45.0, 40.0, 38.0, 47.0, 48.0, 40.0, 38.0, 23.0, 23.0, 29.0, 23.0, 21.0, 20.0, 13.0, 18.0, 14.0, 15.0, 10.0, 5.0, 2.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-32.794593811035156, -31.882802963256836, -30.971010208129883, -30.059219360351562, -29.14742660522461, -28.23563575744629, -27.32384490966797, -26.412052154541016, -25.500259399414062, -24.588468551635742, -23.67667579650879, -22.76488494873047, -21.853092193603516, -20.941301345825195, -20.029510498046875, -19.117717742919922, -18.2059268951416, -17.29413604736328, -16.382343292236328, -15.470552444458008, -14.558759689331055, -13.646968841552734, -12.735177040100098, -11.823385238647461, -10.911593437194824, -9.999801635742188, -9.08800983428955, -8.176218032836914, -7.2644267082214355, -6.352634906768799, -5.44084358215332, -4.529051780700684, -3.6172618865966797, -2.705470085144043, -1.7936785221099854, -0.8818869590759277, 0.029904842376708984, 0.9416966438293457, 1.8534879684448242, 2.765279769897461, 3.6770715713500977, 4.588863372802734, 5.500655174255371, 6.41244649887085, 7.324238300323486, 8.236030578613281, 9.147821426391602, 10.059613227844238, 10.971405029296875, 11.883196830749512, 12.794988632202148, 13.706779479980469, 14.618572235107422, 15.530363082885742, 16.442153930664062, 17.353946685791016, 18.26573944091797, 19.17753028869629, 20.089323043823242, 21.001113891601562, 21.912906646728516, 22.824697494506836, 23.736488342285156, 24.64828109741211, 25.56007194519043]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 16.0, 9.0, 18.0, 38.0, 48.0, 54.0, 83.0, 127.0, 187.0, 330.0, 521.0, 713.0, 1065.0, 1596.0, 2533.0, 3816.0, 5994.0, 9422.0, 14990.0, 23529.0, 38773.0, 62718.0, 103772.0, 164799.0, 206324.0, 154762.0, 96360.0, 58914.0, 36072.0, 22293.0, 13835.0, 8706.0, 5641.0, 3640.0, 2349.0, 1483.0, 1012.0, 683.0, 437.0, 290.0, 197.0, 120.0, 94.0, 65.0, 36.0, 36.0, 14.0, 17.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0], "bins": [-5.3203125, -5.165771484375, -5.01123046875, -4.856689453125, -4.7021484375, -4.547607421875, -4.39306640625, -4.238525390625, -4.083984375, -3.929443359375, -3.77490234375, -3.620361328125, -3.4658203125, -3.311279296875, -3.15673828125, -3.002197265625, -2.84765625, -2.693115234375, -2.53857421875, -2.384033203125, -2.2294921875, -2.074951171875, -1.92041015625, -1.765869140625, -1.611328125, -1.456787109375, -1.30224609375, -1.147705078125, -0.9931640625, -0.838623046875, -0.68408203125, -0.529541015625, -0.375, -0.220458984375, -0.06591796875, 0.088623046875, 0.2431640625, 0.397705078125, 0.55224609375, 0.706787109375, 0.861328125, 1.015869140625, 1.17041015625, 1.324951171875, 1.4794921875, 1.634033203125, 1.78857421875, 1.943115234375, 2.09765625, 2.252197265625, 2.40673828125, 2.561279296875, 2.7158203125, 2.870361328125, 3.02490234375, 3.179443359375, 3.333984375, 3.488525390625, 3.64306640625, 3.797607421875, 3.9521484375, 4.106689453125, 4.26123046875, 4.415771484375, 4.5703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 6.0, 13.0, 15.0, 8.0, 13.0, 22.0, 13.0, 16.0, 21.0, 31.0, 36.0, 27.0, 37.0, 38.0, 36.0, 44.0, 41.0, 45.0, 49.0, 45.0, 47.0, 37.0, 45.0, 38.0, 33.0, 31.0, 21.0, 31.0, 28.0, 19.0, 20.0, 14.0, 7.0, 16.0, 9.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-33.78125, -32.843505859375, -31.90576171875, -30.968017578125, -30.0302734375, -29.092529296875, -28.15478515625, -27.217041015625, -26.279296875, -25.341552734375, -24.40380859375, -23.466064453125, -22.5283203125, -21.590576171875, -20.65283203125, -19.715087890625, -18.77734375, -17.839599609375, -16.90185546875, -15.964111328125, -15.0263671875, -14.088623046875, -13.15087890625, -12.213134765625, -11.275390625, -10.337646484375, -9.39990234375, -8.462158203125, -7.5244140625, -6.586669921875, -5.64892578125, -4.711181640625, -3.7734375, -2.835693359375, -1.89794921875, -0.960205078125, -0.0224609375, 0.915283203125, 1.85302734375, 2.790771484375, 3.728515625, 4.666259765625, 5.60400390625, 6.541748046875, 7.4794921875, 8.417236328125, 9.35498046875, 10.292724609375, 11.23046875, 12.168212890625, 13.10595703125, 14.043701171875, 14.9814453125, 15.919189453125, 16.85693359375, 17.794677734375, 18.732421875, 19.670166015625, 20.60791015625, 21.545654296875, 22.4833984375, 23.421142578125, 24.35888671875, 25.296630859375, 26.234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 20.0, 17.0, 28.0, 43.0, 59.0, 107.0, 144.0, 241.0, 340.0, 467.0, 686.0, 964.0, 1391.0, 2002.0, 2868.0, 4240.0, 6749.0, 10383.0, 15827.0, 25021.0, 40937.0, 66970.0, 110326.0, 169883.0, 199114.0, 146750.0, 91705.0, 55668.0, 34347.0, 21162.0, 13514.0, 8652.0, 5821.0, 3854.0, 2519.0, 1795.0, 1172.0, 875.0, 575.0, 396.0, 277.0, 217.0, 126.0, 93.0, 70.0, 47.0, 28.0, 18.0, 14.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.779296875, -3.662353515625, -3.54541015625, -3.428466796875, -3.3115234375, -3.194580078125, -3.07763671875, -2.960693359375, -2.84375, -2.726806640625, -2.60986328125, -2.492919921875, -2.3759765625, -2.259033203125, -2.14208984375, -2.025146484375, -1.908203125, -1.791259765625, -1.67431640625, -1.557373046875, -1.4404296875, -1.323486328125, -1.20654296875, -1.089599609375, -0.97265625, -0.855712890625, -0.73876953125, -0.621826171875, -0.5048828125, -0.387939453125, -0.27099609375, -0.154052734375, -0.037109375, 0.079833984375, 0.19677734375, 0.313720703125, 0.4306640625, 0.547607421875, 0.66455078125, 0.781494140625, 0.8984375, 1.015380859375, 1.13232421875, 1.249267578125, 1.3662109375, 1.483154296875, 1.60009765625, 1.717041015625, 1.833984375, 1.950927734375, 2.06787109375, 2.184814453125, 2.3017578125, 2.418701171875, 2.53564453125, 2.652587890625, 2.76953125, 2.886474609375, 3.00341796875, 3.120361328125, 3.2373046875, 3.354248046875, 3.47119140625, 3.588134765625, 3.705078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 5.0, 2.0, 8.0, 6.0, 10.0, 7.0, 11.0, 17.0, 12.0, 16.0, 17.0, 35.0, 20.0, 25.0, 29.0, 33.0, 36.0, 44.0, 35.0, 39.0, 37.0, 46.0, 42.0, 32.0, 45.0, 38.0, 33.0, 39.0, 32.0, 28.0, 39.0, 25.0, 19.0, 25.0, 25.0, 15.0, 12.0, 12.0, 14.0, 10.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.84375, -21.210693359375, -20.57763671875, -19.944580078125, -19.3115234375, -18.678466796875, -18.04541015625, -17.412353515625, -16.779296875, -16.146240234375, -15.51318359375, -14.880126953125, -14.2470703125, -13.614013671875, -12.98095703125, -12.347900390625, -11.71484375, -11.081787109375, -10.44873046875, -9.815673828125, -9.1826171875, -8.549560546875, -7.91650390625, -7.283447265625, -6.650390625, -6.017333984375, -5.38427734375, -4.751220703125, -4.1181640625, -3.485107421875, -2.85205078125, -2.218994140625, -1.5859375, -0.952880859375, -0.31982421875, 0.313232421875, 0.9462890625, 1.579345703125, 2.21240234375, 2.845458984375, 3.478515625, 4.111572265625, 4.74462890625, 5.377685546875, 6.0107421875, 6.643798828125, 7.27685546875, 7.909912109375, 8.54296875, 9.176025390625, 9.80908203125, 10.442138671875, 11.0751953125, 11.708251953125, 12.34130859375, 12.974365234375, 13.607421875, 14.240478515625, 14.87353515625, 15.506591796875, 16.1396484375, 16.772705078125, 17.40576171875, 18.038818359375, 18.671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 8.0, 15.0, 8.0, 24.0, 35.0, 44.0, 86.0, 104.0, 153.0, 246.0, 333.0, 509.0, 813.0, 1322.0, 1939.0, 3269.0, 5407.0, 9133.0, 15977.0, 30446.0, 60145.0, 128299.0, 291730.0, 264157.0, 114241.0, 54634.0, 28158.0, 15300.0, 8607.0, 4956.0, 3070.0, 1858.0, 1208.0, 801.0, 529.0, 351.0, 212.0, 154.0, 104.0, 46.0, 44.0, 16.0, 26.0, 6.0, 15.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.4072265625, -0.3940620422363281, -0.38089752197265625, -0.3677330017089844, -0.3545684814453125, -0.3414039611816406, -0.32823944091796875, -0.3150749206542969, -0.301910400390625, -0.2887458801269531, -0.27558135986328125, -0.2624168395996094, -0.2492523193359375, -0.23608779907226562, -0.22292327880859375, -0.20975875854492188, -0.19659423828125, -0.18342971801757812, -0.17026519775390625, -0.15710067749023438, -0.1439361572265625, -0.13077163696289062, -0.11760711669921875, -0.10444259643554688, -0.091278076171875, -0.07811355590820312, -0.06494903564453125, -0.051784515380859375, -0.0386199951171875, -0.025455474853515625, -0.01229095458984375, 0.000873565673828125, 0.0140380859375, 0.027202606201171875, 0.04036712646484375, 0.053531646728515625, 0.0666961669921875, 0.07986068725585938, 0.09302520751953125, 0.10618972778320312, 0.119354248046875, 0.13251876831054688, 0.14568328857421875, 0.15884780883789062, 0.1720123291015625, 0.18517684936523438, 0.19834136962890625, 0.21150588989257812, 0.22467041015625, 0.23783493041992188, 0.25099945068359375, 0.2641639709472656, 0.2773284912109375, 0.2904930114746094, 0.30365753173828125, 0.3168220520019531, 0.329986572265625, 0.3431510925292969, 0.35631561279296875, 0.3694801330566406, 0.3826446533203125, 0.3958091735839844, 0.40897369384765625, 0.4221382141113281, 0.435302734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 13.0, 12.0, 25.0, 20.0, 45.0, 40.0, 47.0, 59.0, 58.0, 76.0, 83.0, 62.0, 76.0, 75.0, 56.0, 42.0, 31.0, 25.0, 37.0, 20.0, 19.0, 17.0, 9.0, 4.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.638071060180664e-05, -9.363610297441483e-05, -9.089149534702301e-05, -8.81468877196312e-05, -8.540228009223938e-05, -8.265767246484756e-05, -7.991306483745575e-05, -7.716845721006393e-05, -7.442384958267212e-05, -7.16792419552803e-05, -6.893463432788849e-05, -6.619002670049667e-05, -6.344541907310486e-05, -6.070081144571304e-05, -5.795620381832123e-05, -5.521159619092941e-05, -5.24669885635376e-05, -4.972238093614578e-05, -4.697777330875397e-05, -4.423316568136215e-05, -4.148855805397034e-05, -3.874395042657852e-05, -3.5999342799186707e-05, -3.325473517179489e-05, -3.0510127544403076e-05, -2.776551991701126e-05, -2.5020912289619446e-05, -2.227630466222763e-05, -1.9531697034835815e-05, -1.6787089407444e-05, -1.4042481780052185e-05, -1.129787415266037e-05, -8.553266525268555e-06, -5.8086588978767395e-06, -3.0640512704849243e-06, -3.1944364309310913e-07, 2.425163984298706e-06, 5.169771611690521e-06, 7.914379239082336e-06, 1.0658986866474152e-05, 1.3403594493865967e-05, 1.6148202121257782e-05, 1.8892809748649597e-05, 2.1637417376041412e-05, 2.4382025003433228e-05, 2.7126632630825043e-05, 2.9871240258216858e-05, 3.261584788560867e-05, 3.536045551300049e-05, 3.8105063140392303e-05, 4.084967076778412e-05, 4.3594278395175934e-05, 4.633888602256775e-05, 4.9083493649959564e-05, 5.182810127735138e-05, 5.4572708904743195e-05, 5.731731653213501e-05, 6.0061924159526825e-05, 6.280653178691864e-05, 6.555113941431046e-05, 6.829574704170227e-05, 7.104035466909409e-05, 7.37849622964859e-05, 7.652956992387772e-05, 7.927417755126953e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 10.0, 13.0, 19.0, 29.0, 45.0, 53.0, 84.0, 111.0, 147.0, 188.0, 284.0, 401.0, 565.0, 773.0, 1031.0, 1473.0, 1988.0, 2952.0, 4091.0, 5925.0, 8667.0, 12880.0, 19325.0, 30095.0, 48167.0, 80823.0, 147926.0, 292938.0, 158100.0, 85087.0, 50282.0, 31013.0, 19809.0, 13231.0, 9032.0, 6103.0, 4352.0, 3017.0, 2097.0, 1586.0, 1086.0, 780.0, 574.0, 400.0, 297.0, 202.0, 156.0, 107.0, 74.0, 52.0, 38.0, 24.0, 12.0, 19.0, 15.0, 3.0, 9.0, 3.0, 1.0], "bins": [-1.1396484375, -1.1046295166015625, -1.069610595703125, -1.0345916748046875, -0.99957275390625, -0.9645538330078125, -0.929534912109375, -0.8945159912109375, -0.8594970703125, -0.8244781494140625, -0.789459228515625, -0.7544403076171875, -0.71942138671875, -0.6844024658203125, -0.649383544921875, -0.6143646240234375, -0.579345703125, -0.5443267822265625, -0.509307861328125, -0.4742889404296875, -0.43927001953125, -0.4042510986328125, -0.369232177734375, -0.3342132568359375, -0.2991943359375, -0.2641754150390625, -0.229156494140625, -0.1941375732421875, -0.15911865234375, -0.1240997314453125, -0.089080810546875, -0.0540618896484375, -0.01904296875, 0.0159759521484375, 0.050994873046875, 0.0860137939453125, 0.12103271484375, 0.1560516357421875, 0.191070556640625, 0.2260894775390625, 0.2611083984375, 0.2961273193359375, 0.331146240234375, 0.3661651611328125, 0.40118408203125, 0.4362030029296875, 0.471221923828125, 0.5062408447265625, 0.541259765625, 0.5762786865234375, 0.611297607421875, 0.6463165283203125, 0.68133544921875, 0.7163543701171875, 0.751373291015625, 0.7863922119140625, 0.8214111328125, 0.8564300537109375, 0.891448974609375, 0.9264678955078125, 0.96148681640625, 0.9965057373046875, 1.031524658203125, 1.0665435791015625, 1.1015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 15.0, 9.0, 10.0, 18.0, 15.0, 24.0, 23.0, 33.0, 39.0, 39.0, 36.0, 51.0, 45.0, 47.0, 42.0, 50.0, 52.0, 27.0, 42.0, 56.0, 39.0, 35.0, 33.0, 33.0, 27.0, 14.0, 29.0, 13.0, 20.0, 22.0, 6.0, 7.0, 4.0, 11.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6687393188476562, -0.6470489501953125, -0.6253585815429688, -0.603668212890625, -0.5819778442382812, -0.5602874755859375, -0.5385971069335938, -0.51690673828125, -0.49521636962890625, -0.4735260009765625, -0.45183563232421875, -0.430145263671875, -0.40845489501953125, -0.3867645263671875, -0.36507415771484375, -0.3433837890625, -0.32169342041015625, -0.3000030517578125, -0.27831268310546875, -0.256622314453125, -0.23493194580078125, -0.2132415771484375, -0.19155120849609375, -0.16986083984375, -0.14817047119140625, -0.1264801025390625, -0.10478973388671875, -0.083099365234375, -0.06140899658203125, -0.0397186279296875, -0.01802825927734375, 0.003662109375, 0.02535247802734375, 0.0470428466796875, 0.06873321533203125, 0.090423583984375, 0.11211395263671875, 0.1338043212890625, 0.15549468994140625, 0.17718505859375, 0.19887542724609375, 0.2205657958984375, 0.24225616455078125, 0.263946533203125, 0.28563690185546875, 0.3073272705078125, 0.32901763916015625, 0.3507080078125, 0.37239837646484375, 0.3940887451171875, 0.41577911376953125, 0.437469482421875, 0.45915985107421875, 0.4808502197265625, 0.5025405883789062, 0.52423095703125, 0.5459213256835938, 0.5676116943359375, 0.5893020629882812, 0.610992431640625, 0.6326828002929688, 0.6543731689453125, 0.6760635375976562, 0.69775390625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 1.0, 8.0, 7.0, 9.0, 8.0, 17.0, 16.0, 18.0, 27.0, 21.0, 35.0, 28.0, 24.0, 40.0, 41.0, 43.0, 39.0, 56.0, 40.0, 47.0, 29.0, 47.0, 44.0, 37.0, 28.0, 33.0, 40.0, 24.0, 20.0, 21.0, 22.0, 24.0, 16.0, 19.0, 13.0, 12.0, 10.0, 3.0, 7.0, 2.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-21.998687744140625, -21.287479400634766, -20.57627296447754, -19.86506462097168, -19.15385627746582, -18.442649841308594, -17.731441497802734, -17.020233154296875, -16.309024810791016, -15.597817420959473, -14.886609077453613, -14.17540168762207, -13.464193344116211, -12.752985954284668, -12.041778564453125, -11.330570220947266, -10.619363784790039, -9.908156394958496, -9.196948051452637, -8.485740661621094, -7.774532794952393, -7.063324928283691, -6.352117538452148, -5.640909671783447, -4.929701805114746, -4.218493938446045, -3.507286310195923, -2.796078681945801, -2.0848708152770996, -1.3736629486083984, -0.6624555587768555, 0.0487523078918457, 0.7599620819091797, 1.4711698293685913, 2.182377576828003, 2.893585205078125, 3.604793071746826, 4.316000938415527, 5.02720832824707, 5.7384161949157715, 6.449624061584473, 7.160831928253174, 7.872039794921875, 8.583247184753418, 9.294454574584961, 10.00566291809082, 10.716870307922363, 11.428077697753906, 12.139286041259766, 12.850493431091309, 13.561701774597168, 14.272909164428711, 14.98411750793457, 15.695324897766113, 16.406532287597656, 17.117740631103516, 17.828948974609375, 18.540157318115234, 19.25136375427246, 19.96257209777832, 20.67378044128418, 21.384986877441406, 22.096195220947266, 22.807403564453125, 23.51861000061035]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 8.0, 16.0, 9.0, 16.0, 22.0, 19.0, 14.0, 19.0, 27.0, 21.0, 42.0, 25.0, 37.0, 53.0, 45.0, 35.0, 44.0, 48.0, 38.0, 38.0, 47.0, 49.0, 38.0, 37.0, 28.0, 26.0, 27.0, 17.0, 29.0, 14.0, 20.0, 15.0, 11.0, 20.0, 6.0, 3.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-32.71379089355469, -31.807483673095703, -30.901174545288086, -29.9948673248291, -29.088558197021484, -28.1822509765625, -27.275943756103516, -26.3696346282959, -25.46332550048828, -24.557018280029297, -23.65070915222168, -22.744401931762695, -21.838092803955078, -20.931785583496094, -20.02547836303711, -19.119169235229492, -18.212862014770508, -17.306554794311523, -16.400245666503906, -15.493938446044922, -14.587629318237305, -13.68132209777832, -12.77501392364502, -11.868705749511719, -10.962397575378418, -10.056089401245117, -9.149781227111816, -8.243473052978516, -7.337165355682373, -6.430857181549072, -5.52454948425293, -4.618241310119629, -3.711935043334961, -2.80562686920166, -1.8993189334869385, -0.9930109977722168, -0.08670282363891602, 0.8196053504943848, 1.7259130477905273, 2.632221221923828, 3.538529396057129, 4.44483757019043, 5.3511457443237305, 6.257453441619873, 7.163761615753174, 8.070070266723633, 8.976377487182617, 9.882685661315918, 10.788993835449219, 11.69530200958252, 12.60161018371582, 13.507917404174805, 14.414226531982422, 15.320533752441406, 16.22684097290039, 17.133150100708008, 18.039459228515625, 18.94576644897461, 19.852075576782227, 20.75838279724121, 21.664691925048828, 22.570999145507812, 23.477306365966797, 24.383615493774414, 25.2899227142334]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 15.0, 14.0, 19.0, 52.0, 62.0, 110.0, 194.0, 270.0, 501.0, 839.0, 1361.0, 2290.0, 3860.0, 5927.0, 9516.0, 15094.0, 23730.0, 35654.0, 52885.0, 72420.0, 94124.0, 112422.0, 121855.0, 118929.0, 104563.0, 84320.0, 62879.0, 43681.0, 29623.0, 19234.0, 12253.0, 7738.0, 4669.0, 2833.0, 1824.0, 1078.0, 695.0, 403.0, 256.0, 127.0, 93.0, 60.0, 42.0, 10.0, 11.0, 15.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.576416015625, -16.96533203125, -16.354248046875, -15.7431640625, -15.132080078125, -14.52099609375, -13.909912109375, -13.298828125, -12.687744140625, -12.07666015625, -11.465576171875, -10.8544921875, -10.243408203125, -9.63232421875, -9.021240234375, -8.41015625, -7.799072265625, -7.18798828125, -6.576904296875, -5.9658203125, -5.354736328125, -4.74365234375, -4.132568359375, -3.521484375, -2.910400390625, -2.29931640625, -1.688232421875, -1.0771484375, -0.466064453125, 0.14501953125, 0.756103515625, 1.3671875, 1.978271484375, 2.58935546875, 3.200439453125, 3.8115234375, 4.422607421875, 5.03369140625, 5.644775390625, 6.255859375, 6.866943359375, 7.47802734375, 8.089111328125, 8.7001953125, 9.311279296875, 9.92236328125, 10.533447265625, 11.14453125, 11.755615234375, 12.36669921875, 12.977783203125, 13.5888671875, 14.199951171875, 14.81103515625, 15.422119140625, 16.033203125, 16.644287109375, 17.25537109375, 17.866455078125, 18.4775390625, 19.088623046875, 19.69970703125, 20.310791015625, 20.921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 7.0, 14.0, 14.0, 11.0, 18.0, 16.0, 25.0, 24.0, 24.0, 32.0, 26.0, 33.0, 34.0, 41.0, 41.0, 40.0, 40.0, 42.0, 42.0, 48.0, 36.0, 48.0, 37.0, 37.0, 30.0, 33.0, 24.0, 29.0, 22.0, 20.0, 17.0, 10.0, 19.0, 11.0, 12.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-31.6875, -30.821044921875, -29.95458984375, -29.088134765625, -28.2216796875, -27.355224609375, -26.48876953125, -25.622314453125, -24.755859375, -23.889404296875, -23.02294921875, -22.156494140625, -21.2900390625, -20.423583984375, -19.55712890625, -18.690673828125, -17.82421875, -16.957763671875, -16.09130859375, -15.224853515625, -14.3583984375, -13.491943359375, -12.62548828125, -11.759033203125, -10.892578125, -10.026123046875, -9.15966796875, -8.293212890625, -7.4267578125, -6.560302734375, -5.69384765625, -4.827392578125, -3.9609375, -3.094482421875, -2.22802734375, -1.361572265625, -0.4951171875, 0.371337890625, 1.23779296875, 2.104248046875, 2.970703125, 3.837158203125, 4.70361328125, 5.570068359375, 6.4365234375, 7.302978515625, 8.16943359375, 9.035888671875, 9.90234375, 10.768798828125, 11.63525390625, 12.501708984375, 13.3681640625, 14.234619140625, 15.10107421875, 15.967529296875, 16.833984375, 17.700439453125, 18.56689453125, 19.433349609375, 20.2998046875, 21.166259765625, 22.03271484375, 22.899169921875, 23.765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 7.0, 6.0, 24.0, 29.0, 56.0, 73.0, 140.0, 198.0, 309.0, 505.0, 772.0, 1244.0, 1843.0, 2980.0, 4468.0, 7231.0, 10932.0, 16330.0, 24482.0, 35929.0, 50522.0, 68351.0, 86802.0, 102874.0, 112295.0, 111534.0, 101826.0, 86078.0, 67043.0, 49485.0, 34780.0, 23800.0, 15906.0, 10475.0, 6804.0, 4558.0, 2918.0, 1848.0, 1166.0, 680.0, 460.0, 305.0, 174.0, 135.0, 73.0, 41.0, 23.0, 18.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-20.140625, -19.547607421875, -18.95458984375, -18.361572265625, -17.7685546875, -17.175537109375, -16.58251953125, -15.989501953125, -15.396484375, -14.803466796875, -14.21044921875, -13.617431640625, -13.0244140625, -12.431396484375, -11.83837890625, -11.245361328125, -10.65234375, -10.059326171875, -9.46630859375, -8.873291015625, -8.2802734375, -7.687255859375, -7.09423828125, -6.501220703125, -5.908203125, -5.315185546875, -4.72216796875, -4.129150390625, -3.5361328125, -2.943115234375, -2.35009765625, -1.757080078125, -1.1640625, -0.571044921875, 0.02197265625, 0.614990234375, 1.2080078125, 1.801025390625, 2.39404296875, 2.987060546875, 3.580078125, 4.173095703125, 4.76611328125, 5.359130859375, 5.9521484375, 6.545166015625, 7.13818359375, 7.731201171875, 8.32421875, 8.917236328125, 9.51025390625, 10.103271484375, 10.6962890625, 11.289306640625, 11.88232421875, 12.475341796875, 13.068359375, 13.661376953125, 14.25439453125, 14.847412109375, 15.4404296875, 16.033447265625, 16.62646484375, 17.219482421875, 17.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 10.0, 7.0, 5.0, 12.0, 20.0, 11.0, 23.0, 13.0, 21.0, 15.0, 28.0, 26.0, 34.0, 40.0, 34.0, 29.0, 23.0, 49.0, 36.0, 31.0, 46.0, 44.0, 37.0, 41.0, 27.0, 27.0, 39.0, 32.0, 28.0, 27.0, 29.0, 16.0, 18.0, 20.0, 14.0, 18.0, 8.0, 13.0, 13.0, 8.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.609375, -17.076904296875, -16.54443359375, -16.011962890625, -15.4794921875, -14.947021484375, -14.41455078125, -13.882080078125, -13.349609375, -12.817138671875, -12.28466796875, -11.752197265625, -11.2197265625, -10.687255859375, -10.15478515625, -9.622314453125, -9.08984375, -8.557373046875, -8.02490234375, -7.492431640625, -6.9599609375, -6.427490234375, -5.89501953125, -5.362548828125, -4.830078125, -4.297607421875, -3.76513671875, -3.232666015625, -2.7001953125, -2.167724609375, -1.63525390625, -1.102783203125, -0.5703125, -0.037841796875, 0.49462890625, 1.027099609375, 1.5595703125, 2.092041015625, 2.62451171875, 3.156982421875, 3.689453125, 4.221923828125, 4.75439453125, 5.286865234375, 5.8193359375, 6.351806640625, 6.88427734375, 7.416748046875, 7.94921875, 8.481689453125, 9.01416015625, 9.546630859375, 10.0791015625, 10.611572265625, 11.14404296875, 11.676513671875, 12.208984375, 12.741455078125, 13.27392578125, 13.806396484375, 14.3388671875, 14.871337890625, 15.40380859375, 15.936279296875, 16.46875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 11.0, 5.0, 16.0, 23.0, 24.0, 42.0, 64.0, 121.0, 179.0, 273.0, 456.0, 721.0, 1262.0, 1959.0, 3221.0, 5392.0, 8980.0, 14900.0, 24119.0, 39201.0, 60609.0, 88794.0, 118713.0, 140765.0, 143328.0, 124643.0, 94584.0, 65621.0, 42470.0, 26917.0, 16213.0, 9641.0, 6040.0, 3692.0, 2146.0, 1267.0, 834.0, 491.0, 299.0, 191.0, 121.0, 79.0, 40.0, 20.0, 23.0, 17.0, 12.0, 3.0, 6.0, 4.0, 1.0, 1.0, 3.0], "bins": [-7.01953125, -6.81951904296875, -6.6195068359375, -6.41949462890625, -6.219482421875, -6.01947021484375, -5.8194580078125, -5.61944580078125, -5.41943359375, -5.21942138671875, -5.0194091796875, -4.81939697265625, -4.619384765625, -4.41937255859375, -4.2193603515625, -4.01934814453125, -3.8193359375, -3.61932373046875, -3.4193115234375, -3.21929931640625, -3.019287109375, -2.81927490234375, -2.6192626953125, -2.41925048828125, -2.21923828125, -2.01922607421875, -1.8192138671875, -1.61920166015625, -1.419189453125, -1.21917724609375, -1.0191650390625, -0.81915283203125, -0.619140625, -0.41912841796875, -0.2191162109375, -0.01910400390625, 0.180908203125, 0.38092041015625, 0.5809326171875, 0.78094482421875, 0.98095703125, 1.18096923828125, 1.3809814453125, 1.58099365234375, 1.781005859375, 1.98101806640625, 2.1810302734375, 2.38104248046875, 2.5810546875, 2.78106689453125, 2.9810791015625, 3.18109130859375, 3.381103515625, 3.58111572265625, 3.7811279296875, 3.98114013671875, 4.18115234375, 4.38116455078125, 4.5811767578125, 4.78118896484375, 4.981201171875, 5.18121337890625, 5.3812255859375, 5.58123779296875, 5.78125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 16.0, 12.0, 19.0, 25.0, 29.0, 49.0, 44.0, 57.0, 64.0, 76.0, 65.0, 67.0, 65.0, 52.0, 56.0, 58.0, 43.0, 34.0, 29.0, 32.0, 22.0, 15.0, 10.0, 9.0, 6.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008831024169921875, -0.0008567050099372864, -0.0008303076028823853, -0.0008039101958274841, -0.000777512788772583, -0.0007511153817176819, -0.0007247179746627808, -0.0006983205676078796, -0.0006719231605529785, -0.0006455257534980774, -0.0006191283464431763, -0.0005927309393882751, -0.000566333532333374, -0.0005399361252784729, -0.0005135387182235718, -0.00048714131116867065, -0.00046074390411376953, -0.0004343464970588684, -0.0004079490900039673, -0.00038155168294906616, -0.00035515427589416504, -0.0003287568688392639, -0.0003023594617843628, -0.00027596205472946167, -0.00024956464767456055, -0.00022316724061965942, -0.0001967698335647583, -0.00017037242650985718, -0.00014397501945495605, -0.00011757761240005493, -9.118020534515381e-05, -6.478279829025269e-05, -3.838539123535156e-05, -1.198798418045044e-05, 1.4409422874450684e-05, 4.080682992935181e-05, 6.720423698425293e-05, 9.360164403915405e-05, 0.00011999905109405518, 0.0001463964581489563, 0.00017279386520385742, 0.00019919127225875854, 0.00022558867931365967, 0.0002519860863685608, 0.0002783834934234619, 0.00030478090047836304, 0.00033117830753326416, 0.0003575757145881653, 0.0003839731216430664, 0.00041037052869796753, 0.00043676793575286865, 0.0004631653428077698, 0.0004895627498626709, 0.000515960156917572, 0.0005423575639724731, 0.0005687549710273743, 0.0005951523780822754, 0.0006215497851371765, 0.0006479471921920776, 0.0006743445992469788, 0.0007007420063018799, 0.000727139413356781, 0.0007535368204116821, 0.0007799342274665833, 0.0008063316345214844]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 9.0, 10.0, 6.0, 8.0, 4.0, 16.0, 20.0, 39.0, 61.0, 98.0, 157.0, 219.0, 306.0, 471.0, 790.0, 1219.0, 1855.0, 2919.0, 4602.0, 7197.0, 11344.0, 17842.0, 27339.0, 42078.0, 61484.0, 85479.0, 109435.0, 126277.0, 130193.0, 116621.0, 93706.0, 69282.0, 48193.0, 32146.0, 20457.0, 13275.0, 8359.0, 5509.0, 3352.0, 2130.0, 1442.0, 883.0, 577.0, 436.0, 264.0, 160.0, 101.0, 63.0, 41.0, 33.0, 24.0, 16.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.30078125, -6.11083984375, -5.9208984375, -5.73095703125, -5.541015625, -5.35107421875, -5.1611328125, -4.97119140625, -4.78125, -4.59130859375, -4.4013671875, -4.21142578125, -4.021484375, -3.83154296875, -3.6416015625, -3.45166015625, -3.26171875, -3.07177734375, -2.8818359375, -2.69189453125, -2.501953125, -2.31201171875, -2.1220703125, -1.93212890625, -1.7421875, -1.55224609375, -1.3623046875, -1.17236328125, -0.982421875, -0.79248046875, -0.6025390625, -0.41259765625, -0.22265625, -0.03271484375, 0.1572265625, 0.34716796875, 0.537109375, 0.72705078125, 0.9169921875, 1.10693359375, 1.296875, 1.48681640625, 1.6767578125, 1.86669921875, 2.056640625, 2.24658203125, 2.4365234375, 2.62646484375, 2.81640625, 3.00634765625, 3.1962890625, 3.38623046875, 3.576171875, 3.76611328125, 3.9560546875, 4.14599609375, 4.3359375, 4.52587890625, 4.7158203125, 4.90576171875, 5.095703125, 5.28564453125, 5.4755859375, 5.66552734375, 5.85546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 4.0, 5.0, 4.0, 9.0, 12.0, 5.0, 11.0, 12.0, 14.0, 16.0, 34.0, 34.0, 35.0, 56.0, 42.0, 41.0, 49.0, 48.0, 65.0, 45.0, 65.0, 48.0, 36.0, 44.0, 43.0, 37.0, 34.0, 31.0, 19.0, 14.0, 18.0, 11.0, 16.0, 8.0, 10.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.10546875, -3.01123046875, -2.9169921875, -2.82275390625, -2.728515625, -2.63427734375, -2.5400390625, -2.44580078125, -2.3515625, -2.25732421875, -2.1630859375, -2.06884765625, -1.974609375, -1.88037109375, -1.7861328125, -1.69189453125, -1.59765625, -1.50341796875, -1.4091796875, -1.31494140625, -1.220703125, -1.12646484375, -1.0322265625, -0.93798828125, -0.84375, -0.74951171875, -0.6552734375, -0.56103515625, -0.466796875, -0.37255859375, -0.2783203125, -0.18408203125, -0.08984375, 0.00439453125, 0.0986328125, 0.19287109375, 0.287109375, 0.38134765625, 0.4755859375, 0.56982421875, 0.6640625, 0.75830078125, 0.8525390625, 0.94677734375, 1.041015625, 1.13525390625, 1.2294921875, 1.32373046875, 1.41796875, 1.51220703125, 1.6064453125, 1.70068359375, 1.794921875, 1.88916015625, 1.9833984375, 2.07763671875, 2.171875, 2.26611328125, 2.3603515625, 2.45458984375, 2.548828125, 2.64306640625, 2.7373046875, 2.83154296875, 2.92578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 3.0, 8.0, 9.0, 12.0, 19.0, 21.0, 19.0, 25.0, 38.0, 37.0, 37.0, 49.0, 40.0, 53.0, 54.0, 61.0, 45.0, 45.0, 40.0, 58.0, 35.0, 47.0, 32.0, 28.0, 29.0, 20.0, 18.0, 22.0, 18.0, 22.0, 14.0, 8.0, 8.0, 4.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.414396286010742, -24.58373260498047, -23.753070831298828, -22.922407150268555, -22.09174346923828, -21.26108169555664, -20.430418014526367, -19.599754333496094, -18.769092559814453, -17.93842887878418, -17.10776710510254, -16.277103424072266, -15.446440696716309, -14.615777969360352, -13.785114288330078, -12.954451560974121, -12.123788833618164, -11.293126106262207, -10.46246337890625, -9.631799697875977, -8.80113697052002, -7.9704742431640625, -7.139811038970947, -6.309147834777832, -5.478485107421875, -4.647822380065918, -3.8171591758728027, -2.9864962100982666, -2.1558332443237305, -1.3251705169677734, -0.4945073127746582, 0.33615589141845703, 1.1668205261230469, 1.997483491897583, 2.828146457672119, 3.6588094234466553, 4.489472389221191, 5.320135116577148, 6.150798320770264, 6.981461524963379, 7.812124252319336, 8.642786979675293, 9.47344970703125, 10.304113388061523, 11.13477611541748, 11.965438842773438, 12.796102523803711, 13.626765251159668, 14.457427978515625, 15.288090705871582, 16.11875343322754, 16.949417114257812, 17.780078887939453, 18.610742568969727, 19.44140625, 20.27206802368164, 21.102731704711914, 21.933395385742188, 22.764057159423828, 23.5947208404541, 24.425384521484375, 25.256046295166016, 26.08670997619629, 26.917373657226562, 27.748035430908203]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 9.0, 6.0, 3.0, 5.0, 9.0, 14.0, 7.0, 18.0, 12.0, 16.0, 24.0, 22.0, 19.0, 36.0, 28.0, 31.0, 28.0, 35.0, 32.0, 31.0, 40.0, 30.0, 34.0, 38.0, 45.0, 51.0, 47.0, 34.0, 33.0, 27.0, 18.0, 25.0, 29.0, 20.0, 18.0, 24.0, 22.0, 11.0, 12.0, 6.0, 8.0, 8.0, 6.0, 5.0, 6.0, 9.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-28.657997131347656, -27.8220157623291, -26.986034393310547, -26.150053024291992, -25.314071655273438, -24.478090286254883, -23.642108917236328, -22.806129455566406, -21.97014617919922, -21.134164810180664, -20.29818344116211, -19.462202072143555, -18.626220703125, -17.790239334106445, -16.95425796508789, -16.11827850341797, -15.282297134399414, -14.44631576538086, -13.610334396362305, -12.77435302734375, -11.938371658325195, -11.10239028930664, -10.266409873962402, -9.430428504943848, -8.594447135925293, -7.758465766906738, -6.922484397888184, -6.086503505706787, -5.250522136688232, -4.414540767669678, -3.5785598754882812, -2.7425785064697266, -1.906595230102539, -1.070613980293274, -0.2346327304840088, 0.6013484001159668, 1.4373297691345215, 2.273311138153076, 3.1092920303344727, 3.9452733993530273, 4.781254768371582, 5.617236137390137, 6.453217506408691, 7.289198398590088, 8.125179290771484, 8.961160659790039, 9.797142028808594, 10.633123397827148, 11.469104766845703, 12.305086135864258, 13.141067504882812, 13.977048873901367, 14.813030242919922, 15.649011611938477, 16.48499298095703, 17.320972442626953, 18.15695571899414, 18.992937088012695, 19.82891845703125, 20.664899826049805, 21.50088119506836, 22.336862564086914, 23.17284393310547, 24.00882339477539, 24.844804763793945]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 13.0, 17.0, 16.0, 23.0, 59.0, 71.0, 142.0, 233.0, 355.0, 624.0, 979.0, 1659.0, 2754.0, 4437.0, 7442.0, 12478.0, 20401.0, 33396.0, 54626.0, 87447.0, 139413.0, 213990.0, 317024.0, 432895.0, 532935.0, 567224.0, 520805.0, 415208.0, 298943.0, 199175.0, 128024.0, 80136.0, 48669.0, 29225.0, 17560.0, 10541.0, 6311.0, 3745.0, 2167.0, 1256.0, 769.0, 452.0, 271.0, 142.0, 107.0, 53.0, 24.0, 20.0, 19.0, 12.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.22705078125, -18.5947265625, -17.96240234375, -17.330078125, -16.69775390625, -16.0654296875, -15.43310546875, -14.80078125, -14.16845703125, -13.5361328125, -12.90380859375, -12.271484375, -11.63916015625, -11.0068359375, -10.37451171875, -9.7421875, -9.10986328125, -8.4775390625, -7.84521484375, -7.212890625, -6.58056640625, -5.9482421875, -5.31591796875, -4.68359375, -4.05126953125, -3.4189453125, -2.78662109375, -2.154296875, -1.52197265625, -0.8896484375, -0.25732421875, 0.375, 1.00732421875, 1.6396484375, 2.27197265625, 2.904296875, 3.53662109375, 4.1689453125, 4.80126953125, 5.43359375, 6.06591796875, 6.6982421875, 7.33056640625, 7.962890625, 8.59521484375, 9.2275390625, 9.85986328125, 10.4921875, 11.12451171875, 11.7568359375, 12.38916015625, 13.021484375, 13.65380859375, 14.2861328125, 14.91845703125, 15.55078125, 16.18310546875, 16.8154296875, 17.44775390625, 18.080078125, 18.71240234375, 19.3447265625, 19.97705078125, 20.609375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 4.0, 4.0, 6.0, 5.0, 5.0, 14.0, 8.0, 8.0, 18.0, 16.0, 18.0, 18.0, 27.0, 21.0, 34.0, 24.0, 27.0, 39.0, 30.0, 32.0, 30.0, 31.0, 32.0, 50.0, 45.0, 36.0, 38.0, 36.0, 36.0, 37.0, 26.0, 29.0, 27.0, 22.0, 21.0, 17.0, 17.0, 17.0, 18.0, 14.0, 14.0, 12.0, 4.0, 6.0, 6.0, 8.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0], "bins": [-21.421875, -20.817626953125, -20.21337890625, -19.609130859375, -19.0048828125, -18.400634765625, -17.79638671875, -17.192138671875, -16.587890625, -15.983642578125, -15.37939453125, -14.775146484375, -14.1708984375, -13.566650390625, -12.96240234375, -12.358154296875, -11.75390625, -11.149658203125, -10.54541015625, -9.941162109375, -9.3369140625, -8.732666015625, -8.12841796875, -7.524169921875, -6.919921875, -6.315673828125, -5.71142578125, -5.107177734375, -4.5029296875, -3.898681640625, -3.29443359375, -2.690185546875, -2.0859375, -1.481689453125, -0.87744140625, -0.273193359375, 0.3310546875, 0.935302734375, 1.53955078125, 2.143798828125, 2.748046875, 3.352294921875, 3.95654296875, 4.560791015625, 5.1650390625, 5.769287109375, 6.37353515625, 6.977783203125, 7.58203125, 8.186279296875, 8.79052734375, 9.394775390625, 9.9990234375, 10.603271484375, 11.20751953125, 11.811767578125, 12.416015625, 13.020263671875, 13.62451171875, 14.228759765625, 14.8330078125, 15.437255859375, 16.04150390625, 16.645751953125, 17.25]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 1.0, 9.0, 12.0, 26.0, 32.0, 65.0, 100.0, 176.0, 258.0, 431.0, 714.0, 1044.0, 1850.0, 3100.0, 5028.0, 8010.0, 12865.0, 20428.0, 32121.0, 49316.0, 74010.0, 109254.0, 154155.0, 211060.0, 273754.0, 336481.0, 388162.0, 417711.0, 417678.0, 388335.0, 334896.0, 272860.0, 210132.0, 153096.0, 108718.0, 73707.0, 49244.0, 31965.0, 20032.0, 12831.0, 8052.0, 4948.0, 3030.0, 1863.0, 1096.0, 645.0, 396.0, 234.0, 142.0, 95.0, 49.0, 35.0, 23.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.296875, -14.8187255859375, -14.340576171875, -13.8624267578125, -13.38427734375, -12.9061279296875, -12.427978515625, -11.9498291015625, -11.4716796875, -10.9935302734375, -10.515380859375, -10.0372314453125, -9.55908203125, -9.0809326171875, -8.602783203125, -8.1246337890625, -7.646484375, -7.1683349609375, -6.690185546875, -6.2120361328125, -5.73388671875, -5.2557373046875, -4.777587890625, -4.2994384765625, -3.8212890625, -3.3431396484375, -2.864990234375, -2.3868408203125, -1.90869140625, -1.4305419921875, -0.952392578125, -0.4742431640625, 0.00390625, 0.4820556640625, 0.960205078125, 1.4383544921875, 1.91650390625, 2.3946533203125, 2.872802734375, 3.3509521484375, 3.8291015625, 4.3072509765625, 4.785400390625, 5.2635498046875, 5.74169921875, 6.2198486328125, 6.697998046875, 7.1761474609375, 7.654296875, 8.1324462890625, 8.610595703125, 9.0887451171875, 9.56689453125, 10.0450439453125, 10.523193359375, 11.0013427734375, 11.4794921875, 11.9576416015625, 12.435791015625, 12.9139404296875, 13.39208984375, 13.8702392578125, 14.348388671875, 14.8265380859375, 15.3046875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 12.0, 9.0, 16.0, 17.0, 17.0, 19.0, 38.0, 37.0, 46.0, 53.0, 53.0, 76.0, 103.0, 108.0, 101.0, 116.0, 151.0, 173.0, 174.0, 178.0, 191.0, 177.0, 201.0, 179.0, 202.0, 191.0, 204.0, 161.0, 166.0, 120.0, 111.0, 109.0, 100.0, 83.0, 76.0, 56.0, 41.0, 36.0, 35.0, 25.0, 28.0, 16.0, 12.0, 15.0, 6.0, 4.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.4609375, -8.181884765625, -7.90283203125, -7.623779296875, -7.3447265625, -7.065673828125, -6.78662109375, -6.507568359375, -6.228515625, -5.949462890625, -5.67041015625, -5.391357421875, -5.1123046875, -4.833251953125, -4.55419921875, -4.275146484375, -3.99609375, -3.717041015625, -3.43798828125, -3.158935546875, -2.8798828125, -2.600830078125, -2.32177734375, -2.042724609375, -1.763671875, -1.484619140625, -1.20556640625, -0.926513671875, -0.6474609375, -0.368408203125, -0.08935546875, 0.189697265625, 0.46875, 0.747802734375, 1.02685546875, 1.305908203125, 1.5849609375, 1.864013671875, 2.14306640625, 2.422119140625, 2.701171875, 2.980224609375, 3.25927734375, 3.538330078125, 3.8173828125, 4.096435546875, 4.37548828125, 4.654541015625, 4.93359375, 5.212646484375, 5.49169921875, 5.770751953125, 6.0498046875, 6.328857421875, 6.60791015625, 6.886962890625, 7.166015625, 7.445068359375, 7.72412109375, 8.003173828125, 8.2822265625, 8.561279296875, 8.84033203125, 9.119384765625, 9.3984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 10.0, 5.0, 9.0, 11.0, 19.0, 21.0, 21.0, 35.0, 25.0, 39.0, 36.0, 36.0, 26.0, 41.0, 48.0, 48.0, 53.0, 40.0, 34.0, 40.0, 41.0, 37.0, 46.0, 40.0, 18.0, 26.0, 33.0, 21.0, 24.0, 15.0, 17.0, 15.0, 12.0, 10.0, 11.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-21.126115798950195, -20.4793758392334, -19.8326358795166, -19.185895919799805, -18.539154052734375, -17.892414093017578, -17.24567413330078, -16.598934173583984, -15.952194213867188, -15.30545425415039, -14.658714294433594, -14.01197338104248, -13.365233421325684, -12.718493461608887, -12.071752548217773, -11.425012588500977, -10.77827262878418, -10.131532669067383, -9.484792709350586, -8.838051795959473, -8.191311836242676, -7.544571876525879, -6.897831439971924, -6.251091003417969, -5.604351043701172, -4.957611083984375, -4.31087064743042, -3.664130449295044, -3.017390251159668, -2.370650053024292, -1.723909854888916, -1.077169418334961, -0.43042945861816406, 0.21631073951721191, 0.8630509376525879, 1.5097911357879639, 2.15653133392334, 2.803271532058716, 3.450011730194092, 4.096752166748047, 4.743492126464844, 5.390232086181641, 6.036972522735596, 6.683712959289551, 7.330452919006348, 7.9771928787231445, 8.623933792114258, 9.270673751831055, 9.917413711547852, 10.564153671264648, 11.210893630981445, 11.857634544372559, 12.504374504089355, 13.151114463806152, 13.797855377197266, 14.444595336914062, 15.09133529663086, 15.738075256347656, 16.384815216064453, 17.03155517578125, 17.678295135498047, 18.325037002563477, 18.971776962280273, 19.61851692199707, 20.265256881713867]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 10.0, 9.0, 11.0, 8.0, 11.0, 24.0, 13.0, 26.0, 17.0, 25.0, 18.0, 24.0, 25.0, 41.0, 29.0, 43.0, 29.0, 42.0, 39.0, 40.0, 37.0, 41.0, 32.0, 45.0, 40.0, 28.0, 37.0, 25.0, 27.0, 19.0, 19.0, 19.0, 22.0, 23.0, 16.0, 12.0, 10.0, 3.0, 15.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.80310821533203, -21.084636688232422, -20.366165161132812, -19.647693634033203, -18.929222106933594, -18.210750579833984, -17.492279052734375, -16.7738094329834, -16.05533790588379, -15.33686637878418, -14.61839485168457, -13.899923324584961, -13.181452751159668, -12.462981224060059, -11.74450969696045, -11.026039123535156, -10.30756664276123, -9.589095115661621, -8.870623588562012, -8.152153015136719, -7.433681488037109, -6.7152099609375, -5.996738433837891, -5.2782673835754395, -4.55979585647583, -3.8413245677948, -3.1228532791137695, -2.40438175201416, -1.6859104633331299, -0.9674391746520996, -0.24896764755249023, 0.46950340270996094, 1.1879749298095703, 1.9064462184906006, 2.624917507171631, 3.3433890342712402, 4.061860084533691, 4.780331611633301, 5.49880313873291, 6.217274188995361, 6.935745716094971, 7.65421724319458, 8.372688293457031, 9.09115982055664, 9.80963134765625, 10.52810287475586, 11.246574401855469, 11.965044975280762, 12.683516502380371, 13.40198802947998, 14.12045955657959, 14.838930130004883, 15.557401657104492, 16.2758731842041, 16.99434471130371, 17.71281623840332, 18.43128776550293, 19.14975929260254, 19.86823081970215, 20.586702346801758, 21.305173873901367, 22.023643493652344, 22.742115020751953, 23.460586547851562, 24.179058074951172]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 14.0, 11.0, 27.0, 26.0, 61.0, 90.0, 109.0, 166.0, 250.0, 352.0, 547.0, 869.0, 1259.0, 1806.0, 2772.0, 4325.0, 6395.0, 10046.0, 15854.0, 25526.0, 40587.0, 65603.0, 105128.0, 160218.0, 198920.0, 148289.0, 96195.0, 60895.0, 37424.0, 23056.0, 14639.0, 9431.0, 6009.0, 3939.0, 2510.0, 1722.0, 1145.0, 738.0, 506.0, 359.0, 240.0, 138.0, 114.0, 74.0, 56.0, 34.0, 28.0, 13.0, 10.0, 11.0, 2.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0], "bins": [-3.58203125, -3.467987060546875, -3.35394287109375, -3.239898681640625, -3.1258544921875, -3.011810302734375, -2.89776611328125, -2.783721923828125, -2.669677734375, -2.555633544921875, -2.44158935546875, -2.327545166015625, -2.2135009765625, -2.099456787109375, -1.98541259765625, -1.871368408203125, -1.75732421875, -1.643280029296875, -1.52923583984375, -1.415191650390625, -1.3011474609375, -1.187103271484375, -1.07305908203125, -0.959014892578125, -0.844970703125, -0.730926513671875, -0.61688232421875, -0.502838134765625, -0.3887939453125, -0.274749755859375, -0.16070556640625, -0.046661376953125, 0.0673828125, 0.181427001953125, 0.29547119140625, 0.409515380859375, 0.5235595703125, 0.637603759765625, 0.75164794921875, 0.865692138671875, 0.979736328125, 1.093780517578125, 1.20782470703125, 1.321868896484375, 1.4359130859375, 1.549957275390625, 1.66400146484375, 1.778045654296875, 1.89208984375, 2.006134033203125, 2.12017822265625, 2.234222412109375, 2.3482666015625, 2.462310791015625, 2.57635498046875, 2.690399169921875, 2.804443359375, 2.918487548828125, 3.03253173828125, 3.146575927734375, 3.2606201171875, 3.374664306640625, 3.48870849609375, 3.602752685546875, 3.716796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 14.0, 12.0, 11.0, 11.0, 11.0, 16.0, 20.0, 18.0, 20.0, 18.0, 25.0, 30.0, 37.0, 39.0, 32.0, 38.0, 46.0, 50.0, 46.0, 33.0, 41.0, 32.0, 34.0, 38.0, 28.0, 27.0, 31.0, 25.0, 30.0, 19.0, 17.0, 14.0, 16.0, 22.0, 11.0, 11.0, 13.0, 10.0, 9.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.125, -23.384765625, -22.64453125, -21.904296875, -21.1640625, -20.423828125, -19.68359375, -18.943359375, -18.203125, -17.462890625, -16.72265625, -15.982421875, -15.2421875, -14.501953125, -13.76171875, -13.021484375, -12.28125, -11.541015625, -10.80078125, -10.060546875, -9.3203125, -8.580078125, -7.83984375, -7.099609375, -6.359375, -5.619140625, -4.87890625, -4.138671875, -3.3984375, -2.658203125, -1.91796875, -1.177734375, -0.4375, 0.302734375, 1.04296875, 1.783203125, 2.5234375, 3.263671875, 4.00390625, 4.744140625, 5.484375, 6.224609375, 6.96484375, 7.705078125, 8.4453125, 9.185546875, 9.92578125, 10.666015625, 11.40625, 12.146484375, 12.88671875, 13.626953125, 14.3671875, 15.107421875, 15.84765625, 16.587890625, 17.328125, 18.068359375, 18.80859375, 19.548828125, 20.2890625, 21.029296875, 21.76953125, 22.509765625, 23.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 14.0, 17.0, 26.0, 35.0, 51.0, 66.0, 112.0, 141.0, 228.0, 355.0, 489.0, 757.0, 1174.0, 1667.0, 2470.0, 3514.0, 5169.0, 7876.0, 11737.0, 18082.0, 27845.0, 43850.0, 68515.0, 107996.0, 159745.0, 187166.0, 140707.0, 92761.0, 58604.0, 37129.0, 23685.0, 15580.0, 10253.0, 6564.0, 4581.0, 3098.0, 2118.0, 1390.0, 995.0, 630.0, 444.0, 297.0, 195.0, 146.0, 108.0, 69.0, 31.0, 35.0, 20.0, 9.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.95703125, -2.86553955078125, -2.7740478515625, -2.68255615234375, -2.591064453125, -2.49957275390625, -2.4080810546875, -2.31658935546875, -2.22509765625, -2.13360595703125, -2.0421142578125, -1.95062255859375, -1.859130859375, -1.76763916015625, -1.6761474609375, -1.58465576171875, -1.4931640625, -1.40167236328125, -1.3101806640625, -1.21868896484375, -1.127197265625, -1.03570556640625, -0.9442138671875, -0.85272216796875, -0.76123046875, -0.66973876953125, -0.5782470703125, -0.48675537109375, -0.395263671875, -0.30377197265625, -0.2122802734375, -0.12078857421875, -0.029296875, 0.06219482421875, 0.1536865234375, 0.24517822265625, 0.336669921875, 0.42816162109375, 0.5196533203125, 0.61114501953125, 0.70263671875, 0.79412841796875, 0.8856201171875, 0.97711181640625, 1.068603515625, 1.16009521484375, 1.2515869140625, 1.34307861328125, 1.4345703125, 1.52606201171875, 1.6175537109375, 1.70904541015625, 1.800537109375, 1.89202880859375, 1.9835205078125, 2.07501220703125, 2.16650390625, 2.25799560546875, 2.3494873046875, 2.44097900390625, 2.532470703125, 2.62396240234375, 2.7154541015625, 2.80694580078125, 2.8984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 8.0, 10.0, 8.0, 8.0, 14.0, 7.0, 15.0, 17.0, 23.0, 17.0, 33.0, 38.0, 33.0, 35.0, 29.0, 40.0, 41.0, 35.0, 25.0, 41.0, 41.0, 40.0, 36.0, 31.0, 42.0, 32.0, 31.0, 36.0, 31.0, 35.0, 29.0, 17.0, 17.0, 11.0, 16.0, 13.0, 11.0, 12.0, 9.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.59375, -16.082763671875, -15.57177734375, -15.060791015625, -14.5498046875, -14.038818359375, -13.52783203125, -13.016845703125, -12.505859375, -11.994873046875, -11.48388671875, -10.972900390625, -10.4619140625, -9.950927734375, -9.43994140625, -8.928955078125, -8.41796875, -7.906982421875, -7.39599609375, -6.885009765625, -6.3740234375, -5.863037109375, -5.35205078125, -4.841064453125, -4.330078125, -3.819091796875, -3.30810546875, -2.797119140625, -2.2861328125, -1.775146484375, -1.26416015625, -0.753173828125, -0.2421875, 0.268798828125, 0.77978515625, 1.290771484375, 1.8017578125, 2.312744140625, 2.82373046875, 3.334716796875, 3.845703125, 4.356689453125, 4.86767578125, 5.378662109375, 5.8896484375, 6.400634765625, 6.91162109375, 7.422607421875, 7.93359375, 8.444580078125, 8.95556640625, 9.466552734375, 9.9775390625, 10.488525390625, 10.99951171875, 11.510498046875, 12.021484375, 12.532470703125, 13.04345703125, 13.554443359375, 14.0654296875, 14.576416015625, 15.08740234375, 15.598388671875, 16.109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 13.0, 19.0, 16.0, 25.0, 36.0, 60.0, 106.0, 146.0, 206.0, 334.0, 479.0, 735.0, 1133.0, 1757.0, 2678.0, 4264.0, 6947.0, 11512.0, 19793.0, 35705.0, 69547.0, 147186.0, 304683.0, 224853.0, 100260.0, 49953.0, 26933.0, 15217.0, 8880.0, 5412.0, 3341.0, 2222.0, 1374.0, 973.0, 594.0, 380.0, 266.0, 190.0, 102.0, 54.0, 45.0, 38.0, 38.0, 12.0, 9.0, 6.0, 5.0, 9.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238525390625, -0.23077011108398438, -0.22301483154296875, -0.21525955200195312, -0.2075042724609375, -0.19974899291992188, -0.19199371337890625, -0.18423843383789062, -0.176483154296875, -0.16872787475585938, -0.16097259521484375, -0.15321731567382812, -0.1454620361328125, -0.13770675659179688, -0.12995147705078125, -0.12219619750976562, -0.11444091796875, -0.10668563842773438, -0.09893035888671875, -0.09117507934570312, -0.0834197998046875, -0.07566452026367188, -0.06790924072265625, -0.060153961181640625, -0.052398681640625, -0.044643402099609375, -0.03688812255859375, -0.029132843017578125, -0.0213775634765625, -0.013622283935546875, -0.00586700439453125, 0.001888275146484375, 0.0096435546875, 0.017398834228515625, 0.02515411376953125, 0.032909393310546875, 0.0406646728515625, 0.048419952392578125, 0.05617523193359375, 0.06393051147460938, 0.071685791015625, 0.07944107055664062, 0.08719635009765625, 0.09495162963867188, 0.1027069091796875, 0.11046218872070312, 0.11821746826171875, 0.12597274780273438, 0.13372802734375, 0.14148330688476562, 0.14923858642578125, 0.15699386596679688, 0.1647491455078125, 0.17250442504882812, 0.18025970458984375, 0.18801498413085938, 0.195770263671875, 0.20352554321289062, 0.21128082275390625, 0.21903610229492188, 0.2267913818359375, 0.23454666137695312, 0.24230194091796875, 0.2500572204589844, 0.2578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 8.0, 20.0, 25.0, 30.0, 42.0, 49.0, 61.0, 78.0, 77.0, 80.0, 69.0, 94.0, 68.0, 63.0, 50.0, 42.0, 32.0, 24.0, 14.0, 17.0, 11.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.003545761108398e-05, -6.810110062360764e-05, -6.616674363613129e-05, -6.423238664865494e-05, -6.229802966117859e-05, -6.036367267370224e-05, -5.842931568622589e-05, -5.649495869874954e-05, -5.456060171127319e-05, -5.2626244723796844e-05, -5.0691887736320496e-05, -4.875753074884415e-05, -4.68231737613678e-05, -4.488881677389145e-05, -4.29544597864151e-05, -4.102010279893875e-05, -3.90857458114624e-05, -3.7151388823986053e-05, -3.5217031836509705e-05, -3.3282674849033356e-05, -3.134831786155701e-05, -2.9413960874080658e-05, -2.747960388660431e-05, -2.554524689912796e-05, -2.361088991165161e-05, -2.1676532924175262e-05, -1.9742175936698914e-05, -1.7807818949222565e-05, -1.5873461961746216e-05, -1.3939104974269867e-05, -1.2004747986793518e-05, -1.007039099931717e-05, -8.13603401184082e-06, -6.2016770243644714e-06, -4.2673200368881226e-06, -2.3329630494117737e-06, -3.986060619354248e-07, 1.535750925540924e-06, 3.470107913017273e-06, 5.404464900493622e-06, 7.338821887969971e-06, 9.27317887544632e-06, 1.1207535862922668e-05, 1.3141892850399017e-05, 1.5076249837875366e-05, 1.7010606825351715e-05, 1.8944963812828064e-05, 2.0879320800304413e-05, 2.2813677787780762e-05, 2.474803477525711e-05, 2.668239176273346e-05, 2.861674875020981e-05, 3.055110573768616e-05, 3.2485462725162506e-05, 3.4419819712638855e-05, 3.6354176700115204e-05, 3.828853368759155e-05, 4.02228906750679e-05, 4.215724766254425e-05, 4.40916046500206e-05, 4.602596163749695e-05, 4.79603186249733e-05, 4.9894675612449646e-05, 5.1829032599925995e-05, 5.3763389587402344e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 14.0, 18.0, 29.0, 40.0, 65.0, 101.0, 132.0, 251.0, 343.0, 578.0, 915.0, 1585.0, 2556.0, 4337.0, 7466.0, 13301.0, 25208.0, 48274.0, 96985.0, 226977.0, 346002.0, 134811.0, 64973.0, 32871.0, 17587.0, 9423.0, 5485.0, 3180.0, 1872.0, 1193.0, 722.0, 482.0, 295.0, 148.0, 101.0, 78.0, 51.0, 26.0, 28.0, 20.0, 8.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9523696899414062, -0.9228057861328125, -0.8932418823242188, -0.863677978515625, -0.8341140747070312, -0.8045501708984375, -0.7749862670898438, -0.74542236328125, -0.7158584594726562, -0.6862945556640625, -0.6567306518554688, -0.627166748046875, -0.5976028442382812, -0.5680389404296875, -0.5384750366210938, -0.5089111328125, -0.47934722900390625, -0.4497833251953125, -0.42021942138671875, -0.390655517578125, -0.36109161376953125, -0.3315277099609375, -0.30196380615234375, -0.27239990234375, -0.24283599853515625, -0.2132720947265625, -0.18370819091796875, -0.154144287109375, -0.12458038330078125, -0.0950164794921875, -0.06545257568359375, -0.035888671875, -0.00632476806640625, 0.0232391357421875, 0.05280303955078125, 0.082366943359375, 0.11193084716796875, 0.1414947509765625, 0.17105865478515625, 0.20062255859375, 0.23018646240234375, 0.2597503662109375, 0.28931427001953125, 0.318878173828125, 0.34844207763671875, 0.3780059814453125, 0.40756988525390625, 0.4371337890625, 0.46669769287109375, 0.4962615966796875, 0.5258255004882812, 0.555389404296875, 0.5849533081054688, 0.6145172119140625, 0.6440811157226562, 0.67364501953125, 0.7032089233398438, 0.7327728271484375, 0.7623367309570312, 0.791900634765625, 0.8214645385742188, 0.8510284423828125, 0.8805923461914062, 0.91015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 8.0, 4.0, 7.0, 7.0, 10.0, 14.0, 14.0, 22.0, 20.0, 25.0, 32.0, 30.0, 42.0, 39.0, 47.0, 46.0, 38.0, 48.0, 51.0, 49.0, 38.0, 35.0, 52.0, 56.0, 41.0, 39.0, 31.0, 33.0, 22.0, 12.0, 13.0, 13.0, 16.0, 10.0, 6.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.438232421875, -0.4240760803222656, -0.40991973876953125, -0.3957633972167969, -0.3816070556640625, -0.3674507141113281, -0.35329437255859375, -0.3391380310058594, -0.324981689453125, -0.3108253479003906, -0.29666900634765625, -0.2825126647949219, -0.2683563232421875, -0.2541999816894531, -0.24004364013671875, -0.22588729858398438, -0.21173095703125, -0.19757461547851562, -0.18341827392578125, -0.16926193237304688, -0.1551055908203125, -0.14094924926757812, -0.12679290771484375, -0.11263656616210938, -0.098480224609375, -0.08432388305664062, -0.07016754150390625, -0.056011199951171875, -0.0418548583984375, -0.027698516845703125, -0.01354217529296875, 0.000614166259765625, 0.0147705078125, 0.028926849365234375, 0.04308319091796875, 0.057239532470703125, 0.0713958740234375, 0.08555221557617188, 0.09970855712890625, 0.11386489868164062, 0.128021240234375, 0.14217758178710938, 0.15633392333984375, 0.17049026489257812, 0.1846466064453125, 0.19880294799804688, 0.21295928955078125, 0.22711563110351562, 0.24127197265625, 0.2554283142089844, 0.26958465576171875, 0.2837409973144531, 0.2978973388671875, 0.3120536804199219, 0.32621002197265625, 0.3403663635253906, 0.354522705078125, 0.3686790466308594, 0.38283538818359375, 0.3969917297363281, 0.4111480712890625, 0.4253044128417969, 0.43946075439453125, 0.4536170959472656, 0.4677734375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 9.0, 6.0, 10.0, 13.0, 15.0, 24.0, 19.0, 31.0, 31.0, 39.0, 34.0, 27.0, 34.0, 42.0, 40.0, 41.0, 54.0, 44.0, 37.0, 40.0, 35.0, 45.0, 38.0, 39.0, 26.0, 26.0, 29.0, 21.0, 20.0, 18.0, 20.0, 18.0, 13.0, 9.0, 11.0, 7.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-19.849225997924805, -19.220840454101562, -18.592456817626953, -17.96407127380371, -17.33568572998047, -16.70730209350586, -16.078916549682617, -15.450531005859375, -14.82214641571045, -14.193761825561523, -13.565376281738281, -12.936991691589355, -12.30860710144043, -11.680221557617188, -11.051836967468262, -10.423452377319336, -9.795066833496094, -9.166682243347168, -8.538296699523926, -7.909912109375, -7.281527042388916, -6.653141975402832, -6.024757385253906, -5.396372318267822, -4.767987251281738, -4.139602184295654, -3.5112173557281494, -2.8828325271606445, -2.2544474601745605, -1.6260623931884766, -0.9976775646209717, -0.3692927360534668, 0.2590904235839844, 0.8874753713607788, 1.5158603191375732, 2.144245147705078, 2.772630214691162, 3.401015281677246, 4.029399871826172, 4.657784938812256, 5.28617000579834, 5.914555072784424, 6.542940139770508, 7.171324729919434, 7.799709796905518, 8.428094863891602, 9.056479454040527, 9.684864044189453, 10.313249588012695, 10.941634178161621, 11.570019721984863, 12.198404312133789, 12.826789855957031, 13.455174446105957, 14.083559036254883, 14.711944580078125, 15.34032917022705, 15.968713760375977, 16.59709930419922, 17.22548484802246, 17.85386848449707, 18.482254028320312, 19.110639572143555, 19.739023208618164, 20.367408752441406]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 9.0, 11.0, 8.0, 12.0, 19.0, 19.0, 19.0, 21.0, 24.0, 19.0, 24.0, 23.0, 39.0, 33.0, 30.0, 42.0, 33.0, 46.0, 37.0, 42.0, 38.0, 33.0, 50.0, 39.0, 29.0, 34.0, 26.0, 28.0, 18.0, 21.0, 18.0, 20.0, 22.0, 24.0, 11.0, 6.0, 6.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.98387336730957, -21.26636505126953, -20.548858642578125, -19.831350326538086, -19.11384391784668, -18.39633560180664, -17.678829193115234, -16.961320877075195, -16.243812561035156, -15.526305198669434, -14.808797836303711, -14.091289520263672, -13.373783111572266, -12.656274795532227, -11.938767433166504, -11.221260070800781, -10.503753662109375, -9.786246299743652, -9.06873893737793, -8.35123062133789, -7.633723735809326, -6.9162163734436035, -6.198708534240723, -5.481201171875, -4.763693809509277, -4.046186447143555, -3.328678846359253, -2.611171245574951, -1.8936638832092285, -1.1761565208435059, -0.458648681640625, 0.25885868072509766, 0.9763660430908203, 1.6938735246658325, 2.4113810062408447, 3.1288886070251465, 3.846395969390869, 4.563903331756592, 5.281411170959473, 5.998918533325195, 6.716425895690918, 7.433933258056641, 8.151440620422363, 8.868947982788086, 9.586456298828125, 10.303962707519531, 11.02147102355957, 11.738978385925293, 12.456485748291016, 13.173993110656738, 13.891500473022461, 14.6090087890625, 15.326515197753906, 16.044023513793945, 16.761531829833984, 17.47903823852539, 18.196544647216797, 18.914052963256836, 19.631559371948242, 20.34906768798828, 21.066574096679688, 21.784082412719727, 22.501590728759766, 23.219097137451172, 23.93660545349121]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 8.0, 7.0, 19.0, 19.0, 42.0, 71.0, 118.0, 236.0, 365.0, 624.0, 1067.0, 1687.0, 2768.0, 4462.0, 7312.0, 11736.0, 18616.0, 28219.0, 41838.0, 59384.0, 79773.0, 99219.0, 113428.0, 119214.0, 112266.0, 97195.0, 77658.0, 57081.0, 40445.0, 27137.0, 17482.0, 11012.0, 7077.0, 4341.0, 2618.0, 1633.0, 945.0, 568.0, 347.0, 206.0, 122.0, 83.0, 50.0, 31.0, 14.0, 7.0, 6.0, 6.0, 5.0, 0.0, 3.0], "bins": [-18.734375, -18.2203369140625, -17.706298828125, -17.1922607421875, -16.67822265625, -16.1641845703125, -15.650146484375, -15.1361083984375, -14.6220703125, -14.1080322265625, -13.593994140625, -13.0799560546875, -12.56591796875, -12.0518798828125, -11.537841796875, -11.0238037109375, -10.509765625, -9.9957275390625, -9.481689453125, -8.9676513671875, -8.45361328125, -7.9395751953125, -7.425537109375, -6.9114990234375, -6.3974609375, -5.8834228515625, -5.369384765625, -4.8553466796875, -4.34130859375, -3.8272705078125, -3.313232421875, -2.7991943359375, -2.28515625, -1.7711181640625, -1.257080078125, -0.7430419921875, -0.22900390625, 0.2850341796875, 0.799072265625, 1.3131103515625, 1.8271484375, 2.3411865234375, 2.855224609375, 3.3692626953125, 3.88330078125, 4.3973388671875, 4.911376953125, 5.4254150390625, 5.939453125, 6.4534912109375, 6.967529296875, 7.4815673828125, 7.99560546875, 8.5096435546875, 9.023681640625, 9.5377197265625, 10.0517578125, 10.5657958984375, 11.079833984375, 11.5938720703125, 12.10791015625, 12.6219482421875, 13.135986328125, 13.6500244140625, 14.1640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 4.0, 7.0, 11.0, 10.0, 7.0, 11.0, 17.0, 11.0, 19.0, 28.0, 27.0, 21.0, 22.0, 33.0, 24.0, 33.0, 25.0, 39.0, 41.0, 39.0, 29.0, 40.0, 45.0, 46.0, 30.0, 44.0, 32.0, 27.0, 35.0, 35.0, 28.0, 21.0, 23.0, 16.0, 11.0, 19.0, 11.0, 15.0, 14.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.3125, -19.612060546875, -18.91162109375, -18.211181640625, -17.5107421875, -16.810302734375, -16.10986328125, -15.409423828125, -14.708984375, -14.008544921875, -13.30810546875, -12.607666015625, -11.9072265625, -11.206787109375, -10.50634765625, -9.805908203125, -9.10546875, -8.405029296875, -7.70458984375, -7.004150390625, -6.3037109375, -5.603271484375, -4.90283203125, -4.202392578125, -3.501953125, -2.801513671875, -2.10107421875, -1.400634765625, -0.7001953125, 0.000244140625, 0.70068359375, 1.401123046875, 2.1015625, 2.802001953125, 3.50244140625, 4.202880859375, 4.9033203125, 5.603759765625, 6.30419921875, 7.004638671875, 7.705078125, 8.405517578125, 9.10595703125, 9.806396484375, 10.5068359375, 11.207275390625, 11.90771484375, 12.608154296875, 13.30859375, 14.009033203125, 14.70947265625, 15.409912109375, 16.1103515625, 16.810791015625, 17.51123046875, 18.211669921875, 18.912109375, 19.612548828125, 20.31298828125, 21.013427734375, 21.7138671875, 22.414306640625, 23.11474609375, 23.815185546875, 24.515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 11.0, 22.0, 30.0, 42.0, 71.0, 117.0, 169.0, 256.0, 429.0, 638.0, 915.0, 1465.0, 2260.0, 3470.0, 5485.0, 8128.0, 12055.0, 18730.0, 26956.0, 38183.0, 53059.0, 69752.0, 86045.0, 98688.0, 106550.0, 105550.0, 97731.0, 82868.0, 66641.0, 50193.0, 36482.0, 25556.0, 17157.0, 11332.0, 7532.0, 4944.0, 3202.0, 1979.0, 1362.0, 828.0, 596.0, 385.0, 243.0, 156.0, 117.0, 60.0, 43.0, 21.0, 19.0, 13.0, 6.0, 5.0, 5.0, 1.0, 1.0], "bins": [-15.875, -15.4068603515625, -14.938720703125, -14.4705810546875, -14.00244140625, -13.5343017578125, -13.066162109375, -12.5980224609375, -12.1298828125, -11.6617431640625, -11.193603515625, -10.7254638671875, -10.25732421875, -9.7891845703125, -9.321044921875, -8.8529052734375, -8.384765625, -7.9166259765625, -7.448486328125, -6.9803466796875, -6.51220703125, -6.0440673828125, -5.575927734375, -5.1077880859375, -4.6396484375, -4.1715087890625, -3.703369140625, -3.2352294921875, -2.76708984375, -2.2989501953125, -1.830810546875, -1.3626708984375, -0.89453125, -0.4263916015625, 0.041748046875, 0.5098876953125, 0.97802734375, 1.4461669921875, 1.914306640625, 2.3824462890625, 2.8505859375, 3.3187255859375, 3.786865234375, 4.2550048828125, 4.72314453125, 5.1912841796875, 5.659423828125, 6.1275634765625, 6.595703125, 7.0638427734375, 7.531982421875, 8.0001220703125, 8.46826171875, 8.9364013671875, 9.404541015625, 9.8726806640625, 10.3408203125, 10.8089599609375, 11.277099609375, 11.7452392578125, 12.21337890625, 12.6815185546875, 13.149658203125, 13.6177978515625, 14.0859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 3.0, 2.0, 6.0, 11.0, 9.0, 11.0, 15.0, 16.0, 16.0, 15.0, 19.0, 28.0, 23.0, 27.0, 34.0, 37.0, 34.0, 23.0, 49.0, 37.0, 40.0, 35.0, 48.0, 49.0, 47.0, 36.0, 29.0, 40.0, 35.0, 27.0, 21.0, 25.0, 27.0, 19.0, 19.0, 13.0, 11.0, 9.0, 5.0, 11.0, 9.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-15.03125, -14.5692138671875, -14.107177734375, -13.6451416015625, -13.18310546875, -12.7210693359375, -12.259033203125, -11.7969970703125, -11.3349609375, -10.8729248046875, -10.410888671875, -9.9488525390625, -9.48681640625, -9.0247802734375, -8.562744140625, -8.1007080078125, -7.638671875, -7.1766357421875, -6.714599609375, -6.2525634765625, -5.79052734375, -5.3284912109375, -4.866455078125, -4.4044189453125, -3.9423828125, -3.4803466796875, -3.018310546875, -2.5562744140625, -2.09423828125, -1.6322021484375, -1.170166015625, -0.7081298828125, -0.24609375, 0.2159423828125, 0.677978515625, 1.1400146484375, 1.60205078125, 2.0640869140625, 2.526123046875, 2.9881591796875, 3.4501953125, 3.9122314453125, 4.374267578125, 4.8363037109375, 5.29833984375, 5.7603759765625, 6.222412109375, 6.6844482421875, 7.146484375, 7.6085205078125, 8.070556640625, 8.5325927734375, 8.99462890625, 9.4566650390625, 9.918701171875, 10.3807373046875, 10.8427734375, 11.3048095703125, 11.766845703125, 12.2288818359375, 12.69091796875, 13.1529541015625, 13.614990234375, 14.0770263671875, 14.5390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 16.0, 21.0, 30.0, 38.0, 45.0, 73.0, 119.0, 215.0, 316.0, 494.0, 850.0, 1389.0, 2432.0, 4428.0, 7691.0, 13415.0, 23351.0, 39997.0, 65015.0, 98583.0, 133225.0, 153567.0, 150099.0, 124701.0, 89074.0, 57653.0, 34368.0, 20235.0, 11372.0, 6723.0, 3690.0, 2043.0, 1306.0, 736.0, 443.0, 276.0, 181.0, 121.0, 89.0, 45.0, 29.0, 13.0, 13.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94921875, -5.7564697265625, -5.563720703125, -5.3709716796875, -5.17822265625, -4.9854736328125, -4.792724609375, -4.5999755859375, -4.4072265625, -4.2144775390625, -4.021728515625, -3.8289794921875, -3.63623046875, -3.4434814453125, -3.250732421875, -3.0579833984375, -2.865234375, -2.6724853515625, -2.479736328125, -2.2869873046875, -2.09423828125, -1.9014892578125, -1.708740234375, -1.5159912109375, -1.3232421875, -1.1304931640625, -0.937744140625, -0.7449951171875, -0.55224609375, -0.3594970703125, -0.166748046875, 0.0260009765625, 0.21875, 0.4114990234375, 0.604248046875, 0.7969970703125, 0.98974609375, 1.1824951171875, 1.375244140625, 1.5679931640625, 1.7607421875, 1.9534912109375, 2.146240234375, 2.3389892578125, 2.53173828125, 2.7244873046875, 2.917236328125, 3.1099853515625, 3.302734375, 3.4954833984375, 3.688232421875, 3.8809814453125, 4.07373046875, 4.2664794921875, 4.459228515625, 4.6519775390625, 4.8447265625, 5.0374755859375, 5.230224609375, 5.4229736328125, 5.61572265625, 5.8084716796875, 6.001220703125, 6.1939697265625, 6.38671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 13.0, 12.0, 26.0, 21.0, 20.0, 17.0, 27.0, 27.0, 33.0, 36.0, 35.0, 43.0, 56.0, 50.0, 49.0, 51.0, 50.0, 44.0, 43.0, 50.0, 29.0, 40.0, 33.0, 30.0, 30.0, 21.0, 22.0, 15.0, 16.0, 8.0, 7.0, 9.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006279945373535156, -0.0006105229258537292, -0.0005930513143539429, -0.0005755797028541565, -0.0005581080913543701, -0.0005406364798545837, -0.0005231648683547974, -0.000505693256855011, -0.0004882216453552246, -0.00047075003385543823, -0.00045327842235565186, -0.0004358068108558655, -0.0004183351993560791, -0.0004008635878562927, -0.00038339197635650635, -0.00036592036485671997, -0.0003484487533569336, -0.0003309771418571472, -0.00031350553035736084, -0.00029603391885757446, -0.0002785623073577881, -0.0002610906958580017, -0.00024361908435821533, -0.00022614747285842896, -0.00020867586135864258, -0.0001912042498588562, -0.00017373263835906982, -0.00015626102685928345, -0.00013878941535949707, -0.0001213178038597107, -0.00010384619235992432, -8.637458086013794e-05, -6.890296936035156e-05, -5.1431357860565186e-05, -3.395974636077881e-05, -1.648813486099243e-05, 9.834766387939453e-07, 1.8455088138580322e-05, 3.59266996383667e-05, 5.3398311138153076e-05, 7.086992263793945e-05, 8.834153413772583e-05, 0.00010581314563751221, 0.00012328475713729858, 0.00014075636863708496, 0.00015822798013687134, 0.00017569959163665771, 0.0001931712031364441, 0.00021064281463623047, 0.00022811442613601685, 0.0002455860376358032, 0.0002630576491355896, 0.000280529260635376, 0.00029800087213516235, 0.00031547248363494873, 0.0003329440951347351, 0.0003504157066345215, 0.00036788731813430786, 0.00038535892963409424, 0.0004028305411338806, 0.000420302152633667, 0.00043777376413345337, 0.00045524537563323975, 0.0004727169871330261, 0.0004901885986328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 13.0, 21.0, 27.0, 43.0, 62.0, 85.0, 118.0, 193.0, 321.0, 473.0, 767.0, 1142.0, 1844.0, 2634.0, 4317.0, 6758.0, 10840.0, 16929.0, 26247.0, 39628.0, 57388.0, 78305.0, 101292.0, 118408.0, 124724.0, 117330.0, 99163.0, 76372.0, 55585.0, 38138.0, 24984.0, 15974.0, 10300.0, 6575.0, 4192.0, 2618.0, 1717.0, 1019.0, 719.0, 473.0, 291.0, 166.0, 116.0, 75.0, 55.0, 35.0, 30.0, 8.0, 15.0, 6.0, 6.0, 4.0, 4.0, 3.0], "bins": [-5.6875, -5.52239990234375, -5.3572998046875, -5.19219970703125, -5.027099609375, -4.86199951171875, -4.6968994140625, -4.53179931640625, -4.36669921875, -4.20159912109375, -4.0364990234375, -3.87139892578125, -3.706298828125, -3.54119873046875, -3.3760986328125, -3.21099853515625, -3.0458984375, -2.88079833984375, -2.7156982421875, -2.55059814453125, -2.385498046875, -2.22039794921875, -2.0552978515625, -1.89019775390625, -1.72509765625, -1.55999755859375, -1.3948974609375, -1.22979736328125, -1.064697265625, -0.89959716796875, -0.7344970703125, -0.56939697265625, -0.404296875, -0.23919677734375, -0.0740966796875, 0.09100341796875, 0.256103515625, 0.42120361328125, 0.5863037109375, 0.75140380859375, 0.91650390625, 1.08160400390625, 1.2467041015625, 1.41180419921875, 1.576904296875, 1.74200439453125, 1.9071044921875, 2.07220458984375, 2.2373046875, 2.40240478515625, 2.5675048828125, 2.73260498046875, 2.897705078125, 3.06280517578125, 3.2279052734375, 3.39300537109375, 3.55810546875, 3.72320556640625, 3.8883056640625, 4.05340576171875, 4.218505859375, 4.38360595703125, 4.5487060546875, 4.71380615234375, 4.87890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 9.0, 10.0, 10.0, 13.0, 11.0, 24.0, 19.0, 32.0, 37.0, 28.0, 23.0, 26.0, 49.0, 48.0, 37.0, 39.0, 47.0, 40.0, 42.0, 41.0, 44.0, 47.0, 40.0, 36.0, 35.0, 17.0, 31.0, 16.0, 28.0, 17.0, 13.0, 16.0, 18.0, 10.0, 8.0, 2.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.431640625, -2.360595703125, -2.28955078125, -2.218505859375, -2.1474609375, -2.076416015625, -2.00537109375, -1.934326171875, -1.86328125, -1.792236328125, -1.72119140625, -1.650146484375, -1.5791015625, -1.508056640625, -1.43701171875, -1.365966796875, -1.294921875, -1.223876953125, -1.15283203125, -1.081787109375, -1.0107421875, -0.939697265625, -0.86865234375, -0.797607421875, -0.7265625, -0.655517578125, -0.58447265625, -0.513427734375, -0.4423828125, -0.371337890625, -0.30029296875, -0.229248046875, -0.158203125, -0.087158203125, -0.01611328125, 0.054931640625, 0.1259765625, 0.197021484375, 0.26806640625, 0.339111328125, 0.41015625, 0.481201171875, 0.55224609375, 0.623291015625, 0.6943359375, 0.765380859375, 0.83642578125, 0.907470703125, 0.978515625, 1.049560546875, 1.12060546875, 1.191650390625, 1.2626953125, 1.333740234375, 1.40478515625, 1.475830078125, 1.546875, 1.617919921875, 1.68896484375, 1.760009765625, 1.8310546875, 1.902099609375, 1.97314453125, 2.044189453125, 2.115234375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 10.0, 4.0, 3.0, 6.0, 8.0, 11.0, 14.0, 12.0, 22.0, 27.0, 22.0, 30.0, 33.0, 27.0, 29.0, 31.0, 47.0, 49.0, 44.0, 54.0, 34.0, 44.0, 56.0, 37.0, 36.0, 31.0, 36.0, 32.0, 29.0, 17.0, 26.0, 22.0, 18.0, 20.0, 17.0, 15.0, 8.0, 14.0, 6.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.69333839416504, -19.070175170898438, -18.44701385498047, -17.823850631713867, -17.2006893157959, -16.577526092529297, -15.954364776611328, -15.331201553344727, -14.708040237426758, -14.084877967834473, -13.461715698242188, -12.838553428649902, -12.215391159057617, -11.592228889465332, -10.969066619873047, -10.345903396606445, -9.72274112701416, -9.099578857421875, -8.47641658782959, -7.853254318237305, -7.2300920486450195, -6.606929779052734, -5.983767032623291, -5.360604763031006, -4.737442493438721, -4.1142802238464355, -3.4911179542541504, -2.867955446243286, -2.244793176651001, -1.6216309070587158, -0.9984683990478516, -0.3753061294555664, 0.24785614013671875, 0.8710184693336487, 1.4941807985305786, 2.1173431873321533, 2.7405054569244385, 3.3636677265167236, 3.986830234527588, 4.609992504119873, 5.233154773712158, 5.856317043304443, 6.4794793128967285, 7.102642059326172, 7.725804328918457, 8.348966598510742, 8.972128868103027, 9.595291137695312, 10.218453407287598, 10.841615676879883, 11.464777946472168, 12.087940216064453, 12.711102485656738, 13.334264755249023, 13.957427978515625, 14.580589294433594, 15.203752517700195, 15.82691478729248, 16.450077056884766, 17.073240280151367, 17.696401596069336, 18.319564819335938, 18.942726135253906, 19.565889358520508, 20.189050674438477]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 11.0, 6.0, 15.0, 15.0, 15.0, 15.0, 21.0, 15.0, 19.0, 23.0, 30.0, 26.0, 31.0, 45.0, 31.0, 35.0, 44.0, 47.0, 41.0, 43.0, 35.0, 36.0, 32.0, 35.0, 35.0, 29.0, 29.0, 27.0, 27.0, 23.0, 29.0, 9.0, 20.0, 18.0, 11.0, 10.0, 15.0, 8.0, 4.0, 7.0, 1.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.66383934020996, -21.906023025512695, -21.14820671081543, -20.390392303466797, -19.63257598876953, -18.874759674072266, -18.116943359375, -17.359127044677734, -16.60131072998047, -15.843494415283203, -15.085679054260254, -14.327862739562988, -13.570047378540039, -12.812231063842773, -12.054414749145508, -11.296598434448242, -10.53878402709961, -9.780967712402344, -9.023152351379395, -8.265336036682129, -7.5075201988220215, -6.749704360961914, -5.991888046264648, -5.234072208404541, -4.476256370544434, -3.718440532684326, -2.9606244564056396, -2.202808380126953, -1.4449925422668457, -0.6871767044067383, 0.07063961029052734, 0.8284554481506348, 1.5862712860107422, 2.3440871238708496, 3.101903200149536, 3.8597192764282227, 4.61753511428833, 5.3753509521484375, 6.133167266845703, 6.8909831047058105, 7.648798942565918, 8.406615257263184, 9.164430618286133, 9.922246932983398, 10.680063247680664, 11.437878608703613, 12.195694923400879, 12.953510284423828, 13.711326599121094, 14.46914291381836, 15.226958274841309, 15.984774589538574, 16.742589950561523, 17.50040626525879, 18.258222579956055, 19.01603889465332, 19.773853302001953, 20.53166961669922, 21.289485931396484, 22.04730224609375, 22.805116653442383, 23.56293296813965, 24.320749282836914, 25.07856559753418, 25.836381912231445]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 15.0, 27.0, 44.0, 64.0, 110.0, 189.0, 293.0, 463.0, 667.0, 1067.0, 1716.0, 2626.0, 4184.0, 6432.0, 9971.0, 15678.0, 23948.0, 37188.0, 56319.0, 84469.0, 124540.0, 178942.0, 248936.0, 328801.0, 404343.0, 457729.0, 467615.0, 433900.0, 364196.0, 284770.0, 209687.0, 149072.0, 101443.0, 67792.0, 45039.0, 29052.0, 18841.0, 12241.0, 8050.0, 4934.0, 3250.0, 2050.0, 1289.0, 869.0, 522.0, 310.0, 245.0, 137.0, 79.0, 53.0, 33.0, 22.0, 9.0, 6.0, 6.0, 3.0, 1.0], "bins": [-15.734375, -15.2608642578125, -14.787353515625, -14.3138427734375, -13.84033203125, -13.3668212890625, -12.893310546875, -12.4197998046875, -11.9462890625, -11.4727783203125, -10.999267578125, -10.5257568359375, -10.05224609375, -9.5787353515625, -9.105224609375, -8.6317138671875, -8.158203125, -7.6846923828125, -7.211181640625, -6.7376708984375, -6.26416015625, -5.7906494140625, -5.317138671875, -4.8436279296875, -4.3701171875, -3.8966064453125, -3.423095703125, -2.9495849609375, -2.47607421875, -2.0025634765625, -1.529052734375, -1.0555419921875, -0.58203125, -0.1085205078125, 0.364990234375, 0.8385009765625, 1.31201171875, 1.7855224609375, 2.259033203125, 2.7325439453125, 3.2060546875, 3.6795654296875, 4.153076171875, 4.6265869140625, 5.10009765625, 5.5736083984375, 6.047119140625, 6.5206298828125, 6.994140625, 7.4676513671875, 7.941162109375, 8.4146728515625, 8.88818359375, 9.3616943359375, 9.835205078125, 10.3087158203125, 10.7822265625, 11.2557373046875, 11.729248046875, 12.2027587890625, 12.67626953125, 13.1497802734375, 13.623291015625, 14.0968017578125, 14.5703125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 3.0, 10.0, 10.0, 10.0, 12.0, 13.0, 13.0, 13.0, 24.0, 27.0, 16.0, 22.0, 25.0, 44.0, 25.0, 38.0, 39.0, 38.0, 46.0, 49.0, 41.0, 44.0, 27.0, 40.0, 35.0, 32.0, 29.0, 36.0, 29.0, 20.0, 16.0, 21.0, 18.0, 20.0, 8.0, 19.0, 15.0, 13.0, 13.0, 5.0, 10.0, 1.0, 6.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.0625, -17.504150390625, -16.94580078125, -16.387451171875, -15.8291015625, -15.270751953125, -14.71240234375, -14.154052734375, -13.595703125, -13.037353515625, -12.47900390625, -11.920654296875, -11.3623046875, -10.803955078125, -10.24560546875, -9.687255859375, -9.12890625, -8.570556640625, -8.01220703125, -7.453857421875, -6.8955078125, -6.337158203125, -5.77880859375, -5.220458984375, -4.662109375, -4.103759765625, -3.54541015625, -2.987060546875, -2.4287109375, -1.870361328125, -1.31201171875, -0.753662109375, -0.1953125, 0.363037109375, 0.92138671875, 1.479736328125, 2.0380859375, 2.596435546875, 3.15478515625, 3.713134765625, 4.271484375, 4.829833984375, 5.38818359375, 5.946533203125, 6.5048828125, 7.063232421875, 7.62158203125, 8.179931640625, 8.73828125, 9.296630859375, 9.85498046875, 10.413330078125, 10.9716796875, 11.530029296875, 12.08837890625, 12.646728515625, 13.205078125, 13.763427734375, 14.32177734375, 14.880126953125, 15.4384765625, 15.996826171875, 16.55517578125, 17.113525390625, 17.671875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 10.0, 9.0, 16.0, 22.0, 40.0, 89.0, 126.0, 246.0, 419.0, 710.0, 1204.0, 2172.0, 3750.0, 6410.0, 11174.0, 19314.0, 32394.0, 53622.0, 85925.0, 133262.0, 196391.0, 273441.0, 357475.0, 430821.0, 473545.0, 474782.0, 433361.0, 361686.0, 280432.0, 200981.0, 136814.0, 88936.0, 54850.0, 33433.0, 19774.0, 11322.0, 6571.0, 3775.0, 2136.0, 1230.0, 694.0, 385.0, 221.0, 127.0, 85.0, 54.0, 30.0, 15.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9453125, -14.4476318359375, -13.949951171875, -13.4522705078125, -12.95458984375, -12.4569091796875, -11.959228515625, -11.4615478515625, -10.9638671875, -10.4661865234375, -9.968505859375, -9.4708251953125, -8.97314453125, -8.4754638671875, -7.977783203125, -7.4801025390625, -6.982421875, -6.4847412109375, -5.987060546875, -5.4893798828125, -4.99169921875, -4.4940185546875, -3.996337890625, -3.4986572265625, -3.0009765625, -2.5032958984375, -2.005615234375, -1.5079345703125, -1.01025390625, -0.5125732421875, -0.014892578125, 0.4827880859375, 0.98046875, 1.4781494140625, 1.975830078125, 2.4735107421875, 2.97119140625, 3.4688720703125, 3.966552734375, 4.4642333984375, 4.9619140625, 5.4595947265625, 5.957275390625, 6.4549560546875, 6.95263671875, 7.4503173828125, 7.947998046875, 8.4456787109375, 8.943359375, 9.4410400390625, 9.938720703125, 10.4364013671875, 10.93408203125, 11.4317626953125, 11.929443359375, 12.4271240234375, 12.9248046875, 13.4224853515625, 13.920166015625, 14.4178466796875, 14.91552734375, 15.4132080078125, 15.910888671875, 16.4085693359375, 16.90625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 6.0, 5.0, 15.0, 11.0, 15.0, 23.0, 30.0, 39.0, 42.0, 48.0, 66.0, 102.0, 91.0, 106.0, 105.0, 144.0, 150.0, 159.0, 184.0, 195.0, 178.0, 201.0, 207.0, 226.0, 207.0, 183.0, 189.0, 168.0, 142.0, 154.0, 107.0, 107.0, 76.0, 61.0, 73.0, 55.0, 37.0, 31.0, 35.0, 27.0, 13.0, 17.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.0234375, -8.7467041015625, -8.469970703125, -8.1932373046875, -7.91650390625, -7.6397705078125, -7.363037109375, -7.0863037109375, -6.8095703125, -6.5328369140625, -6.256103515625, -5.9793701171875, -5.70263671875, -5.4259033203125, -5.149169921875, -4.8724365234375, -4.595703125, -4.3189697265625, -4.042236328125, -3.7655029296875, -3.48876953125, -3.2120361328125, -2.935302734375, -2.6585693359375, -2.3818359375, -2.1051025390625, -1.828369140625, -1.5516357421875, -1.27490234375, -0.9981689453125, -0.721435546875, -0.4447021484375, -0.16796875, 0.1087646484375, 0.385498046875, 0.6622314453125, 0.93896484375, 1.2156982421875, 1.492431640625, 1.7691650390625, 2.0458984375, 2.3226318359375, 2.599365234375, 2.8760986328125, 3.15283203125, 3.4295654296875, 3.706298828125, 3.9830322265625, 4.259765625, 4.5364990234375, 4.813232421875, 5.0899658203125, 5.36669921875, 5.6434326171875, 5.920166015625, 6.1968994140625, 6.4736328125, 6.7503662109375, 7.027099609375, 7.3038330078125, 7.58056640625, 7.8572998046875, 8.134033203125, 8.4107666015625, 8.6875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 9.0, 10.0, 14.0, 16.0, 18.0, 30.0, 25.0, 33.0, 29.0, 49.0, 45.0, 47.0, 53.0, 45.0, 53.0, 71.0, 53.0, 45.0, 49.0, 40.0, 31.0, 37.0, 22.0, 34.0, 25.0, 18.0, 20.0, 23.0, 13.0, 10.0, 7.0, 5.0, 1.0, 9.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.792701721191406, -18.082082748413086, -17.371461868286133, -16.660842895507812, -15.950222969055176, -15.239603042602539, -14.528984069824219, -13.818364143371582, -13.107744216918945, -12.397124290466309, -11.686504364013672, -10.975885391235352, -10.265265464782715, -9.554645538330078, -8.844026565551758, -8.133406639099121, -7.422786712646484, -6.712166786193848, -6.001547336578369, -5.290927886962891, -4.580307960510254, -3.8696882724761963, -3.1590685844421387, -2.44844913482666, -1.7378292083740234, -1.0272095203399658, -0.3165898323059082, 0.3940298557281494, 1.104649543762207, 1.8152692317962646, 2.5258889198303223, 3.236508369445801, 3.9471282958984375, 4.657748222351074, 5.368367671966553, 6.078987121582031, 6.789607048034668, 7.500226974487305, 8.210845947265625, 8.921465873718262, 9.632085800170898, 10.342705726623535, 11.053325653076172, 11.763944625854492, 12.474564552307129, 13.185184478759766, 13.895803451538086, 14.606423377990723, 15.31704330444336, 16.02766227722168, 16.738283157348633, 17.448902130126953, 18.159523010253906, 18.870141983032227, 19.580760955810547, 20.2913818359375, 21.00200080871582, 21.71261978149414, 22.423240661621094, 23.133859634399414, 23.844478607177734, 24.555099487304688, 25.265718460083008, 25.976337432861328, 26.68695831298828]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 15.0, 11.0, 13.0, 16.0, 27.0, 24.0, 24.0, 32.0, 34.0, 44.0, 49.0, 34.0, 40.0, 46.0, 56.0, 39.0, 43.0, 33.0, 41.0, 33.0, 35.0, 36.0, 40.0, 22.0, 24.0, 24.0, 22.0, 21.0, 15.0, 12.0, 8.0, 9.0, 7.0, 6.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.516550064086914, -20.770729064941406, -20.02490997314453, -19.279088973999023, -18.533267974853516, -17.78744888305664, -17.041627883911133, -16.295806884765625, -15.54998779296875, -14.804167747497559, -14.058347702026367, -13.31252670288086, -12.566706657409668, -11.820886611938477, -11.075065612792969, -10.329245567321777, -9.583425521850586, -8.837605476379395, -8.091785430908203, -7.345964431762695, -6.600144386291504, -5.8543243408203125, -5.108503818511963, -4.362683296203613, -3.616863250732422, -2.8710429668426514, -2.125222682952881, -1.3794023990631104, -0.6335821151733398, 0.11223816871643066, 0.8580584526062012, 1.6038789749145508, 2.349700927734375, 3.0955212116241455, 3.841341495513916, 4.587162017822266, 5.332982063293457, 6.078802108764648, 6.824622631072998, 7.570443153381348, 8.316263198852539, 9.06208324432373, 9.807903289794922, 10.55372428894043, 11.299544334411621, 12.045364379882812, 12.79118537902832, 13.537005424499512, 14.282825469970703, 15.028645515441895, 15.774465560913086, 16.520286560058594, 17.26610565185547, 18.011926651000977, 18.757747650146484, 19.50356674194336, 20.249387741088867, 20.995208740234375, 21.74102783203125, 22.486848831176758, 23.232669830322266, 23.97848892211914, 24.72430992126465, 25.470130920410156, 26.21595001220703]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 10.0, 24.0, 35.0, 43.0, 77.0, 112.0, 163.0, 253.0, 371.0, 593.0, 861.0, 1298.0, 2087.0, 3070.0, 4839.0, 7475.0, 11773.0, 18250.0, 28870.0, 44508.0, 69316.0, 106399.0, 156577.0, 186002.0, 140415.0, 93920.0, 61312.0, 38982.0, 25378.0, 16252.0, 10553.0, 6598.0, 4296.0, 2734.0, 1787.0, 1159.0, 740.0, 480.0, 317.0, 205.0, 125.0, 95.0, 53.0, 40.0, 33.0, 29.0, 14.0, 15.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.8494873046875, -2.755615234375, -2.6617431640625, -2.56787109375, -2.4739990234375, -2.380126953125, -2.2862548828125, -2.1923828125, -2.0985107421875, -2.004638671875, -1.9107666015625, -1.81689453125, -1.7230224609375, -1.629150390625, -1.5352783203125, -1.44140625, -1.3475341796875, -1.253662109375, -1.1597900390625, -1.06591796875, -0.9720458984375, -0.878173828125, -0.7843017578125, -0.6904296875, -0.5965576171875, -0.502685546875, -0.4088134765625, -0.31494140625, -0.2210693359375, -0.127197265625, -0.0333251953125, 0.060546875, 0.1544189453125, 0.248291015625, 0.3421630859375, 0.43603515625, 0.5299072265625, 0.623779296875, 0.7176513671875, 0.8115234375, 0.9053955078125, 0.999267578125, 1.0931396484375, 1.18701171875, 1.2808837890625, 1.374755859375, 1.4686279296875, 1.5625, 1.6563720703125, 1.750244140625, 1.8441162109375, 1.93798828125, 2.0318603515625, 2.125732421875, 2.2196044921875, 2.3134765625, 2.4073486328125, 2.501220703125, 2.5950927734375, 2.68896484375, 2.7828369140625, 2.876708984375, 2.9705810546875, 3.064453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 8.0, 13.0, 8.0, 8.0, 13.0, 17.0, 14.0, 19.0, 20.0, 26.0, 28.0, 31.0, 40.0, 33.0, 48.0, 45.0, 42.0, 44.0, 55.0, 44.0, 41.0, 45.0, 45.0, 35.0, 34.0, 25.0, 20.0, 40.0, 27.0, 25.0, 20.0, 10.0, 17.0, 12.0, 7.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -22.206787109375, -21.42919921875, -20.651611328125, -19.8740234375, -19.096435546875, -18.31884765625, -17.541259765625, -16.763671875, -15.986083984375, -15.20849609375, -14.430908203125, -13.6533203125, -12.875732421875, -12.09814453125, -11.320556640625, -10.54296875, -9.765380859375, -8.98779296875, -8.210205078125, -7.4326171875, -6.655029296875, -5.87744140625, -5.099853515625, -4.322265625, -3.544677734375, -2.76708984375, -1.989501953125, -1.2119140625, -0.434326171875, 0.34326171875, 1.120849609375, 1.8984375, 2.676025390625, 3.45361328125, 4.231201171875, 5.0087890625, 5.786376953125, 6.56396484375, 7.341552734375, 8.119140625, 8.896728515625, 9.67431640625, 10.451904296875, 11.2294921875, 12.007080078125, 12.78466796875, 13.562255859375, 14.33984375, 15.117431640625, 15.89501953125, 16.672607421875, 17.4501953125, 18.227783203125, 19.00537109375, 19.782958984375, 20.560546875, 21.338134765625, 22.11572265625, 22.893310546875, 23.6708984375, 24.448486328125, 25.22607421875, 26.003662109375, 26.78125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 11.0, 13.0, 16.0, 29.0, 62.0, 65.0, 119.0, 143.0, 217.0, 315.0, 504.0, 701.0, 1022.0, 1412.0, 1942.0, 3040.0, 4200.0, 6212.0, 9318.0, 14261.0, 21584.0, 33063.0, 52240.0, 81266.0, 126684.0, 181011.0, 173621.0, 118904.0, 76389.0, 48291.0, 30706.0, 20094.0, 13078.0, 8897.0, 6053.0, 4043.0, 2730.0, 1961.0, 1320.0, 972.0, 593.0, 464.0, 307.0, 232.0, 153.0, 97.0, 70.0, 41.0, 32.0, 26.0, 18.0, 7.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.638671875, -2.5533447265625, -2.468017578125, -2.3826904296875, -2.29736328125, -2.2120361328125, -2.126708984375, -2.0413818359375, -1.9560546875, -1.8707275390625, -1.785400390625, -1.7000732421875, -1.61474609375, -1.5294189453125, -1.444091796875, -1.3587646484375, -1.2734375, -1.1881103515625, -1.102783203125, -1.0174560546875, -0.93212890625, -0.8468017578125, -0.761474609375, -0.6761474609375, -0.5908203125, -0.5054931640625, -0.420166015625, -0.3348388671875, -0.24951171875, -0.1641845703125, -0.078857421875, 0.0064697265625, 0.091796875, 0.1771240234375, 0.262451171875, 0.3477783203125, 0.43310546875, 0.5184326171875, 0.603759765625, 0.6890869140625, 0.7744140625, 0.8597412109375, 0.945068359375, 1.0303955078125, 1.11572265625, 1.2010498046875, 1.286376953125, 1.3717041015625, 1.45703125, 1.5423583984375, 1.627685546875, 1.7130126953125, 1.79833984375, 1.8836669921875, 1.968994140625, 2.0543212890625, 2.1396484375, 2.2249755859375, 2.310302734375, 2.3956298828125, 2.48095703125, 2.5662841796875, 2.651611328125, 2.7369384765625, 2.822265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 8.0, 3.0, 9.0, 10.0, 12.0, 11.0, 17.0, 12.0, 14.0, 12.0, 19.0, 23.0, 25.0, 31.0, 33.0, 28.0, 37.0, 36.0, 33.0, 26.0, 44.0, 50.0, 37.0, 36.0, 43.0, 41.0, 40.0, 15.0, 34.0, 24.0, 30.0, 33.0, 27.0, 20.0, 16.0, 21.0, 22.0, 12.0, 11.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-14.65625, -14.21142578125, -13.7666015625, -13.32177734375, -12.876953125, -12.43212890625, -11.9873046875, -11.54248046875, -11.09765625, -10.65283203125, -10.2080078125, -9.76318359375, -9.318359375, -8.87353515625, -8.4287109375, -7.98388671875, -7.5390625, -7.09423828125, -6.6494140625, -6.20458984375, -5.759765625, -5.31494140625, -4.8701171875, -4.42529296875, -3.98046875, -3.53564453125, -3.0908203125, -2.64599609375, -2.201171875, -1.75634765625, -1.3115234375, -0.86669921875, -0.421875, 0.02294921875, 0.4677734375, 0.91259765625, 1.357421875, 1.80224609375, 2.2470703125, 2.69189453125, 3.13671875, 3.58154296875, 4.0263671875, 4.47119140625, 4.916015625, 5.36083984375, 5.8056640625, 6.25048828125, 6.6953125, 7.14013671875, 7.5849609375, 8.02978515625, 8.474609375, 8.91943359375, 9.3642578125, 9.80908203125, 10.25390625, 10.69873046875, 11.1435546875, 11.58837890625, 12.033203125, 12.47802734375, 12.9228515625, 13.36767578125, 13.8125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 14.0, 18.0, 35.0, 47.0, 75.0, 99.0, 148.0, 223.0, 359.0, 491.0, 795.0, 1143.0, 1891.0, 3013.0, 4949.0, 8500.0, 15153.0, 28527.0, 58683.0, 134774.0, 331318.0, 257400.0, 101036.0, 45880.0, 23170.0, 12241.0, 7131.0, 4232.0, 2503.0, 1561.0, 1042.0, 683.0, 481.0, 309.0, 191.0, 129.0, 95.0, 61.0, 40.0, 31.0, 22.0, 15.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2255859375, -0.21850013732910156, -0.21141433715820312, -0.2043285369873047, -0.19724273681640625, -0.1901569366455078, -0.18307113647460938, -0.17598533630371094, -0.1688995361328125, -0.16181373596191406, -0.15472793579101562, -0.1476421356201172, -0.14055633544921875, -0.1334705352783203, -0.12638473510742188, -0.11929893493652344, -0.112213134765625, -0.10512733459472656, -0.09804153442382812, -0.09095573425292969, -0.08386993408203125, -0.07678413391113281, -0.06969833374023438, -0.06261253356933594, -0.0555267333984375, -0.04844093322753906, -0.041355133056640625, -0.03426933288574219, -0.02718353271484375, -0.020097732543945312, -0.013011932373046875, -0.0059261322021484375, 0.00115966796875, 0.008245468139648438, 0.015331268310546875, 0.022417068481445312, 0.02950286865234375, 0.03658866882324219, 0.043674468994140625, 0.05076026916503906, 0.0578460693359375, 0.06493186950683594, 0.07201766967773438, 0.07910346984863281, 0.08618927001953125, 0.09327507019042969, 0.10036087036132812, 0.10744667053222656, 0.114532470703125, 0.12161827087402344, 0.12870407104492188, 0.1357898712158203, 0.14287567138671875, 0.1499614715576172, 0.15704727172851562, 0.16413307189941406, 0.1712188720703125, 0.17830467224121094, 0.18539047241210938, 0.1924762725830078, 0.19956207275390625, 0.2066478729248047, 0.21373367309570312, 0.22081947326660156, 0.2279052734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 7.0, 6.0, 6.0, 6.0, 5.0, 14.0, 6.0, 16.0, 15.0, 17.0, 26.0, 16.0, 23.0, 17.0, 36.0, 40.0, 37.0, 48.0, 48.0, 56.0, 48.0, 46.0, 39.0, 45.0, 39.0, 43.0, 25.0, 41.0, 37.0, 29.0, 30.0, 22.0, 22.0, 17.0, 10.0, 12.0, 13.0, 6.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.5928020477294922e-05, -2.5063753128051758e-05, -2.4199485778808594e-05, -2.333521842956543e-05, -2.2470951080322266e-05, -2.16066837310791e-05, -2.0742416381835938e-05, -1.9878149032592773e-05, -1.901388168334961e-05, -1.8149614334106445e-05, -1.728534698486328e-05, -1.6421079635620117e-05, -1.5556812286376953e-05, -1.4692544937133789e-05, -1.3828277587890625e-05, -1.2964010238647461e-05, -1.2099742889404297e-05, -1.1235475540161133e-05, -1.0371208190917969e-05, -9.506940841674805e-06, -8.64267349243164e-06, -7.778406143188477e-06, -6.9141387939453125e-06, -6.0498714447021484e-06, -5.185604095458984e-06, -4.32133674621582e-06, -3.4570693969726562e-06, -2.592802047729492e-06, -1.7285346984863281e-06, -8.642673492431641e-07, 0.0, 8.642673492431641e-07, 1.7285346984863281e-06, 2.592802047729492e-06, 3.4570693969726562e-06, 4.32133674621582e-06, 5.185604095458984e-06, 6.0498714447021484e-06, 6.9141387939453125e-06, 7.778406143188477e-06, 8.64267349243164e-06, 9.506940841674805e-06, 1.0371208190917969e-05, 1.1235475540161133e-05, 1.2099742889404297e-05, 1.2964010238647461e-05, 1.3828277587890625e-05, 1.4692544937133789e-05, 1.5556812286376953e-05, 1.6421079635620117e-05, 1.728534698486328e-05, 1.8149614334106445e-05, 1.901388168334961e-05, 1.9878149032592773e-05, 2.0742416381835938e-05, 2.16066837310791e-05, 2.2470951080322266e-05, 2.333521842956543e-05, 2.4199485778808594e-05, 2.5063753128051758e-05, 2.5928020477294922e-05, 2.6792287826538086e-05, 2.765655517578125e-05, 2.8520822525024414e-05, 2.9385089874267578e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 12.0, 15.0, 33.0, 27.0, 60.0, 97.0, 124.0, 222.0, 332.0, 434.0, 628.0, 908.0, 1330.0, 2007.0, 2885.0, 4248.0, 6269.0, 8792.0, 12554.0, 18469.0, 27754.0, 42550.0, 68448.0, 117158.0, 228273.0, 207990.0, 109193.0, 64280.0, 40553.0, 26452.0, 17738.0, 11963.0, 8289.0, 5741.0, 4004.0, 2737.0, 1904.0, 1292.0, 916.0, 572.0, 460.0, 314.0, 177.0, 104.0, 77.0, 47.0, 42.0, 28.0, 16.0, 19.0, 10.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.446533203125, -0.43297576904296875, -0.4194183349609375, -0.40586090087890625, -0.392303466796875, -0.37874603271484375, -0.3651885986328125, -0.35163116455078125, -0.33807373046875, -0.32451629638671875, -0.3109588623046875, -0.29740142822265625, -0.283843994140625, -0.27028656005859375, -0.2567291259765625, -0.24317169189453125, -0.2296142578125, -0.21605682373046875, -0.2024993896484375, -0.18894195556640625, -0.175384521484375, -0.16182708740234375, -0.1482696533203125, -0.13471221923828125, -0.12115478515625, -0.10759735107421875, -0.0940399169921875, -0.08048248291015625, -0.066925048828125, -0.05336761474609375, -0.0398101806640625, -0.02625274658203125, -0.0126953125, 0.00086212158203125, 0.0144195556640625, 0.02797698974609375, 0.041534423828125, 0.05509185791015625, 0.0686492919921875, 0.08220672607421875, 0.09576416015625, 0.10932159423828125, 0.1228790283203125, 0.13643646240234375, 0.149993896484375, 0.16355133056640625, 0.1771087646484375, 0.19066619873046875, 0.2042236328125, 0.21778106689453125, 0.2313385009765625, 0.24489593505859375, 0.258453369140625, 0.27201080322265625, 0.2855682373046875, 0.29912567138671875, 0.31268310546875, 0.32624053955078125, 0.3397979736328125, 0.35335540771484375, 0.366912841796875, 0.38047027587890625, 0.3940277099609375, 0.40758514404296875, 0.421142578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 7.0, 5.0, 5.0, 10.0, 8.0, 10.0, 17.0, 18.0, 23.0, 14.0, 32.0, 19.0, 25.0, 34.0, 40.0, 38.0, 42.0, 61.0, 55.0, 62.0, 64.0, 53.0, 48.0, 42.0, 39.0, 37.0, 32.0, 24.0, 18.0, 24.0, 11.0, 10.0, 12.0, 9.0, 7.0, 9.0, 9.0, 5.0, 8.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31591796875, -0.3057594299316406, -0.29560089111328125, -0.2854423522949219, -0.2752838134765625, -0.2651252746582031, -0.25496673583984375, -0.24480819702148438, -0.234649658203125, -0.22449111938476562, -0.21433258056640625, -0.20417404174804688, -0.1940155029296875, -0.18385696411132812, -0.17369842529296875, -0.16353988647460938, -0.15338134765625, -0.14322280883789062, -0.13306427001953125, -0.12290573120117188, -0.1127471923828125, -0.10258865356445312, -0.09243011474609375, -0.08227157592773438, -0.072113037109375, -0.061954498291015625, -0.05179595947265625, -0.041637420654296875, -0.0314788818359375, -0.021320343017578125, -0.01116180419921875, -0.001003265380859375, 0.0091552734375, 0.019313812255859375, 0.02947235107421875, 0.039630889892578125, 0.0497894287109375, 0.059947967529296875, 0.07010650634765625, 0.08026504516601562, 0.090423583984375, 0.10058212280273438, 0.11074066162109375, 0.12089920043945312, 0.1310577392578125, 0.14121627807617188, 0.15137481689453125, 0.16153335571289062, 0.17169189453125, 0.18185043334960938, 0.19200897216796875, 0.20216751098632812, 0.2123260498046875, 0.22248458862304688, 0.23264312744140625, 0.24280166625976562, 0.252960205078125, 0.2631187438964844, 0.27327728271484375, 0.2834358215332031, 0.2935943603515625, 0.3037528991699219, 0.31391143798828125, 0.3240699768066406, 0.334228515625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 10.0, 14.0, 15.0, 20.0, 21.0, 28.0, 36.0, 20.0, 45.0, 37.0, 56.0, 51.0, 36.0, 62.0, 52.0, 58.0, 56.0, 49.0, 45.0, 38.0, 24.0, 36.0, 30.0, 23.0, 30.0, 19.0, 18.0, 14.0, 13.0, 10.0, 8.0, 2.0, 2.0, 8.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.86077308654785, -18.159896850585938, -17.459020614624023, -16.75814437866211, -16.057270050048828, -15.356392860412598, -14.655517578125, -13.954641342163086, -13.253765106201172, -12.552888870239258, -11.852012634277344, -11.151137351989746, -10.450261116027832, -9.749384880065918, -9.04850959777832, -8.347633361816406, -7.646757125854492, -6.945880889892578, -6.245005130767822, -5.544129371643066, -4.843253135681152, -4.142376899719238, -3.4415011405944824, -2.7406253814697266, -2.0397491455078125, -1.3388731479644775, -0.6379971504211426, 0.06287884712219238, 0.7637548446655273, 1.4646308422088623, 2.1655068397521973, 2.866382598876953, 3.5672607421875, 4.268136978149414, 4.96901273727417, 5.669888496398926, 6.37076473236084, 7.071640968322754, 7.77251672744751, 8.473392486572266, 9.17426872253418, 9.875144958496094, 10.576021194458008, 11.276896476745605, 11.97777271270752, 12.678648948669434, 13.379524230957031, 14.080400466918945, 14.78127670288086, 15.482152938842773, 16.183029174804688, 16.8839054107666, 17.584781646728516, 18.285655975341797, 18.98653221130371, 19.687408447265625, 20.38828468322754, 21.089160919189453, 21.790037155151367, 22.49091339111328, 23.191787719726562, 23.892663955688477, 24.59354019165039, 25.294416427612305, 25.99529266357422]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 6.0, 1.0, 5.0, 5.0, 3.0, 5.0, 7.0, 8.0, 12.0, 8.0, 15.0, 11.0, 16.0, 12.0, 31.0, 23.0, 25.0, 28.0, 35.0, 47.0, 42.0, 40.0, 37.0, 48.0, 50.0, 49.0, 36.0, 38.0, 36.0, 31.0, 38.0, 38.0, 34.0, 25.0, 25.0, 27.0, 18.0, 20.0, 17.0, 9.0, 11.0, 5.0, 11.0, 6.0, 4.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.182872772216797, -20.446439743041992, -19.710006713867188, -18.973573684692383, -18.237140655517578, -17.500707626342773, -16.76427459716797, -16.027841567993164, -15.29140853881836, -14.554975509643555, -13.81854248046875, -13.082109451293945, -12.34567642211914, -11.609243392944336, -10.872810363769531, -10.136377334594727, -9.399944305419922, -8.663511276245117, -7.9270782470703125, -7.190645217895508, -6.454212188720703, -5.717779159545898, -4.981346130371094, -4.244913101196289, -3.5084800720214844, -2.7720470428466797, -2.035614013671875, -1.2991809844970703, -0.5627479553222656, 0.17368507385253906, 0.9101181030273438, 1.6465511322021484, 2.3829822540283203, 3.119415283203125, 3.8558483123779297, 4.592281341552734, 5.328714370727539, 6.065147399902344, 6.801580429077148, 7.538013458251953, 8.274446487426758, 9.010879516601562, 9.747312545776367, 10.483745574951172, 11.220178604125977, 11.956611633300781, 12.693044662475586, 13.42947769165039, 14.165910720825195, 14.90234375, 15.638776779174805, 16.37520980834961, 17.111642837524414, 17.84807586669922, 18.584508895874023, 19.320941925048828, 20.057374954223633, 20.793807983398438, 21.530241012573242, 22.266674041748047, 23.00310707092285, 23.739540100097656, 24.47597312927246, 25.212406158447266, 25.94883918762207]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 20.0, 25.0, 37.0, 57.0, 98.0, 178.0, 247.0, 394.0, 649.0, 1027.0, 1659.0, 2770.0, 4603.0, 7236.0, 11435.0, 17936.0, 27040.0, 39738.0, 55693.0, 74439.0, 92567.0, 107601.0, 114535.0, 111181.0, 98611.0, 82102.0, 62401.0, 45753.0, 31510.0, 20776.0, 13536.0, 8540.0, 5393.0, 3375.0, 2088.0, 1272.0, 787.0, 479.0, 271.0, 194.0, 115.0, 58.0, 41.0, 38.0, 13.0, 6.0, 14.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-14.890625, -14.4486083984375, -14.006591796875, -13.5645751953125, -13.12255859375, -12.6805419921875, -12.238525390625, -11.7965087890625, -11.3544921875, -10.9124755859375, -10.470458984375, -10.0284423828125, -9.58642578125, -9.1444091796875, -8.702392578125, -8.2603759765625, -7.818359375, -7.3763427734375, -6.934326171875, -6.4923095703125, -6.05029296875, -5.6082763671875, -5.166259765625, -4.7242431640625, -4.2822265625, -3.8402099609375, -3.398193359375, -2.9561767578125, -2.51416015625, -2.0721435546875, -1.630126953125, -1.1881103515625, -0.74609375, -0.3040771484375, 0.137939453125, 0.5799560546875, 1.02197265625, 1.4639892578125, 1.906005859375, 2.3480224609375, 2.7900390625, 3.2320556640625, 3.674072265625, 4.1160888671875, 4.55810546875, 5.0001220703125, 5.442138671875, 5.8841552734375, 6.326171875, 6.7681884765625, 7.210205078125, 7.6522216796875, 8.09423828125, 8.5362548828125, 8.978271484375, 9.4202880859375, 9.8623046875, 10.3043212890625, 10.746337890625, 11.1883544921875, 11.63037109375, 12.0723876953125, 12.514404296875, 12.9564208984375, 13.3984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 5.0, 13.0, 7.0, 11.0, 8.0, 9.0, 12.0, 19.0, 23.0, 18.0, 24.0, 44.0, 38.0, 35.0, 33.0, 37.0, 48.0, 40.0, 47.0, 47.0, 47.0, 43.0, 37.0, 51.0, 31.0, 37.0, 45.0, 27.0, 25.0, 24.0, 18.0, 25.0, 16.0, 10.0, 7.0, 5.0, 6.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.3974609375, -20.638671875, -19.8798828125, -19.12109375, -18.3623046875, -17.603515625, -16.8447265625, -16.0859375, -15.3271484375, -14.568359375, -13.8095703125, -13.05078125, -12.2919921875, -11.533203125, -10.7744140625, -10.015625, -9.2568359375, -8.498046875, -7.7392578125, -6.98046875, -6.2216796875, -5.462890625, -4.7041015625, -3.9453125, -3.1865234375, -2.427734375, -1.6689453125, -0.91015625, -0.1513671875, 0.607421875, 1.3662109375, 2.125, 2.8837890625, 3.642578125, 4.4013671875, 5.16015625, 5.9189453125, 6.677734375, 7.4365234375, 8.1953125, 8.9541015625, 9.712890625, 10.4716796875, 11.23046875, 11.9892578125, 12.748046875, 13.5068359375, 14.265625, 15.0244140625, 15.783203125, 16.5419921875, 17.30078125, 18.0595703125, 18.818359375, 19.5771484375, 20.3359375, 21.0947265625, 21.853515625, 22.6123046875, 23.37109375, 24.1298828125, 24.888671875, 25.6474609375, 26.40625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 14.0, 12.0, 31.0, 39.0, 74.0, 140.0, 231.0, 335.0, 594.0, 1044.0, 1840.0, 3051.0, 5523.0, 9330.0, 15938.0, 25908.0, 40623.0, 60761.0, 85115.0, 108571.0, 125831.0, 130328.0, 120180.0, 99736.0, 74615.0, 51912.0, 34234.0, 21305.0, 13066.0, 7658.0, 4367.0, 2619.0, 1397.0, 907.0, 465.0, 308.0, 182.0, 102.0, 60.0, 49.0, 24.0, 12.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9453125, -15.4359130859375, -14.926513671875, -14.4171142578125, -13.90771484375, -13.3983154296875, -12.888916015625, -12.3795166015625, -11.8701171875, -11.3607177734375, -10.851318359375, -10.3419189453125, -9.83251953125, -9.3231201171875, -8.813720703125, -8.3043212890625, -7.794921875, -7.2855224609375, -6.776123046875, -6.2667236328125, -5.75732421875, -5.2479248046875, -4.738525390625, -4.2291259765625, -3.7197265625, -3.2103271484375, -2.700927734375, -2.1915283203125, -1.68212890625, -1.1727294921875, -0.663330078125, -0.1539306640625, 0.35546875, 0.8648681640625, 1.374267578125, 1.8836669921875, 2.39306640625, 2.9024658203125, 3.411865234375, 3.9212646484375, 4.4306640625, 4.9400634765625, 5.449462890625, 5.9588623046875, 6.46826171875, 6.9776611328125, 7.487060546875, 7.9964599609375, 8.505859375, 9.0152587890625, 9.524658203125, 10.0340576171875, 10.54345703125, 11.0528564453125, 11.562255859375, 12.0716552734375, 12.5810546875, 13.0904541015625, 13.599853515625, 14.1092529296875, 14.61865234375, 15.1280517578125, 15.637451171875, 16.1468505859375, 16.65625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 2.0, 6.0, 8.0, 6.0, 9.0, 16.0, 17.0, 22.0, 24.0, 29.0, 35.0, 31.0, 31.0, 37.0, 40.0, 34.0, 39.0, 57.0, 70.0, 38.0, 58.0, 40.0, 58.0, 43.0, 32.0, 28.0, 29.0, 30.0, 17.0, 22.0, 22.0, 17.0, 21.0, 6.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.078125, -14.576171875, -14.07421875, -13.572265625, -13.0703125, -12.568359375, -12.06640625, -11.564453125, -11.0625, -10.560546875, -10.05859375, -9.556640625, -9.0546875, -8.552734375, -8.05078125, -7.548828125, -7.046875, -6.544921875, -6.04296875, -5.541015625, -5.0390625, -4.537109375, -4.03515625, -3.533203125, -3.03125, -2.529296875, -2.02734375, -1.525390625, -1.0234375, -0.521484375, -0.01953125, 0.482421875, 0.984375, 1.486328125, 1.98828125, 2.490234375, 2.9921875, 3.494140625, 3.99609375, 4.498046875, 5.0, 5.501953125, 6.00390625, 6.505859375, 7.0078125, 7.509765625, 8.01171875, 8.513671875, 9.015625, 9.517578125, 10.01953125, 10.521484375, 11.0234375, 11.525390625, 12.02734375, 12.529296875, 13.03125, 13.533203125, 14.03515625, 14.537109375, 15.0390625, 15.541015625, 16.04296875, 16.544921875, 17.046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 1.0, 8.0, 10.0, 4.0, 16.0, 26.0, 28.0, 43.0, 95.0, 112.0, 163.0, 233.0, 396.0, 567.0, 893.0, 1432.0, 2227.0, 3745.0, 6000.0, 9513.0, 15970.0, 25210.0, 39537.0, 58931.0, 83810.0, 109098.0, 128086.0, 132881.0, 121052.0, 98340.0, 72460.0, 50113.0, 33233.0, 20562.0, 12797.0, 8069.0, 4681.0, 2989.0, 1865.0, 1193.0, 762.0, 473.0, 340.0, 185.0, 147.0, 82.0, 63.0, 43.0, 34.0, 14.0, 11.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.62109375, -4.473388671875, -4.32568359375, -4.177978515625, -4.0302734375, -3.882568359375, -3.73486328125, -3.587158203125, -3.439453125, -3.291748046875, -3.14404296875, -2.996337890625, -2.8486328125, -2.700927734375, -2.55322265625, -2.405517578125, -2.2578125, -2.110107421875, -1.96240234375, -1.814697265625, -1.6669921875, -1.519287109375, -1.37158203125, -1.223876953125, -1.076171875, -0.928466796875, -0.78076171875, -0.633056640625, -0.4853515625, -0.337646484375, -0.18994140625, -0.042236328125, 0.10546875, 0.253173828125, 0.40087890625, 0.548583984375, 0.6962890625, 0.843994140625, 0.99169921875, 1.139404296875, 1.287109375, 1.434814453125, 1.58251953125, 1.730224609375, 1.8779296875, 2.025634765625, 2.17333984375, 2.321044921875, 2.46875, 2.616455078125, 2.76416015625, 2.911865234375, 3.0595703125, 3.207275390625, 3.35498046875, 3.502685546875, 3.650390625, 3.798095703125, 3.94580078125, 4.093505859375, 4.2412109375, 4.388916015625, 4.53662109375, 4.684326171875, 4.83203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 0.0, 9.0, 9.0, 12.0, 18.0, 17.0, 20.0, 25.0, 22.0, 27.0, 42.0, 48.0, 42.0, 54.0, 61.0, 39.0, 55.0, 49.0, 58.0, 56.0, 56.0, 47.0, 37.0, 38.0, 23.0, 23.0, 23.0, 18.0, 13.0, 15.0, 11.0, 11.0, 6.0, 4.0, 7.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0005578994750976562, -0.0005419217050075531, -0.00052594393491745, -0.0005099661648273468, -0.0004939883947372437, -0.0004780106246471405, -0.00046203285455703735, -0.0004460550844669342, -0.00043007731437683105, -0.0004140995442867279, -0.00039812177419662476, -0.0003821440041065216, -0.00036616623401641846, -0.0003501884639263153, -0.00033421069383621216, -0.000318232923746109, -0.00030225515365600586, -0.0002862773835659027, -0.00027029961347579956, -0.0002543218433856964, -0.00023834407329559326, -0.0002223663032054901, -0.00020638853311538696, -0.0001904107630252838, -0.00017443299293518066, -0.00015845522284507751, -0.00014247745275497437, -0.00012649968266487122, -0.00011052191257476807, -9.454414248466492e-05, -7.856637239456177e-05, -6.258860230445862e-05, -4.661083221435547e-05, -3.063306212425232e-05, -1.465529203414917e-05, 1.3224780559539795e-06, 1.730024814605713e-05, 3.327801823616028e-05, 4.925578832626343e-05, 6.523355841636658e-05, 8.121132850646973e-05, 9.718909859657288e-05, 0.00011316686868667603, 0.00012914463877677917, 0.00014512240886688232, 0.00016110017895698547, 0.00017707794904708862, 0.00019305571913719177, 0.00020903348922729492, 0.00022501125931739807, 0.00024098902940750122, 0.00025696679949760437, 0.0002729445695877075, 0.00028892233967781067, 0.0003049001097679138, 0.00032087787985801697, 0.0003368556499481201, 0.00035283342003822327, 0.0003688111901283264, 0.00038478896021842957, 0.0004007667303085327, 0.00041674450039863586, 0.000432722270488739, 0.00044870004057884216, 0.0004646778106689453]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 7.0, 9.0, 13.0, 24.0, 39.0, 69.0, 111.0, 210.0, 313.0, 531.0, 816.0, 1353.0, 2246.0, 3666.0, 6511.0, 11058.0, 18681.0, 31340.0, 51177.0, 78292.0, 110493.0, 137719.0, 148045.0, 136344.0, 109034.0, 76406.0, 49451.0, 30356.0, 18063.0, 10619.0, 6238.0, 3717.0, 2216.0, 1345.0, 801.0, 475.0, 297.0, 159.0, 122.0, 70.0, 50.0, 25.0, 21.0, 6.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.49542236328125, -5.3150634765625, -5.13470458984375, -4.954345703125, -4.77398681640625, -4.5936279296875, -4.41326904296875, -4.23291015625, -4.05255126953125, -3.8721923828125, -3.69183349609375, -3.511474609375, -3.33111572265625, -3.1507568359375, -2.97039794921875, -2.7900390625, -2.60968017578125, -2.4293212890625, -2.24896240234375, -2.068603515625, -1.88824462890625, -1.7078857421875, -1.52752685546875, -1.34716796875, -1.16680908203125, -0.9864501953125, -0.80609130859375, -0.625732421875, -0.44537353515625, -0.2650146484375, -0.08465576171875, 0.095703125, 0.27606201171875, 0.4564208984375, 0.63677978515625, 0.817138671875, 0.99749755859375, 1.1778564453125, 1.35821533203125, 1.53857421875, 1.71893310546875, 1.8992919921875, 2.07965087890625, 2.260009765625, 2.44036865234375, 2.6207275390625, 2.80108642578125, 2.9814453125, 3.16180419921875, 3.3421630859375, 3.52252197265625, 3.702880859375, 3.88323974609375, 4.0635986328125, 4.24395751953125, 4.42431640625, 4.60467529296875, 4.7850341796875, 4.96539306640625, 5.145751953125, 5.32611083984375, 5.5064697265625, 5.68682861328125, 5.8671875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 8.0, 9.0, 16.0, 17.0, 22.0, 22.0, 34.0, 31.0, 41.0, 61.0, 56.0, 50.0, 60.0, 54.0, 84.0, 62.0, 65.0, 56.0, 51.0, 37.0, 27.0, 27.0, 23.0, 21.0, 15.0, 15.0, 10.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.288360595703125, -2.18414306640625, -2.079925537109375, -1.9757080078125, -1.871490478515625, -1.76727294921875, -1.663055419921875, -1.558837890625, -1.454620361328125, -1.35040283203125, -1.246185302734375, -1.1419677734375, -1.037750244140625, -0.93353271484375, -0.829315185546875, -0.72509765625, -0.620880126953125, -0.51666259765625, -0.412445068359375, -0.3082275390625, -0.204010009765625, -0.09979248046875, 0.004425048828125, 0.108642578125, 0.212860107421875, 0.31707763671875, 0.421295166015625, 0.5255126953125, 0.629730224609375, 0.73394775390625, 0.838165283203125, 0.9423828125, 1.046600341796875, 1.15081787109375, 1.255035400390625, 1.3592529296875, 1.463470458984375, 1.56768798828125, 1.671905517578125, 1.776123046875, 1.880340576171875, 1.98455810546875, 2.088775634765625, 2.1929931640625, 2.297210693359375, 2.40142822265625, 2.505645751953125, 2.60986328125, 2.714080810546875, 2.81829833984375, 2.922515869140625, 3.0267333984375, 3.130950927734375, 3.23516845703125, 3.339385986328125, 3.443603515625, 3.547821044921875, 3.65203857421875, 3.756256103515625, 3.8604736328125, 3.964691162109375, 4.06890869140625, 4.173126220703125, 4.27734375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 3.0, 6.0, 8.0, 11.0, 23.0, 19.0, 28.0, 26.0, 22.0, 18.0, 32.0, 32.0, 43.0, 42.0, 40.0, 46.0, 54.0, 47.0, 41.0, 52.0, 53.0, 32.0, 40.0, 34.0, 37.0, 28.0, 28.0, 20.0, 29.0, 18.0, 20.0, 15.0, 15.0, 7.0, 4.0, 7.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-17.382543563842773, -16.76424217224121, -16.14594078063965, -15.52763843536377, -14.90933609008789, -14.291034698486328, -13.672733306884766, -13.054431915283203, -12.436129570007324, -11.817828178405762, -11.199525833129883, -10.58122444152832, -9.962923049926758, -9.344620704650879, -8.726319313049316, -8.108016967773438, -7.489715576171875, -6.871413707733154, -6.253111839294434, -5.634810447692871, -5.01650857925415, -4.39820671081543, -3.779905080795288, -3.1616034507751465, -2.543301582336426, -1.9249998331069946, -1.3066980838775635, -0.6883963346481323, -0.07009458541870117, 0.5482072830200195, 1.1665089130401611, 1.7848105430603027, 2.4031124114990234, 3.021414279937744, 3.6397159099578857, 4.258017539978027, 4.876319408416748, 5.494621276855469, 6.112922668457031, 6.731224536895752, 7.349526405334473, 7.967828273773193, 8.586130142211914, 9.204431533813477, 9.822732925415039, 10.441035270690918, 11.05933666229248, 11.67763900756836, 12.295940399169922, 12.914241790771484, 13.532544136047363, 14.150845527648926, 14.769147872924805, 15.387449264526367, 16.00575065612793, 16.624052047729492, 17.242355346679688, 17.86065673828125, 18.478958129882812, 19.097261428833008, 19.71556282043457, 20.333864212036133, 20.952165603637695, 21.570466995239258, 22.18876838684082]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 18.0, 4.0, 12.0, 11.0, 11.0, 16.0, 16.0, 15.0, 20.0, 25.0, 36.0, 30.0, 47.0, 48.0, 48.0, 39.0, 47.0, 33.0, 30.0, 56.0, 51.0, 33.0, 35.0, 30.0, 41.0, 29.0, 27.0, 18.0, 25.0, 29.0, 25.0, 23.0, 17.0, 10.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.262420654296875, -23.506309509277344, -22.750198364257812, -21.99408531188965, -21.237974166870117, -20.481863021850586, -19.725749969482422, -18.96963882446289, -18.21352767944336, -17.457416534423828, -16.701305389404297, -15.945192337036133, -15.189081192016602, -14.43297004699707, -13.676857948303223, -12.920745849609375, -12.164634704589844, -11.408523559570312, -10.652411460876465, -9.896299362182617, -9.140188217163086, -8.384077072143555, -7.627964973449707, -6.871853351593018, -6.115741729736328, -5.359630107879639, -4.603518486022949, -3.8474068641662598, -3.0912952423095703, -2.335183620452881, -1.5790719985961914, -0.822960376739502, -0.06684684753417969, 0.6892647743225098, 1.4453763961791992, 2.2014880180358887, 2.957599639892578, 3.7137112617492676, 4.469822883605957, 5.2259345054626465, 5.982046127319336, 6.738157749176025, 7.494269371032715, 8.250381469726562, 9.006492614746094, 9.762603759765625, 10.518715858459473, 11.27482795715332, 12.030939102172852, 12.787050247192383, 13.54316234588623, 14.299274444580078, 15.05538558959961, 15.81149673461914, 16.567607879638672, 17.323720932006836, 18.079832077026367, 18.8359432220459, 19.592056274414062, 20.348167419433594, 21.104278564453125, 21.860389709472656, 22.616500854492188, 23.37261390686035, 24.128725051879883]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 19.0, 25.0, 50.0, 69.0, 111.0, 198.0, 282.0, 489.0, 912.0, 1322.0, 2281.0, 3505.0, 5801.0, 9377.0, 15022.0, 24234.0, 37952.0, 59206.0, 90666.0, 137251.0, 199301.0, 277145.0, 362930.0, 437987.0, 480758.0, 475340.0, 425482.0, 346039.0, 261072.0, 185642.0, 127163.0, 83288.0, 53664.0, 33941.0, 21299.0, 13293.0, 8169.0, 5065.0, 3134.0, 1901.0, 1113.0, 682.0, 418.0, 252.0, 156.0, 103.0, 62.0, 46.0, 31.0, 17.0, 11.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-15.1015625, -14.6424560546875, -14.183349609375, -13.7242431640625, -13.26513671875, -12.8060302734375, -12.346923828125, -11.8878173828125, -11.4287109375, -10.9696044921875, -10.510498046875, -10.0513916015625, -9.59228515625, -9.1331787109375, -8.674072265625, -8.2149658203125, -7.755859375, -7.2967529296875, -6.837646484375, -6.3785400390625, -5.91943359375, -5.4603271484375, -5.001220703125, -4.5421142578125, -4.0830078125, -3.6239013671875, -3.164794921875, -2.7056884765625, -2.24658203125, -1.7874755859375, -1.328369140625, -0.8692626953125, -0.41015625, 0.0489501953125, 0.508056640625, 0.9671630859375, 1.42626953125, 1.8853759765625, 2.344482421875, 2.8035888671875, 3.2626953125, 3.7218017578125, 4.180908203125, 4.6400146484375, 5.09912109375, 5.5582275390625, 6.017333984375, 6.4764404296875, 6.935546875, 7.3946533203125, 7.853759765625, 8.3128662109375, 8.77197265625, 9.2310791015625, 9.690185546875, 10.1492919921875, 10.6083984375, 11.0675048828125, 11.526611328125, 11.9857177734375, 12.44482421875, 12.9039306640625, 13.363037109375, 13.8221435546875, 14.28125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 2.0, 9.0, 6.0, 12.0, 8.0, 13.0, 6.0, 10.0, 14.0, 16.0, 23.0, 33.0, 23.0, 31.0, 28.0, 38.0, 37.0, 48.0, 34.0, 44.0, 58.0, 39.0, 44.0, 43.0, 39.0, 31.0, 45.0, 28.0, 33.0, 29.0, 29.0, 20.0, 30.0, 17.0, 20.0, 14.0, 11.0, 7.0, 7.0, 1.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.390625, -16.81396484375, -16.2373046875, -15.66064453125, -15.083984375, -14.50732421875, -13.9306640625, -13.35400390625, -12.77734375, -12.20068359375, -11.6240234375, -11.04736328125, -10.470703125, -9.89404296875, -9.3173828125, -8.74072265625, -8.1640625, -7.58740234375, -7.0107421875, -6.43408203125, -5.857421875, -5.28076171875, -4.7041015625, -4.12744140625, -3.55078125, -2.97412109375, -2.3974609375, -1.82080078125, -1.244140625, -0.66748046875, -0.0908203125, 0.48583984375, 1.0625, 1.63916015625, 2.2158203125, 2.79248046875, 3.369140625, 3.94580078125, 4.5224609375, 5.09912109375, 5.67578125, 6.25244140625, 6.8291015625, 7.40576171875, 7.982421875, 8.55908203125, 9.1357421875, 9.71240234375, 10.2890625, 10.86572265625, 11.4423828125, 12.01904296875, 12.595703125, 13.17236328125, 13.7490234375, 14.32568359375, 14.90234375, 15.47900390625, 16.0556640625, 16.63232421875, 17.208984375, 17.78564453125, 18.3623046875, 18.93896484375, 19.515625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 7.0, 2.0, 8.0, 7.0, 14.0, 26.0, 50.0, 80.0, 101.0, 137.0, 265.0, 445.0, 762.0, 1266.0, 2015.0, 3409.0, 5493.0, 9170.0, 15056.0, 24284.0, 38661.0, 60722.0, 90923.0, 134255.0, 189047.0, 252133.0, 319002.0, 380012.0, 420544.0, 430301.0, 410113.0, 362120.0, 299282.0, 231723.0, 170890.0, 119857.0, 80918.0, 53350.0, 33845.0, 21218.0, 12836.0, 7940.0, 4631.0, 2887.0, 1736.0, 1049.0, 645.0, 407.0, 229.0, 160.0, 94.0, 56.0, 40.0, 22.0, 18.0, 16.0, 6.0, 5.0, 4.0, 2.0], "bins": [-14.109375, -13.686279296875, -13.26318359375, -12.840087890625, -12.4169921875, -11.993896484375, -11.57080078125, -11.147705078125, -10.724609375, -10.301513671875, -9.87841796875, -9.455322265625, -9.0322265625, -8.609130859375, -8.18603515625, -7.762939453125, -7.33984375, -6.916748046875, -6.49365234375, -6.070556640625, -5.6474609375, -5.224365234375, -4.80126953125, -4.378173828125, -3.955078125, -3.531982421875, -3.10888671875, -2.685791015625, -2.2626953125, -1.839599609375, -1.41650390625, -0.993408203125, -0.5703125, -0.147216796875, 0.27587890625, 0.698974609375, 1.1220703125, 1.545166015625, 1.96826171875, 2.391357421875, 2.814453125, 3.237548828125, 3.66064453125, 4.083740234375, 4.5068359375, 4.929931640625, 5.35302734375, 5.776123046875, 6.19921875, 6.622314453125, 7.04541015625, 7.468505859375, 7.8916015625, 8.314697265625, 8.73779296875, 9.160888671875, 9.583984375, 10.007080078125, 10.43017578125, 10.853271484375, 11.2763671875, 11.699462890625, 12.12255859375, 12.545654296875, 12.96875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 9.0, 12.0, 19.0, 13.0, 27.0, 31.0, 54.0, 43.0, 52.0, 74.0, 88.0, 108.0, 99.0, 137.0, 159.0, 145.0, 188.0, 203.0, 202.0, 219.0, 240.0, 200.0, 223.0, 204.0, 187.0, 170.0, 129.0, 144.0, 127.0, 97.0, 96.0, 82.0, 61.0, 49.0, 38.0, 28.0, 21.0, 24.0, 16.0, 13.0, 16.0, 9.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.254150390625, -7.98486328125, -7.715576171875, -7.4462890625, -7.177001953125, -6.90771484375, -6.638427734375, -6.369140625, -6.099853515625, -5.83056640625, -5.561279296875, -5.2919921875, -5.022705078125, -4.75341796875, -4.484130859375, -4.21484375, -3.945556640625, -3.67626953125, -3.406982421875, -3.1376953125, -2.868408203125, -2.59912109375, -2.329833984375, -2.060546875, -1.791259765625, -1.52197265625, -1.252685546875, -0.9833984375, -0.714111328125, -0.44482421875, -0.175537109375, 0.09375, 0.363037109375, 0.63232421875, 0.901611328125, 1.1708984375, 1.440185546875, 1.70947265625, 1.978759765625, 2.248046875, 2.517333984375, 2.78662109375, 3.055908203125, 3.3251953125, 3.594482421875, 3.86376953125, 4.133056640625, 4.40234375, 4.671630859375, 4.94091796875, 5.210205078125, 5.4794921875, 5.748779296875, 6.01806640625, 6.287353515625, 6.556640625, 6.825927734375, 7.09521484375, 7.364501953125, 7.6337890625, 7.903076171875, 8.17236328125, 8.441650390625, 8.7109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 13.0, 15.0, 17.0, 18.0, 22.0, 27.0, 24.0, 22.0, 35.0, 38.0, 61.0, 59.0, 65.0, 54.0, 54.0, 60.0, 48.0, 50.0, 43.0, 38.0, 31.0, 35.0, 33.0, 24.0, 19.0, 19.0, 14.0, 13.0, 10.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.391103744506836, -16.73643684387207, -16.081768035888672, -15.427101135253906, -14.772433280944824, -14.117765426635742, -13.463098526000977, -12.808430671691895, -12.153762817382812, -11.49909496307373, -10.844427108764648, -10.189760208129883, -9.5350923538208, -8.880424499511719, -8.225757598876953, -7.571089744567871, -6.916421890258789, -6.261754035949707, -5.607086658477783, -4.952419281005859, -4.297751426696777, -3.6430838108062744, -2.9884161949157715, -2.3337488174438477, -1.6790809631347656, -1.0244133472442627, -0.36974573135375977, 0.28492188453674316, 0.9395895004272461, 1.594257116317749, 2.248924732208252, 2.903592109680176, 3.558259963989258, 4.21292781829834, 4.867595195770264, 5.5222625732421875, 6.1769304275512695, 6.831598281860352, 7.486265659332275, 8.1409330368042, 8.795600891113281, 9.450268745422363, 10.104936599731445, 10.759603500366211, 11.414271354675293, 12.068939208984375, 12.72360610961914, 13.378273963928223, 14.032941818237305, 14.687609672546387, 15.342277526855469, 15.996944427490234, 16.651611328125, 17.3062801361084, 17.960947036743164, 18.615615844726562, 19.270282745361328, 19.924949645996094, 20.579618453979492, 21.234285354614258, 21.888954162597656, 22.543621063232422, 23.198287963867188, 23.852954864501953, 24.50762367248535]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 5.0, 12.0, 12.0, 11.0, 10.0, 12.0, 17.0, 21.0, 23.0, 17.0, 28.0, 35.0, 36.0, 39.0, 26.0, 43.0, 46.0, 33.0, 42.0, 32.0, 43.0, 43.0, 28.0, 37.0, 45.0, 46.0, 34.0, 36.0, 25.0, 22.0, 28.0, 19.0, 21.0, 12.0, 15.0, 13.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.653776168823242, -18.978042602539062, -18.30230712890625, -17.62657356262207, -16.95083999633789, -16.27510643005371, -15.599371910095215, -14.923637390136719, -14.247903823852539, -13.57217025756836, -12.896435737609863, -12.220701217651367, -11.544967651367188, -10.869234085083008, -10.193499565124512, -9.517765045166016, -8.842031478881836, -8.166297912597656, -7.49056339263916, -6.814829349517822, -6.139095306396484, -5.4633612632751465, -4.787627220153809, -4.111893177032471, -3.436159133911133, -2.760425090789795, -2.084691047668457, -1.4089570045471191, -0.7332229614257812, -0.05748891830444336, 0.6182451248168945, 1.2939791679382324, 1.9697151184082031, 2.645449161529541, 3.321183204650879, 3.996917247772217, 4.672651290893555, 5.348385334014893, 6.0241193771362305, 6.699853420257568, 7.375587463378906, 8.051321029663086, 8.727055549621582, 9.402790069580078, 10.078523635864258, 10.754257202148438, 11.429991722106934, 12.10572624206543, 12.78145980834961, 13.457193374633789, 14.132927894592285, 14.808662414550781, 15.484395980834961, 16.16012954711914, 16.835865020751953, 17.511598587036133, 18.187332153320312, 18.863065719604492, 19.538799285888672, 20.214534759521484, 20.890268325805664, 21.566001892089844, 22.241737365722656, 22.917470932006836, 23.593204498291016]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 4.0, 3.0, 8.0, 17.0, 26.0, 32.0, 48.0, 84.0, 106.0, 167.0, 208.0, 331.0, 463.0, 693.0, 990.0, 1431.0, 2159.0, 3156.0, 4638.0, 6816.0, 10047.0, 15383.0, 22235.0, 33401.0, 49836.0, 74654.0, 107590.0, 149401.0, 163078.0, 127550.0, 89593.0, 60281.0, 40792.0, 27121.0, 18195.0, 12147.0, 8459.0, 5603.0, 3713.0, 2549.0, 1827.0, 1150.0, 807.0, 538.0, 390.0, 256.0, 187.0, 131.0, 92.0, 61.0, 41.0, 23.0, 16.0, 23.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0], "bins": [-2.375, -2.30133056640625, -2.2276611328125, -2.15399169921875, -2.080322265625, -2.00665283203125, -1.9329833984375, -1.85931396484375, -1.78564453125, -1.71197509765625, -1.6383056640625, -1.56463623046875, -1.490966796875, -1.41729736328125, -1.3436279296875, -1.26995849609375, -1.1962890625, -1.12261962890625, -1.0489501953125, -0.97528076171875, -0.901611328125, -0.82794189453125, -0.7542724609375, -0.68060302734375, -0.60693359375, -0.53326416015625, -0.4595947265625, -0.38592529296875, -0.312255859375, -0.23858642578125, -0.1649169921875, -0.09124755859375, -0.017578125, 0.05609130859375, 0.1297607421875, 0.20343017578125, 0.277099609375, 0.35076904296875, 0.4244384765625, 0.49810791015625, 0.57177734375, 0.64544677734375, 0.7191162109375, 0.79278564453125, 0.866455078125, 0.94012451171875, 1.0137939453125, 1.08746337890625, 1.1611328125, 1.23480224609375, 1.3084716796875, 1.38214111328125, 1.455810546875, 1.52947998046875, 1.6031494140625, 1.67681884765625, 1.75048828125, 1.82415771484375, 1.8978271484375, 1.97149658203125, 2.045166015625, 2.11883544921875, 2.1925048828125, 2.26617431640625, 2.33984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 3.0, 4.0, 8.0, 8.0, 12.0, 10.0, 15.0, 18.0, 10.0, 17.0, 25.0, 27.0, 39.0, 34.0, 37.0, 46.0, 32.0, 38.0, 44.0, 50.0, 48.0, 45.0, 42.0, 30.0, 51.0, 48.0, 40.0, 34.0, 34.0, 27.0, 31.0, 17.0, 18.0, 11.0, 14.0, 14.0, 5.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.21875, -20.466796875, -19.71484375, -18.962890625, -18.2109375, -17.458984375, -16.70703125, -15.955078125, -15.203125, -14.451171875, -13.69921875, -12.947265625, -12.1953125, -11.443359375, -10.69140625, -9.939453125, -9.1875, -8.435546875, -7.68359375, -6.931640625, -6.1796875, -5.427734375, -4.67578125, -3.923828125, -3.171875, -2.419921875, -1.66796875, -0.916015625, -0.1640625, 0.587890625, 1.33984375, 2.091796875, 2.84375, 3.595703125, 4.34765625, 5.099609375, 5.8515625, 6.603515625, 7.35546875, 8.107421875, 8.859375, 9.611328125, 10.36328125, 11.115234375, 11.8671875, 12.619140625, 13.37109375, 14.123046875, 14.875, 15.626953125, 16.37890625, 17.130859375, 17.8828125, 18.634765625, 19.38671875, 20.138671875, 20.890625, 21.642578125, 22.39453125, 23.146484375, 23.8984375, 24.650390625, 25.40234375, 26.154296875, 26.90625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 10.0, 11.0, 12.0, 23.0, 37.0, 66.0, 97.0, 130.0, 186.0, 262.0, 445.0, 603.0, 953.0, 1322.0, 1936.0, 2893.0, 4356.0, 6610.0, 10519.0, 16504.0, 26828.0, 44233.0, 74289.0, 121823.0, 185033.0, 198271.0, 135473.0, 83165.0, 50402.0, 29939.0, 18537.0, 11381.0, 7490.0, 4837.0, 3185.0, 2193.0, 1442.0, 979.0, 656.0, 469.0, 320.0, 199.0, 150.0, 90.0, 68.0, 47.0, 20.0, 22.0, 11.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.697265625, -2.61328125, -2.529296875, -2.4453125, -2.361328125, -2.27734375, -2.193359375, -2.109375, -2.025390625, -1.94140625, -1.857421875, -1.7734375, -1.689453125, -1.60546875, -1.521484375, -1.4375, -1.353515625, -1.26953125, -1.185546875, -1.1015625, -1.017578125, -0.93359375, -0.849609375, -0.765625, -0.681640625, -0.59765625, -0.513671875, -0.4296875, -0.345703125, -0.26171875, -0.177734375, -0.09375, -0.009765625, 0.07421875, 0.158203125, 0.2421875, 0.326171875, 0.41015625, 0.494140625, 0.578125, 0.662109375, 0.74609375, 0.830078125, 0.9140625, 0.998046875, 1.08203125, 1.166015625, 1.25, 1.333984375, 1.41796875, 1.501953125, 1.5859375, 1.669921875, 1.75390625, 1.837890625, 1.921875, 2.005859375, 2.08984375, 2.173828125, 2.2578125, 2.341796875, 2.42578125, 2.509765625, 2.59375, 2.677734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 9.0, 5.0, 6.0, 10.0, 7.0, 17.0, 13.0, 20.0, 13.0, 26.0, 26.0, 25.0, 25.0, 33.0, 36.0, 40.0, 36.0, 28.0, 42.0, 49.0, 46.0, 55.0, 43.0, 46.0, 45.0, 36.0, 43.0, 28.0, 21.0, 23.0, 30.0, 28.0, 19.0, 20.0, 10.0, 8.0, 12.0, 5.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-15.3515625, -14.8994140625, -14.447265625, -13.9951171875, -13.54296875, -13.0908203125, -12.638671875, -12.1865234375, -11.734375, -11.2822265625, -10.830078125, -10.3779296875, -9.92578125, -9.4736328125, -9.021484375, -8.5693359375, -8.1171875, -7.6650390625, -7.212890625, -6.7607421875, -6.30859375, -5.8564453125, -5.404296875, -4.9521484375, -4.5, -4.0478515625, -3.595703125, -3.1435546875, -2.69140625, -2.2392578125, -1.787109375, -1.3349609375, -0.8828125, -0.4306640625, 0.021484375, 0.4736328125, 0.92578125, 1.3779296875, 1.830078125, 2.2822265625, 2.734375, 3.1865234375, 3.638671875, 4.0908203125, 4.54296875, 4.9951171875, 5.447265625, 5.8994140625, 6.3515625, 6.8037109375, 7.255859375, 7.7080078125, 8.16015625, 8.6123046875, 9.064453125, 9.5166015625, 9.96875, 10.4208984375, 10.873046875, 11.3251953125, 11.77734375, 12.2294921875, 12.681640625, 13.1337890625, 13.5859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 19.0, 19.0, 32.0, 51.0, 65.0, 111.0, 139.0, 227.0, 298.0, 476.0, 713.0, 1032.0, 1389.0, 2007.0, 3028.0, 4337.0, 6568.0, 10057.0, 16017.0, 25545.0, 43926.0, 79489.0, 154201.0, 277444.0, 191564.0, 94850.0, 51952.0, 30283.0, 18328.0, 11559.0, 7368.0, 4834.0, 3358.0, 2207.0, 1518.0, 1101.0, 777.0, 519.0, 362.0, 256.0, 160.0, 116.0, 83.0, 56.0, 29.0, 27.0, 13.0, 11.0, 17.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11810302734375, -0.11424922943115234, -0.11039543151855469, -0.10654163360595703, -0.10268783569335938, -0.09883403778076172, -0.09498023986816406, -0.0911264419555664, -0.08727264404296875, -0.0834188461303711, -0.07956504821777344, -0.07571125030517578, -0.07185745239257812, -0.06800365447998047, -0.06414985656738281, -0.060296058654785156, -0.0564422607421875, -0.052588462829589844, -0.04873466491699219, -0.04488086700439453, -0.041027069091796875, -0.03717327117919922, -0.03331947326660156, -0.029465675354003906, -0.02561187744140625, -0.021758079528808594, -0.017904281616210938, -0.014050483703613281, -0.010196685791015625, -0.006342887878417969, -0.0024890899658203125, 0.0013647079467773438, 0.005218505859375, 0.009072303771972656, 0.012926101684570312, 0.01677989959716797, 0.020633697509765625, 0.02448749542236328, 0.028341293334960938, 0.032195091247558594, 0.03604888916015625, 0.039902687072753906, 0.04375648498535156, 0.04761028289794922, 0.051464080810546875, 0.05531787872314453, 0.05917167663574219, 0.06302547454833984, 0.0668792724609375, 0.07073307037353516, 0.07458686828613281, 0.07844066619873047, 0.08229446411132812, 0.08614826202392578, 0.09000205993652344, 0.0938558578491211, 0.09770965576171875, 0.1015634536743164, 0.10541725158691406, 0.10927104949951172, 0.11312484741210938, 0.11697864532470703, 0.12083244323730469, 0.12468624114990234, 0.1285400390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 6.0, 10.0, 8.0, 12.0, 10.0, 11.0, 17.0, 22.0, 24.0, 32.0, 32.0, 34.0, 46.0, 45.0, 49.0, 43.0, 57.0, 30.0, 44.0, 48.0, 51.0, 33.0, 35.0, 37.0, 27.0, 36.0, 35.0, 23.0, 28.0, 27.0, 17.0, 14.0, 13.0, 8.0, 9.0, 7.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9609928131103516e-05, -1.8880702555179596e-05, -1.8151476979255676e-05, -1.7422251403331757e-05, -1.6693025827407837e-05, -1.5963800251483917e-05, -1.5234574675559998e-05, -1.4505349099636078e-05, -1.3776123523712158e-05, -1.3046897947788239e-05, -1.2317672371864319e-05, -1.15884467959404e-05, -1.085922122001648e-05, -1.012999564409256e-05, -9.40077006816864e-06, -8.67154449224472e-06, -7.9423189163208e-06, -7.213093340396881e-06, -6.4838677644729614e-06, -5.754642188549042e-06, -5.025416612625122e-06, -4.296191036701202e-06, -3.5669654607772827e-06, -2.837739884853363e-06, -2.1085143089294434e-06, -1.3792887330055237e-06, -6.50063157081604e-07, 7.916241884231567e-08, 8.083879947662354e-07, 1.537613570690155e-06, 2.2668391466140747e-06, 2.9960647225379944e-06, 3.725290298461914e-06, 4.454515874385834e-06, 5.183741450309753e-06, 5.912967026233673e-06, 6.642192602157593e-06, 7.3714181780815125e-06, 8.100643754005432e-06, 8.829869329929352e-06, 9.559094905853271e-06, 1.0288320481777191e-05, 1.101754605770111e-05, 1.174677163362503e-05, 1.247599720954895e-05, 1.320522278547287e-05, 1.393444836139679e-05, 1.466367393732071e-05, 1.539289951324463e-05, 1.612212508916855e-05, 1.6851350665092468e-05, 1.7580576241016388e-05, 1.8309801816940308e-05, 1.9039027392864227e-05, 1.9768252968788147e-05, 2.0497478544712067e-05, 2.1226704120635986e-05, 2.1955929696559906e-05, 2.2685155272483826e-05, 2.3414380848407745e-05, 2.4143606424331665e-05, 2.4872832000255585e-05, 2.5602057576179504e-05, 2.6331283152103424e-05, 2.7060508728027344e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 7.0, 15.0, 25.0, 32.0, 46.0, 67.0, 106.0, 154.0, 229.0, 324.0, 496.0, 804.0, 1333.0, 2028.0, 3080.0, 4841.0, 7854.0, 12327.0, 19440.0, 31695.0, 52558.0, 91879.0, 174781.0, 278941.0, 155076.0, 82982.0, 48384.0, 29294.0, 18198.0, 11540.0, 7210.0, 4637.0, 2947.0, 1823.0, 1179.0, 775.0, 512.0, 304.0, 225.0, 137.0, 81.0, 63.0, 42.0, 28.0, 19.0, 12.0, 11.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.277099609375, -0.2679901123046875, -0.258880615234375, -0.2497711181640625, -0.24066162109375, -0.2315521240234375, -0.222442626953125, -0.2133331298828125, -0.2042236328125, -0.1951141357421875, -0.186004638671875, -0.1768951416015625, -0.16778564453125, -0.1586761474609375, -0.149566650390625, -0.1404571533203125, -0.13134765625, -0.1222381591796875, -0.113128662109375, -0.1040191650390625, -0.09490966796875, -0.0858001708984375, -0.076690673828125, -0.0675811767578125, -0.0584716796875, -0.0493621826171875, -0.040252685546875, -0.0311431884765625, -0.02203369140625, -0.0129241943359375, -0.003814697265625, 0.0052947998046875, 0.014404296875, 0.0235137939453125, 0.032623291015625, 0.0417327880859375, 0.05084228515625, 0.0599517822265625, 0.069061279296875, 0.0781707763671875, 0.0872802734375, 0.0963897705078125, 0.105499267578125, 0.1146087646484375, 0.12371826171875, 0.1328277587890625, 0.141937255859375, 0.1510467529296875, 0.16015625, 0.1692657470703125, 0.178375244140625, 0.1874847412109375, 0.19659423828125, 0.2057037353515625, 0.214813232421875, 0.2239227294921875, 0.2330322265625, 0.2421417236328125, 0.251251220703125, 0.2603607177734375, 0.26947021484375, 0.2785797119140625, 0.287689208984375, 0.2967987060546875, 0.305908203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 1.0, 2.0, 5.0, 6.0, 4.0, 3.0, 10.0, 11.0, 12.0, 15.0, 23.0, 19.0, 34.0, 29.0, 36.0, 58.0, 54.0, 56.0, 60.0, 71.0, 47.0, 79.0, 58.0, 45.0, 48.0, 36.0, 27.0, 18.0, 23.0, 14.0, 16.0, 16.0, 5.0, 13.0, 10.0, 8.0, 2.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2027587890625, -0.19663238525390625, -0.1905059814453125, -0.18437957763671875, -0.178253173828125, -0.17212677001953125, -0.1660003662109375, -0.15987396240234375, -0.15374755859375, -0.14762115478515625, -0.1414947509765625, -0.13536834716796875, -0.129241943359375, -0.12311553955078125, -0.1169891357421875, -0.11086273193359375, -0.104736328125, -0.09860992431640625, -0.0924835205078125, -0.08635711669921875, -0.080230712890625, -0.07410430908203125, -0.0679779052734375, -0.06185150146484375, -0.05572509765625, -0.04959869384765625, -0.0434722900390625, -0.03734588623046875, -0.031219482421875, -0.02509307861328125, -0.0189666748046875, -0.01284027099609375, -0.0067138671875, -0.00058746337890625, 0.0055389404296875, 0.01166534423828125, 0.017791748046875, 0.02391815185546875, 0.0300445556640625, 0.03617095947265625, 0.04229736328125, 0.04842376708984375, 0.0545501708984375, 0.06067657470703125, 0.066802978515625, 0.07292938232421875, 0.0790557861328125, 0.08518218994140625, 0.09130859375, 0.09743499755859375, 0.1035614013671875, 0.10968780517578125, 0.115814208984375, 0.12194061279296875, 0.1280670166015625, 0.13419342041015625, 0.14031982421875, 0.14644622802734375, 0.1525726318359375, 0.15869903564453125, 0.164825439453125, 0.17095184326171875, 0.1770782470703125, 0.18320465087890625, 0.1893310546875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 2.0, 14.0, 11.0, 16.0, 14.0, 17.0, 31.0, 29.0, 24.0, 26.0, 36.0, 46.0, 62.0, 63.0, 62.0, 49.0, 59.0, 56.0, 47.0, 49.0, 40.0, 33.0, 27.0, 35.0, 37.0, 26.0, 13.0, 16.0, 8.0, 13.0, 10.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.597570419311523, -16.947839736938477, -16.298107147216797, -15.64837646484375, -14.998645782470703, -14.348915100097656, -13.699183464050293, -13.04945182800293, -12.399721145629883, -11.749990463256836, -11.100258827209473, -10.45052719116211, -9.800796508789062, -9.151065826416016, -8.501334190368652, -7.851603031158447, -7.201871871948242, -6.552140712738037, -5.902409553527832, -5.252678394317627, -4.602947235107422, -3.953216075897217, -3.3034849166870117, -2.6537537574768066, -2.0040225982666016, -1.3542914390563965, -0.7045602798461914, -0.05482912063598633, 0.5949020385742188, 1.2446331977844238, 1.894364356994629, 2.544095516204834, 3.193826675415039, 3.843557834625244, 4.493288993835449, 5.143020153045654, 5.792751312255859, 6.4424824714660645, 7.0922136306762695, 7.741944789886475, 8.39167594909668, 9.041406631469727, 9.69113826751709, 10.340869903564453, 10.9906005859375, 11.640331268310547, 12.29006290435791, 12.939794540405273, 13.58952522277832, 14.239255905151367, 14.88898754119873, 15.538719177246094, 16.18844985961914, 16.838180541992188, 17.487911224365234, 18.137643814086914, 18.78737449645996, 19.437105178833008, 20.086837768554688, 20.736568450927734, 21.38629913330078, 22.036029815673828, 22.685760498046875, 23.335493087768555, 23.9852237701416]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 3.0, 6.0, 4.0, 5.0, 12.0, 11.0, 12.0, 10.0, 12.0, 15.0, 21.0, 23.0, 15.0, 32.0, 32.0, 35.0, 39.0, 29.0, 40.0, 46.0, 33.0, 38.0, 40.0, 38.0, 43.0, 29.0, 36.0, 45.0, 48.0, 35.0, 35.0, 25.0, 23.0, 30.0, 16.0, 22.0, 13.0, 14.0, 14.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.7023983001709, -19.03127098083496, -18.360143661499023, -17.689016342163086, -17.01789093017578, -16.346763610839844, -15.675636291503906, -15.004508972167969, -14.333381652832031, -13.662254333496094, -12.991127014160156, -12.320000648498535, -11.648873329162598, -10.97774600982666, -10.306619644165039, -9.635492324829102, -8.964365005493164, -8.293237686157227, -7.622110843658447, -6.950984001159668, -6.2798566818237305, -5.608729362487793, -4.937602519989014, -4.266475677490234, -3.595348358154297, -2.9242212772369385, -2.25309419631958, -1.5819671154022217, -0.9108400344848633, -0.23971295356750488, 0.4314141273498535, 1.1025409698486328, 1.7736663818359375, 2.444793462753296, 3.1159205436706543, 3.7870476245880127, 4.458174705505371, 5.129302024841309, 5.800428867340088, 6.471555709838867, 7.142683029174805, 7.813810348510742, 8.48493766784668, 9.1560640335083, 9.827191352844238, 10.498318672180176, 11.169445037841797, 11.840572357177734, 12.511699676513672, 13.18282699584961, 13.853954315185547, 14.525080680847168, 15.196208000183105, 15.867335319519043, 16.538461685180664, 17.2095890045166, 17.88071632385254, 18.551843643188477, 19.222970962524414, 19.89409828186035, 20.565223693847656, 21.236351013183594, 21.90747833251953, 22.57860565185547, 23.249732971191406]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 11.0, 19.0, 21.0, 33.0, 62.0, 96.0, 114.0, 193.0, 297.0, 489.0, 697.0, 1037.0, 1685.0, 2510.0, 3636.0, 5448.0, 8186.0, 11719.0, 17131.0, 24032.0, 33268.0, 44214.0, 56486.0, 69161.0, 81381.0, 89816.0, 94140.0, 92767.0, 86058.0, 76079.0, 63255.0, 50963.0, 38677.0, 29093.0, 20813.0, 14437.0, 10159.0, 6882.0, 4477.0, 3139.0, 2055.0, 1311.0, 872.0, 552.0, 366.0, 260.0, 174.0, 105.0, 70.0, 40.0, 29.0, 18.0, 9.0, 12.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.87158203125, -9.5400390625, -9.20849609375, -8.876953125, -8.54541015625, -8.2138671875, -7.88232421875, -7.55078125, -7.21923828125, -6.8876953125, -6.55615234375, -6.224609375, -5.89306640625, -5.5615234375, -5.22998046875, -4.8984375, -4.56689453125, -4.2353515625, -3.90380859375, -3.572265625, -3.24072265625, -2.9091796875, -2.57763671875, -2.24609375, -1.91455078125, -1.5830078125, -1.25146484375, -0.919921875, -0.58837890625, -0.2568359375, 0.07470703125, 0.40625, 0.73779296875, 1.0693359375, 1.40087890625, 1.732421875, 2.06396484375, 2.3955078125, 2.72705078125, 3.05859375, 3.39013671875, 3.7216796875, 4.05322265625, 4.384765625, 4.71630859375, 5.0478515625, 5.37939453125, 5.7109375, 6.04248046875, 6.3740234375, 6.70556640625, 7.037109375, 7.36865234375, 7.7001953125, 8.03173828125, 8.36328125, 8.69482421875, 9.0263671875, 9.35791015625, 9.689453125, 10.02099609375, 10.3525390625, 10.68408203125, 11.015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 6.0, 11.0, 6.0, 11.0, 16.0, 11.0, 10.0, 18.0, 21.0, 33.0, 30.0, 33.0, 25.0, 31.0, 33.0, 42.0, 40.0, 42.0, 46.0, 36.0, 44.0, 37.0, 48.0, 41.0, 41.0, 39.0, 36.0, 32.0, 30.0, 21.0, 31.0, 16.0, 18.0, 13.0, 8.0, 15.0, 10.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.96875, -19.2666015625, -18.564453125, -17.8623046875, -17.16015625, -16.4580078125, -15.755859375, -15.0537109375, -14.3515625, -13.6494140625, -12.947265625, -12.2451171875, -11.54296875, -10.8408203125, -10.138671875, -9.4365234375, -8.734375, -8.0322265625, -7.330078125, -6.6279296875, -5.92578125, -5.2236328125, -4.521484375, -3.8193359375, -3.1171875, -2.4150390625, -1.712890625, -1.0107421875, -0.30859375, 0.3935546875, 1.095703125, 1.7978515625, 2.5, 3.2021484375, 3.904296875, 4.6064453125, 5.30859375, 6.0107421875, 6.712890625, 7.4150390625, 8.1171875, 8.8193359375, 9.521484375, 10.2236328125, 10.92578125, 11.6279296875, 12.330078125, 13.0322265625, 13.734375, 14.4365234375, 15.138671875, 15.8408203125, 16.54296875, 17.2451171875, 17.947265625, 18.6494140625, 19.3515625, 20.0537109375, 20.755859375, 21.4580078125, 22.16015625, 22.8623046875, 23.564453125, 24.2666015625, 24.96875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 5.0, 13.0, 11.0, 14.0, 25.0, 47.0, 60.0, 101.0, 162.0, 290.0, 413.0, 664.0, 1065.0, 1746.0, 2694.0, 4240.0, 6452.0, 10136.0, 15128.0, 22585.0, 32309.0, 44710.0, 59785.0, 76515.0, 91959.0, 102172.0, 106156.0, 102578.0, 90686.0, 75383.0, 59514.0, 44631.0, 31594.0, 21980.0, 15002.0, 9832.0, 6478.0, 4163.0, 2787.0, 1631.0, 1053.0, 672.0, 405.0, 261.0, 142.0, 124.0, 58.0, 48.0, 29.0, 22.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.4296875, -11.0546875, -10.6796875, -10.3046875, -9.9296875, -9.5546875, -9.1796875, -8.8046875, -8.4296875, -8.0546875, -7.6796875, -7.3046875, -6.9296875, -6.5546875, -6.1796875, -5.8046875, -5.4296875, -5.0546875, -4.6796875, -4.3046875, -3.9296875, -3.5546875, -3.1796875, -2.8046875, -2.4296875, -2.0546875, -1.6796875, -1.3046875, -0.9296875, -0.5546875, -0.1796875, 0.1953125, 0.5703125, 0.9453125, 1.3203125, 1.6953125, 2.0703125, 2.4453125, 2.8203125, 3.1953125, 3.5703125, 3.9453125, 4.3203125, 4.6953125, 5.0703125, 5.4453125, 5.8203125, 6.1953125, 6.5703125, 6.9453125, 7.3203125, 7.6953125, 8.0703125, 8.4453125, 8.8203125, 9.1953125, 9.5703125, 9.9453125, 10.3203125, 10.6953125, 11.0703125, 11.4453125, 11.8203125, 12.1953125, 12.5703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 8.0, 15.0, 11.0, 12.0, 18.0, 20.0, 19.0, 12.0, 38.0, 30.0, 26.0, 24.0, 28.0, 39.0, 37.0, 35.0, 56.0, 61.0, 36.0, 38.0, 39.0, 48.0, 36.0, 39.0, 41.0, 23.0, 27.0, 16.0, 23.0, 28.0, 21.0, 14.0, 17.0, 14.0, 9.0, 9.0, 8.0, 6.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.4375, -14.0103759765625, -13.583251953125, -13.1561279296875, -12.72900390625, -12.3018798828125, -11.874755859375, -11.4476318359375, -11.0205078125, -10.5933837890625, -10.166259765625, -9.7391357421875, -9.31201171875, -8.8848876953125, -8.457763671875, -8.0306396484375, -7.603515625, -7.1763916015625, -6.749267578125, -6.3221435546875, -5.89501953125, -5.4678955078125, -5.040771484375, -4.6136474609375, -4.1865234375, -3.7593994140625, -3.332275390625, -2.9051513671875, -2.47802734375, -2.0509033203125, -1.623779296875, -1.1966552734375, -0.76953125, -0.3424072265625, 0.084716796875, 0.5118408203125, 0.93896484375, 1.3660888671875, 1.793212890625, 2.2203369140625, 2.6474609375, 3.0745849609375, 3.501708984375, 3.9288330078125, 4.35595703125, 4.7830810546875, 5.210205078125, 5.6373291015625, 6.064453125, 6.4915771484375, 6.918701171875, 7.3458251953125, 7.77294921875, 8.2000732421875, 8.627197265625, 9.0543212890625, 9.4814453125, 9.9085693359375, 10.335693359375, 10.7628173828125, 11.18994140625, 11.6170654296875, 12.044189453125, 12.4713134765625, 12.8984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 16.0, 29.0, 42.0, 52.0, 75.0, 122.0, 191.0, 342.0, 534.0, 800.0, 1353.0, 2161.0, 3532.0, 5730.0, 9421.0, 15118.0, 23927.0, 36197.0, 53478.0, 74127.0, 95623.0, 113529.0, 121854.0, 118506.0, 104404.0, 83998.0, 62255.0, 43320.0, 29220.0, 18432.0, 11658.0, 7060.0, 4402.0, 2623.0, 1632.0, 1081.0, 653.0, 374.0, 228.0, 171.0, 109.0, 63.0, 44.0, 23.0, 17.0, 16.0, 2.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.9459228515625, -3.821533203125, -3.6971435546875, -3.57275390625, -3.4483642578125, -3.323974609375, -3.1995849609375, -3.0751953125, -2.9508056640625, -2.826416015625, -2.7020263671875, -2.57763671875, -2.4532470703125, -2.328857421875, -2.2044677734375, -2.080078125, -1.9556884765625, -1.831298828125, -1.7069091796875, -1.58251953125, -1.4581298828125, -1.333740234375, -1.2093505859375, -1.0849609375, -0.9605712890625, -0.836181640625, -0.7117919921875, -0.58740234375, -0.4630126953125, -0.338623046875, -0.2142333984375, -0.08984375, 0.0345458984375, 0.158935546875, 0.2833251953125, 0.40771484375, 0.5321044921875, 0.656494140625, 0.7808837890625, 0.9052734375, 1.0296630859375, 1.154052734375, 1.2784423828125, 1.40283203125, 1.5272216796875, 1.651611328125, 1.7760009765625, 1.900390625, 2.0247802734375, 2.149169921875, 2.2735595703125, 2.39794921875, 2.5223388671875, 2.646728515625, 2.7711181640625, 2.8955078125, 3.0198974609375, 3.144287109375, 3.2686767578125, 3.39306640625, 3.5174560546875, 3.641845703125, 3.7662353515625, 3.890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 11.0, 11.0, 18.0, 18.0, 21.0, 14.0, 18.0, 16.0, 34.0, 37.0, 25.0, 27.0, 34.0, 29.0, 33.0, 40.0, 34.0, 44.0, 44.0, 30.0, 36.0, 33.0, 34.0, 45.0, 30.0, 36.0, 29.0, 31.0, 30.0, 21.0, 16.0, 15.0, 11.0, 14.0, 12.0, 9.0, 9.0, 9.0, 5.0, 11.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00035834312438964844, -0.00034697726368904114, -0.00033561140298843384, -0.00032424554228782654, -0.00031287968158721924, -0.00030151382088661194, -0.00029014796018600464, -0.00027878209948539734, -0.00026741623878479004, -0.00025605037808418274, -0.00024468451738357544, -0.00023331865668296814, -0.00022195279598236084, -0.00021058693528175354, -0.00019922107458114624, -0.00018785521388053894, -0.00017648935317993164, -0.00016512349247932434, -0.00015375763177871704, -0.00014239177107810974, -0.00013102591037750244, -0.00011966004967689514, -0.00010829418897628784, -9.692832827568054e-05, -8.556246757507324e-05, -7.419660687446594e-05, -6.283074617385864e-05, -5.146488547325134e-05, -4.009902477264404e-05, -2.8733164072036743e-05, -1.7367303371429443e-05, -6.0014426708221436e-06, 5.364418029785156e-06, 1.6730278730392456e-05, 2.8096139430999756e-05, 3.9462000131607056e-05, 5.0827860832214355e-05, 6.219372153282166e-05, 7.355958223342896e-05, 8.492544293403625e-05, 9.629130363464355e-05, 0.00010765716433525085, 0.00011902302503585815, 0.00013038888573646545, 0.00014175474643707275, 0.00015312060713768005, 0.00016448646783828735, 0.00017585232853889465, 0.00018721818923950195, 0.00019858404994010925, 0.00020994991064071655, 0.00022131577134132385, 0.00023268163204193115, 0.00024404749274253845, 0.00025541335344314575, 0.00026677921414375305, 0.00027814507484436035, 0.00028951093554496765, 0.00030087679624557495, 0.00031224265694618225, 0.00032360851764678955, 0.00033497437834739685, 0.00034634023904800415, 0.00035770609974861145, 0.00036907196044921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 7.0, 8.0, 11.0, 16.0, 31.0, 38.0, 60.0, 99.0, 188.0, 278.0, 509.0, 747.0, 1299.0, 2258.0, 3480.0, 5880.0, 9471.0, 15621.0, 24944.0, 39148.0, 57979.0, 81350.0, 105684.0, 123655.0, 129844.0, 121090.0, 100797.0, 76097.0, 53569.0, 35221.0, 22827.0, 14195.0, 8670.0, 5373.0, 3183.0, 1941.0, 1172.0, 705.0, 387.0, 269.0, 165.0, 122.0, 54.0, 34.0, 31.0, 21.0, 10.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0], "bins": [-4.76953125, -4.630859375, -4.4921875, -4.353515625, -4.21484375, -4.076171875, -3.9375, -3.798828125, -3.66015625, -3.521484375, -3.3828125, -3.244140625, -3.10546875, -2.966796875, -2.828125, -2.689453125, -2.55078125, -2.412109375, -2.2734375, -2.134765625, -1.99609375, -1.857421875, -1.71875, -1.580078125, -1.44140625, -1.302734375, -1.1640625, -1.025390625, -0.88671875, -0.748046875, -0.609375, -0.470703125, -0.33203125, -0.193359375, -0.0546875, 0.083984375, 0.22265625, 0.361328125, 0.5, 0.638671875, 0.77734375, 0.916015625, 1.0546875, 1.193359375, 1.33203125, 1.470703125, 1.609375, 1.748046875, 1.88671875, 2.025390625, 2.1640625, 2.302734375, 2.44140625, 2.580078125, 2.71875, 2.857421875, 2.99609375, 3.134765625, 3.2734375, 3.412109375, 3.55078125, 3.689453125, 3.828125, 3.966796875, 4.10546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 5.0, 3.0, 3.0, 5.0, 9.0, 14.0, 15.0, 22.0, 24.0, 27.0, 30.0, 32.0, 37.0, 37.0, 45.0, 50.0, 48.0, 56.0, 50.0, 57.0, 50.0, 48.0, 45.0, 38.0, 45.0, 32.0, 32.0, 20.0, 25.0, 13.0, 19.0, 13.0, 7.0, 8.0, 8.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-2.533203125, -2.46221923828125, -2.3912353515625, -2.32025146484375, -2.249267578125, -2.17828369140625, -2.1072998046875, -2.03631591796875, -1.96533203125, -1.89434814453125, -1.8233642578125, -1.75238037109375, -1.681396484375, -1.61041259765625, -1.5394287109375, -1.46844482421875, -1.3974609375, -1.32647705078125, -1.2554931640625, -1.18450927734375, -1.113525390625, -1.04254150390625, -0.9715576171875, -0.90057373046875, -0.82958984375, -0.75860595703125, -0.6876220703125, -0.61663818359375, -0.545654296875, -0.47467041015625, -0.4036865234375, -0.33270263671875, -0.26171875, -0.19073486328125, -0.1197509765625, -0.04876708984375, 0.022216796875, 0.09320068359375, 0.1641845703125, 0.23516845703125, 0.30615234375, 0.37713623046875, 0.4481201171875, 0.51910400390625, 0.590087890625, 0.66107177734375, 0.7320556640625, 0.80303955078125, 0.8740234375, 0.94500732421875, 1.0159912109375, 1.08697509765625, 1.157958984375, 1.22894287109375, 1.2999267578125, 1.37091064453125, 1.44189453125, 1.51287841796875, 1.5838623046875, 1.65484619140625, 1.725830078125, 1.79681396484375, 1.8677978515625, 1.93878173828125, 2.009765625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 7.0, 8.0, 16.0, 20.0, 18.0, 16.0, 22.0, 28.0, 28.0, 22.0, 40.0, 46.0, 60.0, 56.0, 70.0, 55.0, 45.0, 57.0, 44.0, 43.0, 36.0, 47.0, 38.0, 32.0, 16.0, 18.0, 19.0, 13.0, 12.0, 9.0, 12.0, 6.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.87759780883789, -17.261014938354492, -16.644432067871094, -16.027851104736328, -15.41126823425293, -14.794685363769531, -14.17810344696045, -13.561521530151367, -12.944938659667969, -12.32835578918457, -11.711773872375488, -11.095191955566406, -10.478609085083008, -9.86202621459961, -9.245444297790527, -8.628862380981445, -8.012279510498047, -7.395697116851807, -6.779114723205566, -6.162532329559326, -5.545949935913086, -4.929367542266846, -4.3127851486206055, -3.6962027549743652, -3.079620361328125, -2.4630379676818848, -1.8464555740356445, -1.2298731803894043, -0.6132907867431641, 0.003291606903076172, 0.6198740005493164, 1.2364563941955566, 1.853036880493164, 2.4696192741394043, 3.0862016677856445, 3.7027840614318848, 4.319366455078125, 4.935948848724365, 5.5525312423706055, 6.169113636016846, 6.785696029663086, 7.402278423309326, 8.018860816955566, 8.635442733764648, 9.252025604248047, 9.868608474731445, 10.485190391540527, 11.10177230834961, 11.718355178833008, 12.334938049316406, 12.951519966125488, 13.56810188293457, 14.184684753417969, 14.801267623901367, 15.41784954071045, 16.03443145751953, 16.65101432800293, 17.267597198486328, 17.884178161621094, 18.500761032104492, 19.11734390258789, 19.73392677307129, 20.350509643554688, 20.967090606689453, 21.58367347717285]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 10.0, 4.0, 10.0, 5.0, 9.0, 17.0, 14.0, 16.0, 24.0, 28.0, 19.0, 40.0, 35.0, 32.0, 37.0, 35.0, 44.0, 46.0, 37.0, 45.0, 49.0, 43.0, 44.0, 45.0, 37.0, 51.0, 25.0, 35.0, 25.0, 33.0, 23.0, 10.0, 20.0, 13.0, 13.0, 4.0, 10.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.188093185424805, -20.439037322998047, -19.689983367919922, -18.940929412841797, -18.19187355041504, -17.44281768798828, -16.693763732910156, -15.944708824157715, -15.195653915405273, -14.446599006652832, -13.69754409790039, -12.94848918914795, -12.199434280395508, -11.450379371643066, -10.701324462890625, -9.952269554138184, -9.203214645385742, -8.4541597366333, -7.705104827880859, -6.956049919128418, -6.206995010375977, -5.457940101623535, -4.708885192871094, -3.9598302841186523, -3.210775375366211, -2.4617204666137695, -1.7126655578613281, -0.9636106491088867, -0.2145557403564453, 0.5344991683959961, 1.2835540771484375, 2.032608985900879, 2.7816638946533203, 3.5307188034057617, 4.279773712158203, 5.0288286209106445, 5.777883529663086, 6.526938438415527, 7.275993347167969, 8.02504825592041, 8.774103164672852, 9.523158073425293, 10.272212982177734, 11.021267890930176, 11.770322799682617, 12.519377708435059, 13.2684326171875, 14.017487525939941, 14.766542434692383, 15.515597343444824, 16.264652252197266, 17.01370620727539, 17.76276206970215, 18.511817932128906, 19.26087188720703, 20.009925842285156, 20.758981704711914, 21.508037567138672, 22.257091522216797, 23.006145477294922, 23.75520133972168, 24.504257202148438, 25.253311157226562, 26.002365112304688, 26.751420974731445]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 21.0, 43.0, 88.0, 141.0, 221.0, 392.0, 677.0, 1208.0, 2004.0, 3428.0, 5857.0, 9886.0, 16433.0, 26843.0, 44531.0, 71433.0, 111984.0, 170088.0, 246885.0, 335215.0, 422519.0, 483200.0, 498440.0, 461718.0, 387230.0, 296850.0, 213058.0, 143953.0, 92761.0, 58143.0, 35848.0, 21844.0, 12836.0, 7564.0, 4523.0, 2692.0, 1519.0, 908.0, 550.0, 283.0, 198.0, 99.0, 50.0, 42.0, 38.0, 16.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.078125, -12.61572265625, -12.1533203125, -11.69091796875, -11.228515625, -10.76611328125, -10.3037109375, -9.84130859375, -9.37890625, -8.91650390625, -8.4541015625, -7.99169921875, -7.529296875, -7.06689453125, -6.6044921875, -6.14208984375, -5.6796875, -5.21728515625, -4.7548828125, -4.29248046875, -3.830078125, -3.36767578125, -2.9052734375, -2.44287109375, -1.98046875, -1.51806640625, -1.0556640625, -0.59326171875, -0.130859375, 0.33154296875, 0.7939453125, 1.25634765625, 1.71875, 2.18115234375, 2.6435546875, 3.10595703125, 3.568359375, 4.03076171875, 4.4931640625, 4.95556640625, 5.41796875, 5.88037109375, 6.3427734375, 6.80517578125, 7.267578125, 7.72998046875, 8.1923828125, 8.65478515625, 9.1171875, 9.57958984375, 10.0419921875, 10.50439453125, 10.966796875, 11.42919921875, 11.8916015625, 12.35400390625, 12.81640625, 13.27880859375, 13.7412109375, 14.20361328125, 14.666015625, 15.12841796875, 15.5908203125, 16.05322265625, 16.515625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 7.0, 2.0, 2.0, 8.0, 10.0, 12.0, 14.0, 10.0, 20.0, 10.0, 23.0, 26.0, 25.0, 30.0, 29.0, 25.0, 48.0, 36.0, 40.0, 46.0, 29.0, 42.0, 38.0, 47.0, 45.0, 47.0, 47.0, 38.0, 28.0, 28.0, 28.0, 23.0, 28.0, 18.0, 21.0, 16.0, 16.0, 14.0, 6.0, 6.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.42919921875, -14.8740234375, -14.31884765625, -13.763671875, -13.20849609375, -12.6533203125, -12.09814453125, -11.54296875, -10.98779296875, -10.4326171875, -9.87744140625, -9.322265625, -8.76708984375, -8.2119140625, -7.65673828125, -7.1015625, -6.54638671875, -5.9912109375, -5.43603515625, -4.880859375, -4.32568359375, -3.7705078125, -3.21533203125, -2.66015625, -2.10498046875, -1.5498046875, -0.99462890625, -0.439453125, 0.11572265625, 0.6708984375, 1.22607421875, 1.78125, 2.33642578125, 2.8916015625, 3.44677734375, 4.001953125, 4.55712890625, 5.1123046875, 5.66748046875, 6.22265625, 6.77783203125, 7.3330078125, 7.88818359375, 8.443359375, 8.99853515625, 9.5537109375, 10.10888671875, 10.6640625, 11.21923828125, 11.7744140625, 12.32958984375, 12.884765625, 13.43994140625, 13.9951171875, 14.55029296875, 15.10546875, 15.66064453125, 16.2158203125, 16.77099609375, 17.326171875, 17.88134765625, 18.4365234375, 18.99169921875, 19.546875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 19.0, 22.0, 39.0, 82.0, 139.0, 228.0, 371.0, 638.0, 1051.0, 1935.0, 3169.0, 5239.0, 8793.0, 14568.0, 23535.0, 37055.0, 56486.0, 85766.0, 125699.0, 176328.0, 234622.0, 297052.0, 353579.0, 396352.0, 415716.0, 405658.0, 370512.0, 316642.0, 254329.0, 193064.0, 140389.0, 97281.0, 65276.0, 42497.0, 27260.0, 17028.0, 10357.0, 6312.0, 3719.0, 2229.0, 1316.0, 811.0, 420.0, 300.0, 183.0, 93.0, 58.0, 38.0, 9.0, 9.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.3472900390625, -11.944580078125, -11.5418701171875, -11.13916015625, -10.7364501953125, -10.333740234375, -9.9310302734375, -9.5283203125, -9.1256103515625, -8.722900390625, -8.3201904296875, -7.91748046875, -7.5147705078125, -7.112060546875, -6.7093505859375, -6.306640625, -5.9039306640625, -5.501220703125, -5.0985107421875, -4.69580078125, -4.2930908203125, -3.890380859375, -3.4876708984375, -3.0849609375, -2.6822509765625, -2.279541015625, -1.8768310546875, -1.47412109375, -1.0714111328125, -0.668701171875, -0.2659912109375, 0.13671875, 0.5394287109375, 0.942138671875, 1.3448486328125, 1.74755859375, 2.1502685546875, 2.552978515625, 2.9556884765625, 3.3583984375, 3.7611083984375, 4.163818359375, 4.5665283203125, 4.96923828125, 5.3719482421875, 5.774658203125, 6.1773681640625, 6.580078125, 6.9827880859375, 7.385498046875, 7.7882080078125, 8.19091796875, 8.5936279296875, 8.996337890625, 9.3990478515625, 9.8017578125, 10.2044677734375, 10.607177734375, 11.0098876953125, 11.41259765625, 11.8153076171875, 12.218017578125, 12.6207275390625, 13.0234375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 6.0, 15.0, 10.0, 13.0, 10.0, 23.0, 32.0, 32.0, 39.0, 62.0, 85.0, 66.0, 99.0, 97.0, 104.0, 129.0, 158.0, 170.0, 186.0, 167.0, 208.0, 195.0, 202.0, 194.0, 205.0, 171.0, 177.0, 173.0, 150.0, 135.0, 105.0, 102.0, 89.0, 88.0, 80.0, 59.0, 49.0, 39.0, 39.0, 27.0, 19.0, 21.0, 12.0, 7.0, 13.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.403564453125, -7.16259765625, -6.921630859375, -6.6806640625, -6.439697265625, -6.19873046875, -5.957763671875, -5.716796875, -5.475830078125, -5.23486328125, -4.993896484375, -4.7529296875, -4.511962890625, -4.27099609375, -4.030029296875, -3.7890625, -3.548095703125, -3.30712890625, -3.066162109375, -2.8251953125, -2.584228515625, -2.34326171875, -2.102294921875, -1.861328125, -1.620361328125, -1.37939453125, -1.138427734375, -0.8974609375, -0.656494140625, -0.41552734375, -0.174560546875, 0.06640625, 0.307373046875, 0.54833984375, 0.789306640625, 1.0302734375, 1.271240234375, 1.51220703125, 1.753173828125, 1.994140625, 2.235107421875, 2.47607421875, 2.717041015625, 2.9580078125, 3.198974609375, 3.43994140625, 3.680908203125, 3.921875, 4.162841796875, 4.40380859375, 4.644775390625, 4.8857421875, 5.126708984375, 5.36767578125, 5.608642578125, 5.849609375, 6.090576171875, 6.33154296875, 6.572509765625, 6.8134765625, 7.054443359375, 7.29541015625, 7.536376953125, 7.77734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 9.0, 7.0, 20.0, 19.0, 28.0, 28.0, 38.0, 44.0, 30.0, 50.0, 49.0, 63.0, 71.0, 71.0, 71.0, 69.0, 54.0, 45.0, 40.0, 37.0, 38.0, 28.0, 17.0, 23.0, 12.0, 11.0, 10.0, 1.0, 4.0, 6.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.934795379638672, -19.184358596801758, -18.433923721313477, -17.683486938476562, -16.93305206298828, -16.182615280151367, -15.432178497314453, -14.681742668151855, -13.931306838989258, -13.18087100982666, -12.430435180664062, -11.679998397827148, -10.92956256866455, -10.179126739501953, -9.428689956665039, -8.678254127502441, -7.927818298339844, -7.177382469177246, -6.42694616317749, -5.676509857177734, -4.926074028015137, -4.175638198852539, -3.425201892852783, -2.6747655868530273, -1.9243297576904297, -1.173893690109253, -0.42345762252807617, 0.3269784450531006, 1.0774145126342773, 1.827850580215454, 2.578286647796631, 3.3287229537963867, 4.079156875610352, 4.829592704772949, 5.580029010772705, 6.330465316772461, 7.080901145935059, 7.831336975097656, 8.58177375793457, 9.332209587097168, 10.082645416259766, 10.833081245422363, 11.583517074584961, 12.333953857421875, 13.084389686584473, 13.83482551574707, 14.585262298583984, 15.335698127746582, 16.08613395690918, 16.836570739746094, 17.587005615234375, 18.33744239807129, 19.087879180908203, 19.838314056396484, 20.5887508392334, 21.339187622070312, 22.089622497558594, 22.840059280395508, 23.59049415588379, 24.340930938720703, 25.091365814208984, 25.8418025970459, 26.592239379882812, 27.342674255371094, 28.093111038208008]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 6.0, 6.0, 6.0, 8.0, 16.0, 18.0, 12.0, 13.0, 17.0, 31.0, 31.0, 28.0, 28.0, 40.0, 32.0, 44.0, 34.0, 34.0, 23.0, 44.0, 43.0, 39.0, 54.0, 43.0, 37.0, 42.0, 35.0, 28.0, 29.0, 33.0, 21.0, 20.0, 22.0, 19.0, 9.0, 10.0, 13.0, 7.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.133386611938477, -19.46126937866211, -18.78915023803711, -18.117033004760742, -17.444915771484375, -16.772796630859375, -16.100679397583008, -15.42856216430664, -14.756443977355957, -14.084325790405273, -13.412208557128906, -12.740090370178223, -12.067972183227539, -11.395854949951172, -10.723736763000488, -10.051618576049805, -9.379501342773438, -8.707383155822754, -8.035265922546387, -7.363147735595703, -6.691030025482178, -6.018912315368652, -5.346794128417969, -4.674676418304443, -4.002558708190918, -3.3304409980773926, -2.658323049545288, -1.9862051010131836, -1.3140873908996582, -0.6419696807861328, 0.03014850616455078, 0.7022662162780762, 1.3743839263916016, 2.046501636505127, 2.7186195850372314, 3.390737533569336, 4.062855243682861, 4.734972953796387, 5.40709114074707, 6.079208850860596, 6.751326560974121, 7.4234442710876465, 8.095561981201172, 8.767680168151855, 9.439798355102539, 10.111915588378906, 10.78403377532959, 11.456151962280273, 12.12826919555664, 12.800387382507324, 13.472504615783691, 14.144622802734375, 14.816740036010742, 15.488858222961426, 16.16097640991211, 16.833093643188477, 17.505210876464844, 18.17732810974121, 18.84944725036621, 19.521564483642578, 20.193681716918945, 20.865798950195312, 21.537918090820312, 22.21003532409668, 22.88215446472168]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 16.0, 19.0, 30.0, 36.0, 65.0, 89.0, 141.0, 211.0, 366.0, 576.0, 967.0, 1595.0, 2719.0, 4678.0, 8094.0, 14379.0, 24947.0, 44576.0, 79729.0, 143520.0, 229249.0, 209950.0, 123994.0, 68771.0, 38246.0, 21841.0, 12457.0, 7042.0, 4159.0, 2425.0, 1409.0, 834.0, 530.0, 330.0, 184.0, 125.0, 76.0, 52.0, 32.0, 31.0, 26.0, 10.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.615570068359375, -2.51824951171875, -2.420928955078125, -2.3236083984375, -2.226287841796875, -2.12896728515625, -2.031646728515625, -1.934326171875, -1.837005615234375, -1.73968505859375, -1.642364501953125, -1.5450439453125, -1.447723388671875, -1.35040283203125, -1.253082275390625, -1.15576171875, -1.058441162109375, -0.96112060546875, -0.863800048828125, -0.7664794921875, -0.669158935546875, -0.57183837890625, -0.474517822265625, -0.377197265625, -0.279876708984375, -0.18255615234375, -0.085235595703125, 0.0120849609375, 0.109405517578125, 0.20672607421875, 0.304046630859375, 0.4013671875, 0.498687744140625, 0.59600830078125, 0.693328857421875, 0.7906494140625, 0.887969970703125, 0.98529052734375, 1.082611083984375, 1.179931640625, 1.277252197265625, 1.37457275390625, 1.471893310546875, 1.5692138671875, 1.666534423828125, 1.76385498046875, 1.861175537109375, 1.95849609375, 2.055816650390625, 2.15313720703125, 2.250457763671875, 2.3477783203125, 2.445098876953125, 2.54241943359375, 2.639739990234375, 2.737060546875, 2.834381103515625, 2.93170166015625, 3.029022216796875, 3.1263427734375, 3.223663330078125, 3.32098388671875, 3.418304443359375, 3.515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 4.0, 9.0, 8.0, 15.0, 15.0, 17.0, 23.0, 25.0, 24.0, 28.0, 44.0, 47.0, 34.0, 41.0, 38.0, 33.0, 45.0, 42.0, 50.0, 50.0, 47.0, 41.0, 34.0, 32.0, 36.0, 31.0, 24.0, 34.0, 28.0, 20.0, 19.0, 11.0, 11.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.1044921875, -20.365234375, -19.6259765625, -18.88671875, -18.1474609375, -17.408203125, -16.6689453125, -15.9296875, -15.1904296875, -14.451171875, -13.7119140625, -12.97265625, -12.2333984375, -11.494140625, -10.7548828125, -10.015625, -9.2763671875, -8.537109375, -7.7978515625, -7.05859375, -6.3193359375, -5.580078125, -4.8408203125, -4.1015625, -3.3623046875, -2.623046875, -1.8837890625, -1.14453125, -0.4052734375, 0.333984375, 1.0732421875, 1.8125, 2.5517578125, 3.291015625, 4.0302734375, 4.76953125, 5.5087890625, 6.248046875, 6.9873046875, 7.7265625, 8.4658203125, 9.205078125, 9.9443359375, 10.68359375, 11.4228515625, 12.162109375, 12.9013671875, 13.640625, 14.3798828125, 15.119140625, 15.8583984375, 16.59765625, 17.3369140625, 18.076171875, 18.8154296875, 19.5546875, 20.2939453125, 21.033203125, 21.7724609375, 22.51171875, 23.2509765625, 23.990234375, 24.7294921875, 25.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 13.0, 18.0, 17.0, 48.0, 37.0, 75.0, 118.0, 120.0, 191.0, 245.0, 388.0, 499.0, 753.0, 1143.0, 1648.0, 2448.0, 3641.0, 5381.0, 8062.0, 12696.0, 19959.0, 31642.0, 50034.0, 80258.0, 124326.0, 179364.0, 179013.0, 125348.0, 80830.0, 50552.0, 31732.0, 19977.0, 12697.0, 8439.0, 5599.0, 3400.0, 2467.0, 1637.0, 1073.0, 763.0, 572.0, 413.0, 254.0, 203.0, 141.0, 101.0, 71.0, 51.0, 25.0, 25.0, 21.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0], "bins": [-2.462890625, -2.388275146484375, -2.31365966796875, -2.239044189453125, -2.1644287109375, -2.089813232421875, -2.01519775390625, -1.940582275390625, -1.865966796875, -1.791351318359375, -1.71673583984375, -1.642120361328125, -1.5675048828125, -1.492889404296875, -1.41827392578125, -1.343658447265625, -1.26904296875, -1.194427490234375, -1.11981201171875, -1.045196533203125, -0.9705810546875, -0.895965576171875, -0.82135009765625, -0.746734619140625, -0.672119140625, -0.597503662109375, -0.52288818359375, -0.448272705078125, -0.3736572265625, -0.299041748046875, -0.22442626953125, -0.149810791015625, -0.0751953125, -0.000579833984375, 0.07403564453125, 0.148651123046875, 0.2232666015625, 0.297882080078125, 0.37249755859375, 0.447113037109375, 0.521728515625, 0.596343994140625, 0.67095947265625, 0.745574951171875, 0.8201904296875, 0.894805908203125, 0.96942138671875, 1.044036865234375, 1.11865234375, 1.193267822265625, 1.26788330078125, 1.342498779296875, 1.4171142578125, 1.491729736328125, 1.56634521484375, 1.640960693359375, 1.715576171875, 1.790191650390625, 1.86480712890625, 1.939422607421875, 2.0140380859375, 2.088653564453125, 2.16326904296875, 2.237884521484375, 2.3125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 14.0, 5.0, 8.0, 10.0, 3.0, 13.0, 16.0, 17.0, 14.0, 14.0, 29.0, 27.0, 22.0, 28.0, 31.0, 38.0, 34.0, 35.0, 41.0, 37.0, 43.0, 40.0, 36.0, 39.0, 34.0, 28.0, 40.0, 33.0, 20.0, 25.0, 25.0, 18.0, 29.0, 27.0, 26.0, 18.0, 12.0, 6.0, 13.0, 15.0, 9.0, 6.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8046875, -12.399169921875, -11.99365234375, -11.588134765625, -11.1826171875, -10.777099609375, -10.37158203125, -9.966064453125, -9.560546875, -9.155029296875, -8.74951171875, -8.343994140625, -7.9384765625, -7.532958984375, -7.12744140625, -6.721923828125, -6.31640625, -5.910888671875, -5.50537109375, -5.099853515625, -4.6943359375, -4.288818359375, -3.88330078125, -3.477783203125, -3.072265625, -2.666748046875, -2.26123046875, -1.855712890625, -1.4501953125, -1.044677734375, -0.63916015625, -0.233642578125, 0.171875, 0.577392578125, 0.98291015625, 1.388427734375, 1.7939453125, 2.199462890625, 2.60498046875, 3.010498046875, 3.416015625, 3.821533203125, 4.22705078125, 4.632568359375, 5.0380859375, 5.443603515625, 5.84912109375, 6.254638671875, 6.66015625, 7.065673828125, 7.47119140625, 7.876708984375, 8.2822265625, 8.687744140625, 9.09326171875, 9.498779296875, 9.904296875, 10.309814453125, 10.71533203125, 11.120849609375, 11.5263671875, 11.931884765625, 12.33740234375, 12.742919921875, 13.1484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 10.0, 16.0, 26.0, 44.0, 41.0, 68.0, 108.0, 154.0, 194.0, 353.0, 525.0, 832.0, 1281.0, 1918.0, 3005.0, 4495.0, 7311.0, 11884.0, 19460.0, 32622.0, 57662.0, 107758.0, 205654.0, 259210.0, 147442.0, 77649.0, 42955.0, 25075.0, 15132.0, 9218.0, 5860.0, 3661.0, 2409.0, 1537.0, 1009.0, 665.0, 420.0, 300.0, 199.0, 128.0, 75.0, 69.0, 35.0, 29.0, 12.0, 13.0, 9.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.1026611328125, -0.09957313537597656, -0.09648513793945312, -0.09339714050292969, -0.09030914306640625, -0.08722114562988281, -0.08413314819335938, -0.08104515075683594, -0.0779571533203125, -0.07486915588378906, -0.07178115844726562, -0.06869316101074219, -0.06560516357421875, -0.06251716613769531, -0.059429168701171875, -0.05634117126464844, -0.053253173828125, -0.05016517639160156, -0.047077178955078125, -0.04398918151855469, -0.04090118408203125, -0.03781318664550781, -0.034725189208984375, -0.03163719177246094, -0.0285491943359375, -0.025461196899414062, -0.022373199462890625, -0.019285202026367188, -0.01619720458984375, -0.013109207153320312, -0.010021209716796875, -0.0069332122802734375, -0.00384521484375, -0.0007572174072265625, 0.002330780029296875, 0.0054187774658203125, 0.00850677490234375, 0.011594772338867188, 0.014682769775390625, 0.017770767211914062, 0.0208587646484375, 0.023946762084960938, 0.027034759521484375, 0.030122756958007812, 0.03321075439453125, 0.03629875183105469, 0.039386749267578125, 0.04247474670410156, 0.045562744140625, 0.04865074157714844, 0.051738739013671875, 0.05482673645019531, 0.05791473388671875, 0.06100273132324219, 0.06409072875976562, 0.06717872619628906, 0.0702667236328125, 0.07335472106933594, 0.07644271850585938, 0.07953071594238281, 0.08261871337890625, 0.08570671081542969, 0.08879470825195312, 0.09188270568847656, 0.094970703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 5.0, 6.0, 2.0, 3.0, 7.0, 9.0, 12.0, 14.0, 10.0, 16.0, 14.0, 22.0, 41.0, 26.0, 28.0, 27.0, 39.0, 45.0, 51.0, 27.0, 54.0, 30.0, 44.0, 57.0, 42.0, 41.0, 41.0, 36.0, 42.0, 41.0, 21.0, 22.0, 27.0, 15.0, 18.0, 11.0, 12.0, 11.0, 8.0, 11.0, 7.0, 4.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6868114471435547e-05, -1.6322359442710876e-05, -1.5776604413986206e-05, -1.5230849385261536e-05, -1.4685094356536865e-05, -1.4139339327812195e-05, -1.3593584299087524e-05, -1.3047829270362854e-05, -1.2502074241638184e-05, -1.1956319212913513e-05, -1.1410564184188843e-05, -1.0864809155464172e-05, -1.0319054126739502e-05, -9.773299098014832e-06, -9.227544069290161e-06, -8.68178904056549e-06, -8.13603401184082e-06, -7.59027898311615e-06, -7.0445239543914795e-06, -6.498768925666809e-06, -5.953013896942139e-06, -5.407258868217468e-06, -4.861503839492798e-06, -4.3157488107681274e-06, -3.769993782043457e-06, -3.2242387533187866e-06, -2.678483724594116e-06, -2.132728695869446e-06, -1.5869736671447754e-06, -1.041218638420105e-06, -4.954636096954346e-07, 5.029141902923584e-08, 5.960464477539062e-07, 1.1418014764785767e-06, 1.687556505203247e-06, 2.2333115339279175e-06, 2.779066562652588e-06, 3.3248215913772583e-06, 3.870576620101929e-06, 4.416331648826599e-06, 4.9620866775512695e-06, 5.50784170627594e-06, 6.05359673500061e-06, 6.599351763725281e-06, 7.145106792449951e-06, 7.690861821174622e-06, 8.236616849899292e-06, 8.782371878623962e-06, 9.328126907348633e-06, 9.873881936073303e-06, 1.0419636964797974e-05, 1.0965391993522644e-05, 1.1511147022247314e-05, 1.2056902050971985e-05, 1.2602657079696655e-05, 1.3148412108421326e-05, 1.3694167137145996e-05, 1.4239922165870667e-05, 1.4785677194595337e-05, 1.5331432223320007e-05, 1.5877187252044678e-05, 1.6422942280769348e-05, 1.696869730949402e-05, 1.751445233821869e-05, 1.806020736694336e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 4.0, 12.0, 18.0, 30.0, 44.0, 55.0, 100.0, 169.0, 204.0, 343.0, 576.0, 905.0, 1396.0, 2199.0, 3355.0, 5346.0, 8636.0, 14107.0, 22719.0, 38066.0, 65611.0, 123191.0, 254673.0, 237787.0, 114118.0, 61825.0, 35854.0, 21498.0, 13333.0, 8244.0, 5190.0, 3314.0, 2078.0, 1298.0, 789.0, 536.0, 341.0, 186.0, 142.0, 97.0, 52.0, 27.0, 27.0, 17.0, 16.0, 12.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2152099609375, -0.20847320556640625, -0.2017364501953125, -0.19499969482421875, -0.188262939453125, -0.18152618408203125, -0.1747894287109375, -0.16805267333984375, -0.16131591796875, -0.15457916259765625, -0.1478424072265625, -0.14110565185546875, -0.134368896484375, -0.12763214111328125, -0.1208953857421875, -0.11415863037109375, -0.107421875, -0.10068511962890625, -0.0939483642578125, -0.08721160888671875, -0.080474853515625, -0.07373809814453125, -0.0670013427734375, -0.06026458740234375, -0.05352783203125, -0.04679107666015625, -0.0400543212890625, -0.03331756591796875, -0.026580810546875, -0.01984405517578125, -0.0131072998046875, -0.00637054443359375, 0.0003662109375, 0.00710296630859375, 0.0138397216796875, 0.02057647705078125, 0.027313232421875, 0.03404998779296875, 0.0407867431640625, 0.04752349853515625, 0.05426025390625, 0.06099700927734375, 0.0677337646484375, 0.07447052001953125, 0.081207275390625, 0.08794403076171875, 0.0946807861328125, 0.10141754150390625, 0.108154296875, 0.11489105224609375, 0.1216278076171875, 0.12836456298828125, 0.135101318359375, 0.14183807373046875, 0.1485748291015625, 0.15531158447265625, 0.16204833984375, 0.16878509521484375, 0.1755218505859375, 0.18225860595703125, 0.188995361328125, 0.19573211669921875, 0.2024688720703125, 0.20920562744140625, 0.2159423828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 10.0, 9.0, 8.0, 9.0, 16.0, 11.0, 13.0, 16.0, 27.0, 32.0, 36.0, 47.0, 41.0, 51.0, 60.0, 64.0, 81.0, 83.0, 58.0, 46.0, 43.0, 31.0, 30.0, 32.0, 20.0, 15.0, 13.0, 12.0, 14.0, 13.0, 6.0, 9.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.09429931640625, -0.09148025512695312, -0.08866119384765625, -0.08584213256835938, -0.0830230712890625, -0.08020401000976562, -0.07738494873046875, -0.07456588745117188, -0.071746826171875, -0.06892776489257812, -0.06610870361328125, -0.06328964233398438, -0.0604705810546875, -0.057651519775390625, -0.05483245849609375, -0.052013397216796875, -0.0491943359375, -0.046375274658203125, -0.04355621337890625, -0.040737152099609375, -0.0379180908203125, -0.035099029541015625, -0.03227996826171875, -0.029460906982421875, -0.026641845703125, -0.023822784423828125, -0.02100372314453125, -0.018184661865234375, -0.0153656005859375, -0.012546539306640625, -0.00972747802734375, -0.006908416748046875, -0.00408935546875, -0.001270294189453125, 0.00154876708984375, 0.004367828369140625, 0.0071868896484375, 0.010005950927734375, 0.01282501220703125, 0.015644073486328125, 0.018463134765625, 0.021282196044921875, 0.02410125732421875, 0.026920318603515625, 0.0297393798828125, 0.032558441162109375, 0.03537750244140625, 0.038196563720703125, 0.041015625, 0.043834686279296875, 0.04665374755859375, 0.049472808837890625, 0.0522918701171875, 0.055110931396484375, 0.05792999267578125, 0.060749053955078125, 0.063568115234375, 0.06638717651367188, 0.06920623779296875, 0.07202529907226562, 0.0748443603515625, 0.07766342163085938, 0.08048248291015625, 0.08330154418945312, 0.08612060546875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 14.0, 11.0, 18.0, 23.0, 29.0, 29.0, 40.0, 34.0, 43.0, 54.0, 47.0, 68.0, 76.0, 72.0, 62.0, 62.0, 60.0, 46.0, 35.0, 30.0, 43.0, 19.0, 19.0, 22.0, 9.0, 13.0, 4.0, 1.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.65962791442871, -18.907756805419922, -18.155885696411133, -17.404014587402344, -16.652141571044922, -15.900270462036133, -15.148399353027344, -14.396528244018555, -13.644657135009766, -12.892786026000977, -12.140913963317871, -11.389042854309082, -10.637171745300293, -9.885299682617188, -9.133428573608398, -8.38155746459961, -7.629685401916504, -6.877813816070557, -6.125942707061768, -5.37407112121582, -4.622200012207031, -3.870328426361084, -3.1184568405151367, -2.3665857315063477, -1.6147141456604004, -0.8628427386283875, -0.11097133159637451, 0.6409001350402832, 1.3927714824676514, 2.1446428298950195, 2.896514415740967, 3.648385524749756, 4.400257110595703, 5.15212869644165, 5.9039998054504395, 6.655871391296387, 7.407742500305176, 8.159614562988281, 8.91148567199707, 9.66335678100586, 10.415227890014648, 11.167098999023438, 11.918971061706543, 12.670842170715332, 13.422713279724121, 14.174585342407227, 14.926456451416016, 15.678327560424805, 16.430198669433594, 17.182069778442383, 17.933940887451172, 18.685813903808594, 19.437685012817383, 20.189556121826172, 20.94142723083496, 21.69329833984375, 22.445171356201172, 23.19704246520996, 23.94891357421875, 24.700786590576172, 25.45265769958496, 26.20452880859375, 26.95639991760254, 27.708271026611328, 28.460142135620117]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 5.0, 7.0, 6.0, 8.0, 17.0, 16.0, 10.0, 15.0, 15.0, 31.0, 33.0, 28.0, 28.0, 39.0, 29.0, 46.0, 34.0, 34.0, 21.0, 46.0, 42.0, 43.0, 49.0, 44.0, 38.0, 42.0, 36.0, 27.0, 30.0, 29.0, 25.0, 22.0, 21.0, 20.0, 8.0, 9.0, 12.0, 10.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.081941604614258, -19.4132022857666, -18.744461059570312, -18.075721740722656, -17.406982421875, -16.73824119567871, -16.069501876831055, -15.400761604309082, -14.73202133178711, -14.063281059265137, -13.394540786743164, -12.725801467895508, -12.057061195373535, -11.388320922851562, -10.719581604003906, -10.050841331481934, -9.382101058959961, -8.713360786437988, -8.044620513916016, -7.375881195068359, -6.707140922546387, -6.038400650024414, -5.3696608543396, -4.700921058654785, -4.0321807861328125, -3.363440752029419, -2.6947007179260254, -2.025960683822632, -1.3572206497192383, -0.6884806156158447, -0.019740581512451172, 0.6489992141723633, 1.317739486694336, 1.9864795207977295, 2.655219554901123, 3.3239595890045166, 3.99269962310791, 4.661439895629883, 5.330179691314697, 5.998919486999512, 6.667659759521484, 7.336400032043457, 8.00514030456543, 8.673879623413086, 9.342619895935059, 10.011360168457031, 10.680099487304688, 11.34883975982666, 12.017580032348633, 12.686320304870605, 13.355060577392578, 14.023799896240234, 14.692540168762207, 15.36128044128418, 16.030019760131836, 16.698760986328125, 17.36750030517578, 18.036239624023438, 18.704980850219727, 19.373720169067383, 20.042461395263672, 20.711200714111328, 21.379940032958984, 22.04867935180664, 22.71742057800293]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 10.0, 5.0, 14.0, 26.0, 52.0, 72.0, 112.0, 164.0, 239.0, 385.0, 624.0, 1042.0, 1634.0, 2551.0, 4125.0, 6326.0, 9856.0, 15161.0, 22358.0, 32411.0, 45711.0, 61284.0, 77021.0, 92013.0, 102647.0, 105962.0, 101564.0, 91158.0, 76440.0, 59062.0, 44128.0, 31854.0, 21817.0, 14377.0, 9353.0, 6263.0, 3883.0, 2583.0, 1581.0, 1015.0, 621.0, 384.0, 246.0, 154.0, 96.0, 70.0, 35.0, 33.0, 10.0, 11.0, 10.0, 5.0, 4.0, 2.0, 2.0], "bins": [-12.2109375, -11.8565673828125, -11.502197265625, -11.1478271484375, -10.79345703125, -10.4390869140625, -10.084716796875, -9.7303466796875, -9.3759765625, -9.0216064453125, -8.667236328125, -8.3128662109375, -7.95849609375, -7.6041259765625, -7.249755859375, -6.8953857421875, -6.541015625, -6.1866455078125, -5.832275390625, -5.4779052734375, -5.12353515625, -4.7691650390625, -4.414794921875, -4.0604248046875, -3.7060546875, -3.3516845703125, -2.997314453125, -2.6429443359375, -2.28857421875, -1.9342041015625, -1.579833984375, -1.2254638671875, -0.87109375, -0.5167236328125, -0.162353515625, 0.1920166015625, 0.54638671875, 0.9007568359375, 1.255126953125, 1.6094970703125, 1.9638671875, 2.3182373046875, 2.672607421875, 3.0269775390625, 3.38134765625, 3.7357177734375, 4.090087890625, 4.4444580078125, 4.798828125, 5.1531982421875, 5.507568359375, 5.8619384765625, 6.21630859375, 6.5706787109375, 6.925048828125, 7.2794189453125, 7.6337890625, 7.9881591796875, 8.342529296875, 8.6968994140625, 9.05126953125, 9.4056396484375, 9.760009765625, 10.1143798828125, 10.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 7.0, 10.0, 9.0, 16.0, 12.0, 21.0, 17.0, 23.0, 30.0, 28.0, 30.0, 24.0, 34.0, 31.0, 34.0, 34.0, 22.0, 33.0, 37.0, 42.0, 37.0, 34.0, 47.0, 33.0, 35.0, 35.0, 29.0, 32.0, 29.0, 26.0, 27.0, 25.0, 18.0, 13.0, 12.0, 10.0, 7.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.921875, -18.31201171875, -17.7021484375, -17.09228515625, -16.482421875, -15.87255859375, -15.2626953125, -14.65283203125, -14.04296875, -13.43310546875, -12.8232421875, -12.21337890625, -11.603515625, -10.99365234375, -10.3837890625, -9.77392578125, -9.1640625, -8.55419921875, -7.9443359375, -7.33447265625, -6.724609375, -6.11474609375, -5.5048828125, -4.89501953125, -4.28515625, -3.67529296875, -3.0654296875, -2.45556640625, -1.845703125, -1.23583984375, -0.6259765625, -0.01611328125, 0.59375, 1.20361328125, 1.8134765625, 2.42333984375, 3.033203125, 3.64306640625, 4.2529296875, 4.86279296875, 5.47265625, 6.08251953125, 6.6923828125, 7.30224609375, 7.912109375, 8.52197265625, 9.1318359375, 9.74169921875, 10.3515625, 10.96142578125, 11.5712890625, 12.18115234375, 12.791015625, 13.40087890625, 14.0107421875, 14.62060546875, 15.23046875, 15.84033203125, 16.4501953125, 17.06005859375, 17.669921875, 18.27978515625, 18.8896484375, 19.49951171875, 20.109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 13.0, 15.0, 13.0, 30.0, 55.0, 84.0, 152.0, 221.0, 345.0, 576.0, 852.0, 1399.0, 1998.0, 2976.0, 4357.0, 6392.0, 9311.0, 13384.0, 19010.0, 26119.0, 34928.0, 45251.0, 57660.0, 68988.0, 80086.0, 87806.0, 91247.0, 88958.0, 82907.0, 73889.0, 61708.0, 49909.0, 38856.0, 29007.0, 21341.0, 15239.0, 10877.0, 7434.0, 5071.0, 3472.0, 2231.0, 1586.0, 984.0, 646.0, 432.0, 275.0, 160.0, 131.0, 70.0, 48.0, 23.0, 21.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.40625, -9.0997314453125, -8.793212890625, -8.4866943359375, -8.18017578125, -7.8736572265625, -7.567138671875, -7.2606201171875, -6.9541015625, -6.6475830078125, -6.341064453125, -6.0345458984375, -5.72802734375, -5.4215087890625, -5.114990234375, -4.8084716796875, -4.501953125, -4.1954345703125, -3.888916015625, -3.5823974609375, -3.27587890625, -2.9693603515625, -2.662841796875, -2.3563232421875, -2.0498046875, -1.7432861328125, -1.436767578125, -1.1302490234375, -0.82373046875, -0.5172119140625, -0.210693359375, 0.0958251953125, 0.40234375, 0.7088623046875, 1.015380859375, 1.3218994140625, 1.62841796875, 1.9349365234375, 2.241455078125, 2.5479736328125, 2.8544921875, 3.1610107421875, 3.467529296875, 3.7740478515625, 4.08056640625, 4.3870849609375, 4.693603515625, 5.0001220703125, 5.306640625, 5.6131591796875, 5.919677734375, 6.2261962890625, 6.53271484375, 6.8392333984375, 7.145751953125, 7.4522705078125, 7.7587890625, 8.0653076171875, 8.371826171875, 8.6783447265625, 8.98486328125, 9.2913818359375, 9.597900390625, 9.9044189453125, 10.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 1.0, 6.0, 3.0, 3.0, 8.0, 7.0, 7.0, 11.0, 9.0, 17.0, 15.0, 16.0, 17.0, 17.0, 28.0, 23.0, 25.0, 31.0, 39.0, 45.0, 25.0, 32.0, 31.0, 47.0, 32.0, 30.0, 40.0, 30.0, 26.0, 26.0, 31.0, 37.0, 37.0, 42.0, 28.0, 26.0, 24.0, 15.0, 14.0, 11.0, 12.0, 12.0, 9.0, 9.0, 8.0, 11.0, 6.0, 11.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.7109375, -11.3514404296875, -10.991943359375, -10.6324462890625, -10.27294921875, -9.9134521484375, -9.553955078125, -9.1944580078125, -8.8349609375, -8.4754638671875, -8.115966796875, -7.7564697265625, -7.39697265625, -7.0374755859375, -6.677978515625, -6.3184814453125, -5.958984375, -5.5994873046875, -5.239990234375, -4.8804931640625, -4.52099609375, -4.1614990234375, -3.802001953125, -3.4425048828125, -3.0830078125, -2.7235107421875, -2.364013671875, -2.0045166015625, -1.64501953125, -1.2855224609375, -0.926025390625, -0.5665283203125, -0.20703125, 0.1524658203125, 0.511962890625, 0.8714599609375, 1.23095703125, 1.5904541015625, 1.949951171875, 2.3094482421875, 2.6689453125, 3.0284423828125, 3.387939453125, 3.7474365234375, 4.10693359375, 4.4664306640625, 4.825927734375, 5.1854248046875, 5.544921875, 5.9044189453125, 6.263916015625, 6.6234130859375, 6.98291015625, 7.3424072265625, 7.701904296875, 8.0614013671875, 8.4208984375, 8.7803955078125, 9.139892578125, 9.4993896484375, 9.85888671875, 10.2183837890625, 10.577880859375, 10.9373779296875, 11.296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 12.0, 14.0, 26.0, 56.0, 83.0, 123.0, 170.0, 272.0, 450.0, 647.0, 1101.0, 1706.0, 2828.0, 4483.0, 7127.0, 11416.0, 17764.0, 27445.0, 40505.0, 57826.0, 77526.0, 98103.0, 113190.0, 118899.0, 113526.0, 98617.0, 79066.0, 58638.0, 40964.0, 27557.0, 17751.0, 11372.0, 7265.0, 4502.0, 2834.0, 1666.0, 1115.0, 686.0, 426.0, 291.0, 189.0, 105.0, 73.0, 57.0, 36.0, 17.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.71875, -3.6043701171875, -3.489990234375, -3.3756103515625, -3.26123046875, -3.1468505859375, -3.032470703125, -2.9180908203125, -2.8037109375, -2.6893310546875, -2.574951171875, -2.4605712890625, -2.34619140625, -2.2318115234375, -2.117431640625, -2.0030517578125, -1.888671875, -1.7742919921875, -1.659912109375, -1.5455322265625, -1.43115234375, -1.3167724609375, -1.202392578125, -1.0880126953125, -0.9736328125, -0.8592529296875, -0.744873046875, -0.6304931640625, -0.51611328125, -0.4017333984375, -0.287353515625, -0.1729736328125, -0.05859375, 0.0557861328125, 0.170166015625, 0.2845458984375, 0.39892578125, 0.5133056640625, 0.627685546875, 0.7420654296875, 0.8564453125, 0.9708251953125, 1.085205078125, 1.1995849609375, 1.31396484375, 1.4283447265625, 1.542724609375, 1.6571044921875, 1.771484375, 1.8858642578125, 2.000244140625, 2.1146240234375, 2.22900390625, 2.3433837890625, 2.457763671875, 2.5721435546875, 2.6865234375, 2.8009033203125, 2.915283203125, 3.0296630859375, 3.14404296875, 3.2584228515625, 3.372802734375, 3.4871826171875, 3.6015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 8.0, 9.0, 12.0, 18.0, 16.0, 25.0, 26.0, 30.0, 27.0, 34.0, 36.0, 37.0, 53.0, 49.0, 39.0, 47.0, 50.0, 53.0, 53.0, 50.0, 47.0, 39.0, 34.0, 33.0, 20.0, 20.0, 19.0, 18.0, 13.0, 17.0, 14.0, 10.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039577484130859375, -0.00038237497210502625, -0.00036897510290145874, -0.00035557523369789124, -0.00034217536449432373, -0.0003287754952907562, -0.0003153756260871887, -0.0003019757568836212, -0.0002885758876800537, -0.0002751760184764862, -0.0002617761492729187, -0.0002483762800693512, -0.0002349764108657837, -0.0002215765416622162, -0.00020817667245864868, -0.00019477680325508118, -0.00018137693405151367, -0.00016797706484794617, -0.00015457719564437866, -0.00014117732644081116, -0.00012777745723724365, -0.00011437758803367615, -0.00010097771883010864, -8.757784962654114e-05, -7.417798042297363e-05, -6.077811121940613e-05, -4.737824201583862e-05, -3.397837281227112e-05, -2.0578503608703613e-05, -7.178634405136108e-06, 6.2212347984313965e-06, 1.96211040019989e-05, 3.3020973205566406e-05, 4.642084240913391e-05, 5.9820711612701416e-05, 7.322058081626892e-05, 8.662045001983643e-05, 0.00010002031922340393, 0.00011342018842697144, 0.00012682005763053894, 0.00014021992683410645, 0.00015361979603767395, 0.00016701966524124146, 0.00018041953444480896, 0.00019381940364837646, 0.00020721927285194397, 0.00022061914205551147, 0.00023401901125907898, 0.0002474188804626465, 0.000260818749666214, 0.0002742186188697815, 0.000287618488073349, 0.0003010183572769165, 0.000314418226480484, 0.0003278180956840515, 0.000341217964887619, 0.0003546178340911865, 0.00036801770329475403, 0.00038141757249832153, 0.00039481744170188904, 0.00040821731090545654, 0.00042161718010902405, 0.00043501704931259155, 0.00044841691851615906, 0.00046181678771972656]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 13.0, 16.0, 14.0, 23.0, 31.0, 59.0, 74.0, 115.0, 202.0, 329.0, 588.0, 949.0, 1695.0, 3065.0, 5647.0, 10759.0, 20018.0, 35850.0, 62986.0, 100219.0, 140109.0, 165250.0, 160370.0, 129607.0, 88769.0, 54080.0, 31034.0, 16730.0, 9039.0, 4789.0, 2613.0, 1426.0, 739.0, 487.0, 299.0, 185.0, 115.0, 75.0, 58.0, 31.0, 26.0, 22.0, 21.0, 7.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.15234375, -4.97979736328125, -4.8072509765625, -4.63470458984375, -4.462158203125, -4.28961181640625, -4.1170654296875, -3.94451904296875, -3.77197265625, -3.59942626953125, -3.4268798828125, -3.25433349609375, -3.081787109375, -2.90924072265625, -2.7366943359375, -2.56414794921875, -2.3916015625, -2.21905517578125, -2.0465087890625, -1.87396240234375, -1.701416015625, -1.52886962890625, -1.3563232421875, -1.18377685546875, -1.01123046875, -0.83868408203125, -0.6661376953125, -0.49359130859375, -0.321044921875, -0.14849853515625, 0.0240478515625, 0.19659423828125, 0.369140625, 0.54168701171875, 0.7142333984375, 0.88677978515625, 1.059326171875, 1.23187255859375, 1.4044189453125, 1.57696533203125, 1.74951171875, 1.92205810546875, 2.0946044921875, 2.26715087890625, 2.439697265625, 2.61224365234375, 2.7847900390625, 2.95733642578125, 3.1298828125, 3.30242919921875, 3.4749755859375, 3.64752197265625, 3.820068359375, 3.99261474609375, 4.1651611328125, 4.33770751953125, 4.51025390625, 4.68280029296875, 4.8553466796875, 5.02789306640625, 5.200439453125, 5.37298583984375, 5.5455322265625, 5.71807861328125, 5.890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 11.0, 16.0, 11.0, 10.0, 16.0, 24.0, 23.0, 34.0, 42.0, 47.0, 56.0, 70.0, 53.0, 44.0, 53.0, 42.0, 64.0, 51.0, 49.0, 28.0, 36.0, 36.0, 27.0, 27.0, 22.0, 19.0, 18.0, 10.0, 9.0, 11.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0703125, -2.007537841796875, -1.94476318359375, -1.881988525390625, -1.8192138671875, -1.756439208984375, -1.69366455078125, -1.630889892578125, -1.568115234375, -1.505340576171875, -1.44256591796875, -1.379791259765625, -1.3170166015625, -1.254241943359375, -1.19146728515625, -1.128692626953125, -1.06591796875, -1.003143310546875, -0.94036865234375, -0.877593994140625, -0.8148193359375, -0.752044677734375, -0.68927001953125, -0.626495361328125, -0.563720703125, -0.500946044921875, -0.43817138671875, -0.375396728515625, -0.3126220703125, -0.249847412109375, -0.18707275390625, -0.124298095703125, -0.0615234375, 0.001251220703125, 0.06402587890625, 0.126800537109375, 0.1895751953125, 0.252349853515625, 0.31512451171875, 0.377899169921875, 0.440673828125, 0.503448486328125, 0.56622314453125, 0.628997802734375, 0.6917724609375, 0.754547119140625, 0.81732177734375, 0.880096435546875, 0.94287109375, 1.005645751953125, 1.06842041015625, 1.131195068359375, 1.1939697265625, 1.256744384765625, 1.31951904296875, 1.382293701171875, 1.445068359375, 1.507843017578125, 1.57061767578125, 1.633392333984375, 1.6961669921875, 1.758941650390625, 1.82171630859375, 1.884490966796875, 1.947265625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 15.0, 17.0, 22.0, 17.0, 22.0, 28.0, 29.0, 37.0, 43.0, 42.0, 60.0, 74.0, 57.0, 51.0, 68.0, 56.0, 62.0, 58.0, 42.0, 40.0, 27.0, 32.0, 30.0, 12.0, 12.0, 9.0, 10.0, 5.0, 9.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96094512939453, -18.245296478271484, -17.529647827148438, -16.81399917602539, -16.098350524902344, -15.382701873779297, -14.667054176330566, -13.95140552520752, -13.235756874084473, -12.520108222961426, -11.804459571838379, -11.088811874389648, -10.373163223266602, -9.657514572143555, -8.941865921020508, -8.226217269897461, -7.510568618774414, -6.794919967651367, -6.07927131652832, -5.363623142242432, -4.647974491119385, -3.932325839996338, -3.216677665710449, -2.5010290145874023, -1.7853803634643555, -1.0697318315505981, -0.3540832996368408, 0.36156511306762695, 1.0772137641906738, 1.7928624153137207, 2.5085105895996094, 3.2241592407226562, 3.939809799194336, 4.655458450317383, 5.37110710144043, 6.086755275726318, 6.802403926849365, 7.518052577972412, 8.2337007522583, 8.949349403381348, 9.664998054504395, 10.380646705627441, 11.096295356750488, 11.811943054199219, 12.527591705322266, 13.243240356445312, 13.95888900756836, 14.674537658691406, 15.390186309814453, 16.1058349609375, 16.821483612060547, 17.537132263183594, 18.25278091430664, 18.968429565429688, 19.684078216552734, 20.39972686767578, 21.115375518798828, 21.831024169921875, 22.546672821044922, 23.26232147216797, 23.977970123291016, 24.693618774414062, 25.40926742553711, 26.124916076660156, 26.84056282043457]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 7.0, 5.0, 12.0, 8.0, 17.0, 16.0, 19.0, 12.0, 26.0, 22.0, 31.0, 20.0, 30.0, 33.0, 43.0, 36.0, 36.0, 54.0, 35.0, 47.0, 29.0, 40.0, 47.0, 34.0, 29.0, 47.0, 30.0, 26.0, 33.0, 30.0, 26.0, 12.0, 20.0, 12.0, 17.0, 11.0, 9.0, 12.0, 4.0, 8.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.36363983154297, -20.685218811035156, -20.006799697875977, -19.328378677368164, -18.649959564208984, -17.971538543701172, -17.29311752319336, -16.614696502685547, -15.936277389526367, -15.257857322692871, -14.579437255859375, -13.901016235351562, -13.222596168518066, -12.54417610168457, -11.865755081176758, -11.187335014343262, -10.508914947509766, -9.83049488067627, -9.152074813842773, -8.473653793334961, -7.795233726501465, -7.116813659667969, -6.4383931159973145, -5.75997257232666, -5.081552505493164, -4.403132438659668, -3.7247118949890137, -3.0462915897369385, -2.3678712844848633, -1.689450979232788, -1.011030673980713, -0.3326101303100586, 0.3458099365234375, 1.0242302417755127, 1.702650547027588, 2.381070852279663, 3.0594911575317383, 3.7379114627838135, 4.416331768035889, 5.094752311706543, 5.773172378540039, 6.451592445373535, 7.1300129890441895, 7.808433532714844, 8.48685359954834, 9.165273666381836, 9.843694686889648, 10.522114753723145, 11.20053482055664, 11.878954887390137, 12.557374954223633, 13.235795974731445, 13.914216041564941, 14.592636108398438, 15.27105712890625, 15.949477195739746, 16.627897262573242, 17.306318283081055, 17.984737396240234, 18.663158416748047, 19.34157943725586, 20.01999855041504, 20.69841957092285, 21.37683868408203, 22.055259704589844]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 15.0, 26.0, 52.0, 108.0, 154.0, 278.0, 425.0, 716.0, 1188.0, 2023.0, 3394.0, 5699.0, 9504.0, 15510.0, 25224.0, 40346.0, 63198.0, 97695.0, 144028.0, 207125.0, 278330.0, 354533.0, 419767.0, 456007.0, 452318.0, 411035.0, 346091.0, 268225.0, 197709.0, 137510.0, 93532.0, 60711.0, 38450.0, 24403.0, 15015.0, 9279.0, 5757.0, 3538.0, 2158.0, 1281.0, 771.0, 448.0, 297.0, 159.0, 87.0, 56.0, 42.0, 28.0, 15.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-13.8125, -13.3800048828125, -12.947509765625, -12.5150146484375, -12.08251953125, -11.6500244140625, -11.217529296875, -10.7850341796875, -10.3525390625, -9.9200439453125, -9.487548828125, -9.0550537109375, -8.62255859375, -8.1900634765625, -7.757568359375, -7.3250732421875, -6.892578125, -6.4600830078125, -6.027587890625, -5.5950927734375, -5.16259765625, -4.7301025390625, -4.297607421875, -3.8651123046875, -3.4326171875, -3.0001220703125, -2.567626953125, -2.1351318359375, -1.70263671875, -1.2701416015625, -0.837646484375, -0.4051513671875, 0.02734375, 0.4598388671875, 0.892333984375, 1.3248291015625, 1.75732421875, 2.1898193359375, 2.622314453125, 3.0548095703125, 3.4873046875, 3.9197998046875, 4.352294921875, 4.7847900390625, 5.21728515625, 5.6497802734375, 6.082275390625, 6.5147705078125, 6.947265625, 7.3797607421875, 7.812255859375, 8.2447509765625, 8.67724609375, 9.1097412109375, 9.542236328125, 9.9747314453125, 10.4072265625, 10.8397216796875, 11.272216796875, 11.7047119140625, 12.13720703125, 12.5697021484375, 13.002197265625, 13.4346923828125, 13.8671875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 8.0, 8.0, 7.0, 9.0, 16.0, 7.0, 19.0, 19.0, 17.0, 28.0, 28.0, 31.0, 34.0, 36.0, 32.0, 41.0, 47.0, 38.0, 30.0, 39.0, 36.0, 41.0, 29.0, 46.0, 40.0, 35.0, 25.0, 39.0, 32.0, 23.0, 16.0, 21.0, 15.0, 17.0, 8.0, 20.0, 10.0, 12.0, 6.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.109375, -16.585693359375, -16.06201171875, -15.538330078125, -15.0146484375, -14.490966796875, -13.96728515625, -13.443603515625, -12.919921875, -12.396240234375, -11.87255859375, -11.348876953125, -10.8251953125, -10.301513671875, -9.77783203125, -9.254150390625, -8.73046875, -8.206787109375, -7.68310546875, -7.159423828125, -6.6357421875, -6.112060546875, -5.58837890625, -5.064697265625, -4.541015625, -4.017333984375, -3.49365234375, -2.969970703125, -2.4462890625, -1.922607421875, -1.39892578125, -0.875244140625, -0.3515625, 0.172119140625, 0.69580078125, 1.219482421875, 1.7431640625, 2.266845703125, 2.79052734375, 3.314208984375, 3.837890625, 4.361572265625, 4.88525390625, 5.408935546875, 5.9326171875, 6.456298828125, 6.97998046875, 7.503662109375, 8.02734375, 8.551025390625, 9.07470703125, 9.598388671875, 10.1220703125, 10.645751953125, 11.16943359375, 11.693115234375, 12.216796875, 12.740478515625, 13.26416015625, 13.787841796875, 14.3115234375, 14.835205078125, 15.35888671875, 15.882568359375, 16.40625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 15.0, 13.0, 29.0, 42.0, 95.0, 165.0, 328.0, 573.0, 1027.0, 1897.0, 3506.0, 6094.0, 10951.0, 19280.0, 31882.0, 53592.0, 85637.0, 131601.0, 193207.0, 265260.0, 342417.0, 411167.0, 454394.0, 460554.0, 430210.0, 368847.0, 294363.0, 217866.0, 152551.0, 100705.0, 63536.0, 39107.0, 22955.0, 13387.0, 7646.0, 4245.0, 2323.0, 1296.0, 689.0, 362.0, 217.0, 112.0, 64.0, 42.0, 25.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.734375, -15.2740478515625, -14.813720703125, -14.3533935546875, -13.89306640625, -13.4327392578125, -12.972412109375, -12.5120849609375, -12.0517578125, -11.5914306640625, -11.131103515625, -10.6707763671875, -10.21044921875, -9.7501220703125, -9.289794921875, -8.8294677734375, -8.369140625, -7.9088134765625, -7.448486328125, -6.9881591796875, -6.52783203125, -6.0675048828125, -5.607177734375, -5.1468505859375, -4.6865234375, -4.2261962890625, -3.765869140625, -3.3055419921875, -2.84521484375, -2.3848876953125, -1.924560546875, -1.4642333984375, -1.00390625, -0.5435791015625, -0.083251953125, 0.3770751953125, 0.83740234375, 1.2977294921875, 1.758056640625, 2.2183837890625, 2.6787109375, 3.1390380859375, 3.599365234375, 4.0596923828125, 4.52001953125, 4.9803466796875, 5.440673828125, 5.9010009765625, 6.361328125, 6.8216552734375, 7.281982421875, 7.7423095703125, 8.20263671875, 8.6629638671875, 9.123291015625, 9.5836181640625, 10.0439453125, 10.5042724609375, 10.964599609375, 11.4249267578125, 11.88525390625, 12.3455810546875, 12.805908203125, 13.2662353515625, 13.7265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 6.0, 10.0, 7.0, 12.0, 15.0, 29.0, 38.0, 42.0, 53.0, 62.0, 99.0, 111.0, 127.0, 161.0, 170.0, 210.0, 209.0, 232.0, 248.0, 223.0, 249.0, 224.0, 199.0, 188.0, 198.0, 174.0, 140.0, 114.0, 102.0, 97.0, 74.0, 61.0, 46.0, 33.0, 32.0, 19.0, 12.0, 14.0, 6.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.4873046875, -8.193359375, -7.8994140625, -7.60546875, -7.3115234375, -7.017578125, -6.7236328125, -6.4296875, -6.1357421875, -5.841796875, -5.5478515625, -5.25390625, -4.9599609375, -4.666015625, -4.3720703125, -4.078125, -3.7841796875, -3.490234375, -3.1962890625, -2.90234375, -2.6083984375, -2.314453125, -2.0205078125, -1.7265625, -1.4326171875, -1.138671875, -0.8447265625, -0.55078125, -0.2568359375, 0.037109375, 0.3310546875, 0.625, 0.9189453125, 1.212890625, 1.5068359375, 1.80078125, 2.0947265625, 2.388671875, 2.6826171875, 2.9765625, 3.2705078125, 3.564453125, 3.8583984375, 4.15234375, 4.4462890625, 4.740234375, 5.0341796875, 5.328125, 5.6220703125, 5.916015625, 6.2099609375, 6.50390625, 6.7978515625, 7.091796875, 7.3857421875, 7.6796875, 7.9736328125, 8.267578125, 8.5615234375, 8.85546875, 9.1494140625, 9.443359375, 9.7373046875, 10.03125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 11.0, 10.0, 10.0, 18.0, 20.0, 24.0, 26.0, 17.0, 27.0, 33.0, 38.0, 45.0, 52.0, 46.0, 53.0, 58.0, 39.0, 43.0, 59.0, 49.0, 47.0, 34.0, 33.0, 35.0, 37.0, 29.0, 27.0, 11.0, 8.0, 13.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.399248123168945, -17.771133422851562, -17.143016815185547, -16.51490020751953, -15.886785507202148, -15.25866985321045, -14.63055419921875, -14.00243854522705, -13.374322891235352, -12.746207237243652, -12.118091583251953, -11.489975929260254, -10.861860275268555, -10.233744621276855, -9.605628967285156, -8.977513313293457, -8.349397659301758, -7.721282005310059, -7.093166351318359, -6.46505069732666, -5.836935043334961, -5.208819389343262, -4.5807037353515625, -3.9525880813598633, -3.324472427368164, -2.696356773376465, -2.0682411193847656, -1.4401254653930664, -0.8120098114013672, -0.18389415740966797, 0.44422149658203125, 1.0723371505737305, 1.7004528045654297, 2.328568458557129, 2.956684112548828, 3.5847997665405273, 4.212915420532227, 4.841031074523926, 5.469146728515625, 6.097262382507324, 6.725378036499023, 7.353493690490723, 7.981609344482422, 8.609724998474121, 9.23784065246582, 9.86595630645752, 10.494071960449219, 11.122187614440918, 11.750303268432617, 12.378418922424316, 13.006534576416016, 13.634650230407715, 14.262765884399414, 14.890881538391113, 15.518997192382812, 16.147113800048828, 16.77522850036621, 17.403343200683594, 18.03145980834961, 18.659576416015625, 19.287691116333008, 19.91580581665039, 20.543922424316406, 21.172039031982422, 21.800153732299805]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 11.0, 4.0, 4.0, 6.0, 10.0, 12.0, 20.0, 13.0, 14.0, 18.0, 12.0, 16.0, 26.0, 22.0, 31.0, 37.0, 27.0, 37.0, 35.0, 40.0, 38.0, 34.0, 60.0, 34.0, 36.0, 36.0, 43.0, 35.0, 34.0, 34.0, 29.0, 26.0, 26.0, 20.0, 11.0, 21.0, 8.0, 11.0, 17.0, 13.0, 10.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.7728214263916, -19.141103744506836, -18.509384155273438, -17.877666473388672, -17.245948791503906, -16.614229202270508, -15.982511520385742, -15.35079288482666, -14.719074249267578, -14.087355613708496, -13.455636978149414, -12.823919296264648, -12.192200660705566, -11.560482025146484, -10.928764343261719, -10.297045707702637, -9.665327072143555, -9.033608436584473, -8.40188980102539, -7.770172119140625, -7.138453483581543, -6.506734848022461, -5.875016689300537, -5.243298530578613, -4.611579895019531, -3.9798614978790283, -3.3481431007385254, -2.7164247035980225, -2.0847063064575195, -1.4529879093170166, -0.8212695121765137, -0.18955135345458984, 0.4421672821044922, 1.0738856792449951, 1.705604076385498, 2.337322473526001, 2.969040870666504, 3.600759267807007, 4.23247766494751, 4.864195823669434, 5.495914459228516, 6.127633094787598, 6.7593512535095215, 7.391069412231445, 8.022788047790527, 8.65450668334961, 9.286224365234375, 9.917943000793457, 10.549661636352539, 11.181380271911621, 11.813098907470703, 12.444816589355469, 13.07653522491455, 13.708253860473633, 14.339971542358398, 14.97169017791748, 15.603408813476562, 16.235126495361328, 16.866846084594727, 17.498563766479492, 18.13028335571289, 18.762001037597656, 19.393718719482422, 20.025436401367188, 20.657155990600586]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 8.0, 5.0, 12.0, 19.0, 21.0, 48.0, 56.0, 89.0, 175.0, 214.0, 304.0, 500.0, 722.0, 1214.0, 2108.0, 3596.0, 6025.0, 10308.0, 17840.0, 31673.0, 56146.0, 99675.0, 177618.0, 241908.0, 173177.0, 97139.0, 54638.0, 30763.0, 17581.0, 10148.0, 5915.0, 3476.0, 2036.0, 1204.0, 829.0, 496.0, 306.0, 198.0, 121.0, 82.0, 55.0, 38.0, 18.0, 17.0, 11.0, 14.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.921875, -2.8319091796875, -2.741943359375, -2.6519775390625, -2.56201171875, -2.4720458984375, -2.382080078125, -2.2921142578125, -2.2021484375, -2.1121826171875, -2.022216796875, -1.9322509765625, -1.84228515625, -1.7523193359375, -1.662353515625, -1.5723876953125, -1.482421875, -1.3924560546875, -1.302490234375, -1.2125244140625, -1.12255859375, -1.0325927734375, -0.942626953125, -0.8526611328125, -0.7626953125, -0.6727294921875, -0.582763671875, -0.4927978515625, -0.40283203125, -0.3128662109375, -0.222900390625, -0.1329345703125, -0.04296875, 0.0469970703125, 0.136962890625, 0.2269287109375, 0.31689453125, 0.4068603515625, 0.496826171875, 0.5867919921875, 0.6767578125, 0.7667236328125, 0.856689453125, 0.9466552734375, 1.03662109375, 1.1265869140625, 1.216552734375, 1.3065185546875, 1.396484375, 1.4864501953125, 1.576416015625, 1.6663818359375, 1.75634765625, 1.8463134765625, 1.936279296875, 2.0262451171875, 2.1162109375, 2.2061767578125, 2.296142578125, 2.3861083984375, 2.47607421875, 2.5660400390625, 2.656005859375, 2.7459716796875, 2.8359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 1.0, 12.0, 9.0, 6.0, 7.0, 11.0, 10.0, 15.0, 14.0, 16.0, 25.0, 22.0, 22.0, 24.0, 29.0, 40.0, 28.0, 41.0, 37.0, 42.0, 50.0, 47.0, 35.0, 34.0, 48.0, 47.0, 45.0, 36.0, 36.0, 22.0, 27.0, 25.0, 24.0, 21.0, 14.0, 15.0, 17.0, 12.0, 8.0, 6.0, 10.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-22.578125, -21.8779296875, -21.177734375, -20.4775390625, -19.77734375, -19.0771484375, -18.376953125, -17.6767578125, -16.9765625, -16.2763671875, -15.576171875, -14.8759765625, -14.17578125, -13.4755859375, -12.775390625, -12.0751953125, -11.375, -10.6748046875, -9.974609375, -9.2744140625, -8.57421875, -7.8740234375, -7.173828125, -6.4736328125, -5.7734375, -5.0732421875, -4.373046875, -3.6728515625, -2.97265625, -2.2724609375, -1.572265625, -0.8720703125, -0.171875, 0.5283203125, 1.228515625, 1.9287109375, 2.62890625, 3.3291015625, 4.029296875, 4.7294921875, 5.4296875, 6.1298828125, 6.830078125, 7.5302734375, 8.23046875, 8.9306640625, 9.630859375, 10.3310546875, 11.03125, 11.7314453125, 12.431640625, 13.1318359375, 13.83203125, 14.5322265625, 15.232421875, 15.9326171875, 16.6328125, 17.3330078125, 18.033203125, 18.7333984375, 19.43359375, 20.1337890625, 20.833984375, 21.5341796875, 22.234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 6.0, 2.0, 7.0, 14.0, 19.0, 42.0, 47.0, 81.0, 118.0, 140.0, 245.0, 292.0, 428.0, 610.0, 816.0, 1250.0, 1746.0, 2475.0, 3761.0, 5452.0, 8132.0, 12021.0, 18502.0, 28575.0, 44889.0, 69923.0, 108306.0, 159515.0, 184727.0, 137655.0, 91148.0, 58447.0, 37118.0, 23797.0, 15731.0, 10429.0, 6952.0, 4619.0, 3123.0, 2209.0, 1527.0, 1104.0, 734.0, 562.0, 390.0, 267.0, 198.0, 121.0, 74.0, 74.0, 42.0, 32.0, 23.0, 16.0, 11.0, 9.0, 4.0, 5.0, 1.0, 3.0], "bins": [-2.322265625, -2.2503662109375, -2.178466796875, -2.1065673828125, -2.03466796875, -1.9627685546875, -1.890869140625, -1.8189697265625, -1.7470703125, -1.6751708984375, -1.603271484375, -1.5313720703125, -1.45947265625, -1.3875732421875, -1.315673828125, -1.2437744140625, -1.171875, -1.0999755859375, -1.028076171875, -0.9561767578125, -0.88427734375, -0.8123779296875, -0.740478515625, -0.6685791015625, -0.5966796875, -0.5247802734375, -0.452880859375, -0.3809814453125, -0.30908203125, -0.2371826171875, -0.165283203125, -0.0933837890625, -0.021484375, 0.0504150390625, 0.122314453125, 0.1942138671875, 0.26611328125, 0.3380126953125, 0.409912109375, 0.4818115234375, 0.5537109375, 0.6256103515625, 0.697509765625, 0.7694091796875, 0.84130859375, 0.9132080078125, 0.985107421875, 1.0570068359375, 1.12890625, 1.2008056640625, 1.272705078125, 1.3446044921875, 1.41650390625, 1.4884033203125, 1.560302734375, 1.6322021484375, 1.7041015625, 1.7760009765625, 1.847900390625, 1.9197998046875, 1.99169921875, 2.0635986328125, 2.135498046875, 2.2073974609375, 2.279296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 10.0, 9.0, 12.0, 9.0, 15.0, 16.0, 13.0, 17.0, 20.0, 20.0, 25.0, 27.0, 27.0, 30.0, 43.0, 34.0, 33.0, 38.0, 27.0, 39.0, 42.0, 33.0, 32.0, 33.0, 44.0, 38.0, 31.0, 47.0, 27.0, 31.0, 16.0, 22.0, 23.0, 21.0, 19.0, 15.0, 17.0, 7.0, 5.0, 5.0, 4.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.03125, -12.62060546875, -12.2099609375, -11.79931640625, -11.388671875, -10.97802734375, -10.5673828125, -10.15673828125, -9.74609375, -9.33544921875, -8.9248046875, -8.51416015625, -8.103515625, -7.69287109375, -7.2822265625, -6.87158203125, -6.4609375, -6.05029296875, -5.6396484375, -5.22900390625, -4.818359375, -4.40771484375, -3.9970703125, -3.58642578125, -3.17578125, -2.76513671875, -2.3544921875, -1.94384765625, -1.533203125, -1.12255859375, -0.7119140625, -0.30126953125, 0.109375, 0.52001953125, 0.9306640625, 1.34130859375, 1.751953125, 2.16259765625, 2.5732421875, 2.98388671875, 3.39453125, 3.80517578125, 4.2158203125, 4.62646484375, 5.037109375, 5.44775390625, 5.8583984375, 6.26904296875, 6.6796875, 7.09033203125, 7.5009765625, 7.91162109375, 8.322265625, 8.73291015625, 9.1435546875, 9.55419921875, 9.96484375, 10.37548828125, 10.7861328125, 11.19677734375, 11.607421875, 12.01806640625, 12.4287109375, 12.83935546875, 13.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 14.0, 24.0, 28.0, 40.0, 68.0, 97.0, 168.0, 227.0, 338.0, 442.0, 588.0, 904.0, 1252.0, 1860.0, 2630.0, 3798.0, 5746.0, 8560.0, 12678.0, 19622.0, 31580.0, 51378.0, 87911.0, 159484.0, 239696.0, 172642.0, 95173.0, 55230.0, 33325.0, 21286.0, 13497.0, 8921.0, 5941.0, 4220.0, 2758.0, 1985.0, 1325.0, 947.0, 671.0, 448.0, 305.0, 218.0, 164.0, 122.0, 95.0, 49.0, 30.0, 33.0, 11.0, 8.0, 8.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.08154296875, -0.07911396026611328, -0.07668495178222656, -0.07425594329833984, -0.07182693481445312, -0.0693979263305664, -0.06696891784667969, -0.06453990936279297, -0.06211090087890625, -0.05968189239501953, -0.05725288391113281, -0.054823875427246094, -0.052394866943359375, -0.049965858459472656, -0.04753684997558594, -0.04510784149169922, -0.0426788330078125, -0.04024982452392578, -0.03782081604003906, -0.035391807556152344, -0.032962799072265625, -0.030533790588378906, -0.028104782104492188, -0.02567577362060547, -0.02324676513671875, -0.02081775665283203, -0.018388748168945312, -0.015959739685058594, -0.013530731201171875, -0.011101722717285156, -0.008672714233398438, -0.006243705749511719, -0.003814697265625, -0.0013856887817382812, 0.0010433197021484375, 0.0034723281860351562, 0.005901336669921875, 0.008330345153808594, 0.010759353637695312, 0.013188362121582031, 0.01561737060546875, 0.01804637908935547, 0.020475387573242188, 0.022904396057128906, 0.025333404541015625, 0.027762413024902344, 0.030191421508789062, 0.03262042999267578, 0.0350494384765625, 0.03747844696044922, 0.03990745544433594, 0.042336463928222656, 0.044765472412109375, 0.047194480895996094, 0.04962348937988281, 0.05205249786376953, 0.05448150634765625, 0.05691051483154297, 0.05933952331542969, 0.061768531799316406, 0.06419754028320312, 0.06662654876708984, 0.06905555725097656, 0.07148456573486328, 0.07391357421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 7.0, 8.0, 8.0, 14.0, 15.0, 15.0, 14.0, 25.0, 19.0, 24.0, 31.0, 41.0, 41.0, 36.0, 34.0, 40.0, 36.0, 32.0, 42.0, 35.0, 39.0, 61.0, 34.0, 33.0, 27.0, 32.0, 37.0, 30.0, 31.0, 18.0, 20.0, 25.0, 11.0, 18.0, 16.0, 11.0, 11.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.627206802368164e-05, -1.5798956155776978e-05, -1.5325844287872314e-05, -1.4852732419967651e-05, -1.4379620552062988e-05, -1.3906508684158325e-05, -1.3433396816253662e-05, -1.2960284948348999e-05, -1.2487173080444336e-05, -1.2014061212539673e-05, -1.154094934463501e-05, -1.1067837476730347e-05, -1.0594725608825684e-05, -1.012161374092102e-05, -9.648501873016357e-06, -9.175390005111694e-06, -8.702278137207031e-06, -8.229166269302368e-06, -7.756054401397705e-06, -7.282942533493042e-06, -6.809830665588379e-06, -6.336718797683716e-06, -5.863606929779053e-06, -5.39049506187439e-06, -4.9173831939697266e-06, -4.4442713260650635e-06, -3.9711594581604e-06, -3.4980475902557373e-06, -3.0249357223510742e-06, -2.551823854446411e-06, -2.078711986541748e-06, -1.605600118637085e-06, -1.1324882507324219e-06, -6.593763828277588e-07, -1.862645149230957e-07, 2.868473529815674e-07, 7.599592208862305e-07, 1.2330710887908936e-06, 1.7061829566955566e-06, 2.1792948246002197e-06, 2.652406692504883e-06, 3.125518560409546e-06, 3.598630428314209e-06, 4.071742296218872e-06, 4.544854164123535e-06, 5.017966032028198e-06, 5.491077899932861e-06, 5.964189767837524e-06, 6.4373016357421875e-06, 6.910413503646851e-06, 7.383525371551514e-06, 7.856637239456177e-06, 8.32974910736084e-06, 8.802860975265503e-06, 9.275972843170166e-06, 9.749084711074829e-06, 1.0222196578979492e-05, 1.0695308446884155e-05, 1.1168420314788818e-05, 1.1641532182693481e-05, 1.2114644050598145e-05, 1.2587755918502808e-05, 1.306086778640747e-05, 1.3533979654312134e-05, 1.4007091522216797e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 17.0, 17.0, 31.0, 51.0, 93.0, 125.0, 177.0, 252.0, 400.0, 633.0, 983.0, 1566.0, 2513.0, 3969.0, 6511.0, 10797.0, 17774.0, 29792.0, 51994.0, 93747.0, 185238.0, 293460.0, 155028.0, 80929.0, 45333.0, 26378.0, 15666.0, 9543.0, 5854.0, 3560.0, 2172.0, 1338.0, 923.0, 521.0, 383.0, 257.0, 155.0, 109.0, 75.0, 57.0, 38.0, 21.0, 14.0, 16.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1885986328125, -0.1825885772705078, -0.17657852172851562, -0.17056846618652344, -0.16455841064453125, -0.15854835510253906, -0.15253829956054688, -0.1465282440185547, -0.1405181884765625, -0.1345081329345703, -0.12849807739257812, -0.12248802185058594, -0.11647796630859375, -0.11046791076660156, -0.10445785522460938, -0.09844779968261719, -0.092437744140625, -0.08642768859863281, -0.08041763305664062, -0.07440757751464844, -0.06839752197265625, -0.06238746643066406, -0.056377410888671875, -0.05036735534667969, -0.0443572998046875, -0.03834724426269531, -0.032337188720703125, -0.026327133178710938, -0.02031707763671875, -0.014307022094726562, -0.008296966552734375, -0.0022869110107421875, 0.00372314453125, 0.009733200073242188, 0.015743255615234375, 0.021753311157226562, 0.02776336669921875, 0.03377342224121094, 0.039783477783203125, 0.04579353332519531, 0.0518035888671875, 0.05781364440917969, 0.06382369995117188, 0.06983375549316406, 0.07584381103515625, 0.08185386657714844, 0.08786392211914062, 0.09387397766113281, 0.099884033203125, 0.10589408874511719, 0.11190414428710938, 0.11791419982910156, 0.12392425537109375, 0.12993431091308594, 0.13594436645507812, 0.1419544219970703, 0.1479644775390625, 0.1539745330810547, 0.15998458862304688, 0.16599464416503906, 0.17200469970703125, 0.17801475524902344, 0.18402481079101562, 0.1900348663330078, 0.196044921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 5.0, 9.0, 8.0, 12.0, 14.0, 14.0, 16.0, 26.0, 30.0, 32.0, 51.0, 93.0, 136.0, 138.0, 117.0, 81.0, 36.0, 38.0, 32.0, 19.0, 20.0, 19.0, 8.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.1013174057006836, -0.09759330749511719, -0.09386920928955078, -0.09014511108398438, -0.08642101287841797, -0.08269691467285156, -0.07897281646728516, -0.07524871826171875, -0.07152462005615234, -0.06780052185058594, -0.06407642364501953, -0.060352325439453125, -0.05662822723388672, -0.05290412902832031, -0.049180030822753906, -0.0454559326171875, -0.041731834411621094, -0.03800773620605469, -0.03428363800048828, -0.030559539794921875, -0.02683544158935547, -0.023111343383789062, -0.019387245178222656, -0.01566314697265625, -0.011939048767089844, -0.008214950561523438, -0.004490852355957031, -0.000766754150390625, 0.0029573440551757812, 0.0066814422607421875, 0.010405540466308594, 0.014129638671875, 0.017853736877441406, 0.021577835083007812, 0.02530193328857422, 0.029026031494140625, 0.03275012969970703, 0.03647422790527344, 0.040198326110839844, 0.04392242431640625, 0.047646522521972656, 0.05137062072753906, 0.05509471893310547, 0.058818817138671875, 0.06254291534423828, 0.06626701354980469, 0.0699911117553711, 0.0737152099609375, 0.0774393081665039, 0.08116340637207031, 0.08488750457763672, 0.08861160278320312, 0.09233570098876953, 0.09605979919433594, 0.09978389739990234, 0.10350799560546875, 0.10723209381103516, 0.11095619201660156, 0.11468029022216797, 0.11840438842773438, 0.12212848663330078, 0.1258525848388672, 0.1295766830444336, 0.13330078125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 8.0, 18.0, 17.0, 28.0, 22.0, 20.0, 31.0, 29.0, 34.0, 45.0, 60.0, 41.0, 55.0, 54.0, 39.0, 44.0, 59.0, 48.0, 44.0, 34.0, 41.0, 31.0, 30.0, 35.0, 28.0, 13.0, 10.0, 12.0, 12.0, 5.0, 2.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.31485366821289, -17.69188690185547, -17.06892204284668, -16.44595718383789, -15.822990417480469, -15.200024604797363, -14.577058792114258, -13.954092979431152, -13.331127166748047, -12.708161354064941, -12.085195541381836, -11.46222972869873, -10.839263916015625, -10.21629810333252, -9.593332290649414, -8.970366477966309, -8.347400665283203, -7.724434852600098, -7.101469039916992, -6.478503227233887, -5.855537414550781, -5.232571601867676, -4.60960578918457, -3.986639976501465, -3.3636741638183594, -2.740708351135254, -2.1177425384521484, -1.494776725769043, -0.8718109130859375, -0.24884510040283203, 0.37412071228027344, 0.9970865249633789, 1.6200523376464844, 2.24301815032959, 2.8659839630126953, 3.488949775695801, 4.111915588378906, 4.734881401062012, 5.357847213745117, 5.980813026428223, 6.603778839111328, 7.226744651794434, 7.849710464477539, 8.472676277160645, 9.09564208984375, 9.718607902526855, 10.341573715209961, 10.964539527893066, 11.587505340576172, 12.210471153259277, 12.833436965942383, 13.456402778625488, 14.079368591308594, 14.7023344039917, 15.325300216674805, 15.94826602935791, 16.571231842041016, 17.194198608398438, 17.817163467407227, 18.440128326416016, 19.063095092773438, 19.68606185913086, 20.30902671813965, 20.931991577148438, 21.55495834350586]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 3.0, 6.0, 10.0, 14.0, 19.0, 12.0, 15.0, 17.0, 12.0, 16.0, 27.0, 21.0, 30.0, 38.0, 28.0, 35.0, 37.0, 39.0, 40.0, 34.0, 58.0, 35.0, 34.0, 41.0, 39.0, 36.0, 33.0, 36.0, 30.0, 23.0, 25.0, 22.0, 11.0, 19.0, 9.0, 12.0, 18.0, 11.0, 10.0, 10.0, 5.0, 7.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.883899688720703, -19.253053665161133, -18.622207641601562, -17.991361618041992, -17.360515594482422, -16.72966766357422, -16.09882164001465, -15.467975616455078, -14.837129592895508, -14.206283569335938, -13.575437545776367, -12.94459056854248, -12.31374454498291, -11.68289852142334, -11.052051544189453, -10.421205520629883, -9.790359497070312, -9.159513473510742, -8.528667449951172, -7.897820472717285, -7.266974449157715, -6.6361284255981445, -6.005281925201416, -5.3744354248046875, -4.743589401245117, -4.112743377685547, -3.4818968772888184, -2.851050615310669, -2.2202043533325195, -1.5893580913543701, -0.9585118293762207, -0.3276653289794922, 0.30318260192871094, 0.9340288639068604, 1.5648751258850098, 2.195721387863159, 2.8265676498413086, 3.457413911819458, 4.088260173797607, 4.719106674194336, 5.349952697753906, 5.980798721313477, 6.611645221710205, 7.242491722106934, 7.873337745666504, 8.504183769226074, 9.135030746459961, 9.765876770019531, 10.396722793579102, 11.027568817138672, 11.658414840698242, 12.289261817932129, 12.9201078414917, 13.55095386505127, 14.181800842285156, 14.812646865844727, 15.443492889404297, 16.074338912963867, 16.705184936523438, 17.336030960083008, 17.966876983642578, 18.59772491455078, 19.22857093811035, 19.859416961669922, 20.490262985229492]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 13.0, 22.0, 23.0, 33.0, 64.0, 101.0, 156.0, 235.0, 374.0, 598.0, 1001.0, 1456.0, 2331.0, 3530.0, 5484.0, 8300.0, 12255.0, 18240.0, 26383.0, 36489.0, 49250.0, 63282.0, 76745.0, 88672.0, 96671.0, 99122.0, 94425.0, 85322.0, 72040.0, 57836.0, 44300.0, 32570.0, 23518.0, 16132.0, 11041.0, 7289.0, 4684.0, 3065.0, 2031.0, 1223.0, 832.0, 527.0, 312.0, 195.0, 145.0, 88.0, 58.0, 34.0, 23.0, 12.0, 5.0, 6.0, 5.0, 3.0, 2.0, 4.0], "bins": [-10.5703125, -10.253173828125, -9.93603515625, -9.618896484375, -9.3017578125, -8.984619140625, -8.66748046875, -8.350341796875, -8.033203125, -7.716064453125, -7.39892578125, -7.081787109375, -6.7646484375, -6.447509765625, -6.13037109375, -5.813232421875, -5.49609375, -5.178955078125, -4.86181640625, -4.544677734375, -4.2275390625, -3.910400390625, -3.59326171875, -3.276123046875, -2.958984375, -2.641845703125, -2.32470703125, -2.007568359375, -1.6904296875, -1.373291015625, -1.05615234375, -0.739013671875, -0.421875, -0.104736328125, 0.21240234375, 0.529541015625, 0.8466796875, 1.163818359375, 1.48095703125, 1.798095703125, 2.115234375, 2.432373046875, 2.74951171875, 3.066650390625, 3.3837890625, 3.700927734375, 4.01806640625, 4.335205078125, 4.65234375, 4.969482421875, 5.28662109375, 5.603759765625, 5.9208984375, 6.238037109375, 6.55517578125, 6.872314453125, 7.189453125, 7.506591796875, 7.82373046875, 8.140869140625, 8.4580078125, 8.775146484375, 9.09228515625, 9.409423828125, 9.7265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 10.0, 3.0, 8.0, 9.0, 10.0, 15.0, 15.0, 17.0, 19.0, 18.0, 20.0, 17.0, 25.0, 23.0, 28.0, 26.0, 31.0, 35.0, 32.0, 39.0, 38.0, 40.0, 42.0, 37.0, 40.0, 42.0, 38.0, 31.0, 30.0, 21.0, 27.0, 27.0, 29.0, 12.0, 17.0, 15.0, 13.0, 24.0, 13.0, 13.0, 9.0, 8.0, 6.0, 10.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0], "bins": [-18.265625, -17.662841796875, -17.06005859375, -16.457275390625, -15.8544921875, -15.251708984375, -14.64892578125, -14.046142578125, -13.443359375, -12.840576171875, -12.23779296875, -11.635009765625, -11.0322265625, -10.429443359375, -9.82666015625, -9.223876953125, -8.62109375, -8.018310546875, -7.41552734375, -6.812744140625, -6.2099609375, -5.607177734375, -5.00439453125, -4.401611328125, -3.798828125, -3.196044921875, -2.59326171875, -1.990478515625, -1.3876953125, -0.784912109375, -0.18212890625, 0.420654296875, 1.0234375, 1.626220703125, 2.22900390625, 2.831787109375, 3.4345703125, 4.037353515625, 4.64013671875, 5.242919921875, 5.845703125, 6.448486328125, 7.05126953125, 7.654052734375, 8.2568359375, 8.859619140625, 9.46240234375, 10.065185546875, 10.66796875, 11.270751953125, 11.87353515625, 12.476318359375, 13.0791015625, 13.681884765625, 14.28466796875, 14.887451171875, 15.490234375, 16.093017578125, 16.69580078125, 17.298583984375, 17.9013671875, 18.504150390625, 19.10693359375, 19.709716796875, 20.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 17.0, 13.0, 11.0, 17.0, 36.0, 67.0, 66.0, 116.0, 170.0, 317.0, 479.0, 747.0, 1289.0, 2055.0, 3260.0, 5241.0, 8389.0, 13284.0, 20209.0, 30616.0, 42890.0, 58935.0, 76868.0, 93677.0, 105661.0, 109802.0, 106467.0, 94222.0, 78237.0, 60970.0, 44883.0, 31292.0, 21137.0, 13610.0, 8743.0, 5600.0, 3531.0, 2126.0, 1333.0, 847.0, 499.0, 282.0, 198.0, 125.0, 85.0, 48.0, 40.0, 18.0, 8.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.171875, -10.8177490234375, -10.463623046875, -10.1094970703125, -9.75537109375, -9.4012451171875, -9.047119140625, -8.6929931640625, -8.3388671875, -7.9847412109375, -7.630615234375, -7.2764892578125, -6.92236328125, -6.5682373046875, -6.214111328125, -5.8599853515625, -5.505859375, -5.1517333984375, -4.797607421875, -4.4434814453125, -4.08935546875, -3.7352294921875, -3.381103515625, -3.0269775390625, -2.6728515625, -2.3187255859375, -1.964599609375, -1.6104736328125, -1.25634765625, -0.9022216796875, -0.548095703125, -0.1939697265625, 0.16015625, 0.5142822265625, 0.868408203125, 1.2225341796875, 1.57666015625, 1.9307861328125, 2.284912109375, 2.6390380859375, 2.9931640625, 3.3472900390625, 3.701416015625, 4.0555419921875, 4.40966796875, 4.7637939453125, 5.117919921875, 5.4720458984375, 5.826171875, 6.1802978515625, 6.534423828125, 6.8885498046875, 7.24267578125, 7.5968017578125, 7.950927734375, 8.3050537109375, 8.6591796875, 9.0133056640625, 9.367431640625, 9.7215576171875, 10.07568359375, 10.4298095703125, 10.783935546875, 11.1380615234375, 11.4921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 9.0, 12.0, 6.0, 7.0, 17.0, 23.0, 20.0, 22.0, 32.0, 31.0, 25.0, 37.0, 39.0, 36.0, 40.0, 31.0, 45.0, 44.0, 37.0, 35.0, 41.0, 42.0, 30.0, 33.0, 35.0, 36.0, 33.0, 21.0, 32.0, 19.0, 12.0, 15.0, 14.0, 13.0, 17.0, 6.0, 7.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.1484375, -12.73486328125, -12.3212890625, -11.90771484375, -11.494140625, -11.08056640625, -10.6669921875, -10.25341796875, -9.83984375, -9.42626953125, -9.0126953125, -8.59912109375, -8.185546875, -7.77197265625, -7.3583984375, -6.94482421875, -6.53125, -6.11767578125, -5.7041015625, -5.29052734375, -4.876953125, -4.46337890625, -4.0498046875, -3.63623046875, -3.22265625, -2.80908203125, -2.3955078125, -1.98193359375, -1.568359375, -1.15478515625, -0.7412109375, -0.32763671875, 0.0859375, 0.49951171875, 0.9130859375, 1.32666015625, 1.740234375, 2.15380859375, 2.5673828125, 2.98095703125, 3.39453125, 3.80810546875, 4.2216796875, 4.63525390625, 5.048828125, 5.46240234375, 5.8759765625, 6.28955078125, 6.703125, 7.11669921875, 7.5302734375, 7.94384765625, 8.357421875, 8.77099609375, 9.1845703125, 9.59814453125, 10.01171875, 10.42529296875, 10.8388671875, 11.25244140625, 11.666015625, 12.07958984375, 12.4931640625, 12.90673828125, 13.3203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 11.0, 8.0, 11.0, 11.0, 31.0, 36.0, 60.0, 98.0, 169.0, 245.0, 331.0, 574.0, 884.0, 1286.0, 1978.0, 3123.0, 4745.0, 7142.0, 10565.0, 15509.0, 22149.0, 30728.0, 41333.0, 54231.0, 67386.0, 79845.0, 89514.0, 95441.0, 94959.0, 89130.0, 79092.0, 66790.0, 53046.0, 40852.0, 30142.0, 21716.0, 14851.0, 10364.0, 6972.0, 4571.0, 3005.0, 1963.0, 1267.0, 852.0, 532.0, 356.0, 242.0, 150.0, 107.0, 67.0, 39.0, 18.0, 16.0, 8.0, 7.0, 5.0, 0.0, 2.0, 3.0], "bins": [-3.12890625, -3.03399658203125, -2.9390869140625, -2.84417724609375, -2.749267578125, -2.65435791015625, -2.5594482421875, -2.46453857421875, -2.36962890625, -2.27471923828125, -2.1798095703125, -2.08489990234375, -1.989990234375, -1.89508056640625, -1.8001708984375, -1.70526123046875, -1.6103515625, -1.51544189453125, -1.4205322265625, -1.32562255859375, -1.230712890625, -1.13580322265625, -1.0408935546875, -0.94598388671875, -0.85107421875, -0.75616455078125, -0.6612548828125, -0.56634521484375, -0.471435546875, -0.37652587890625, -0.2816162109375, -0.18670654296875, -0.091796875, 0.00311279296875, 0.0980224609375, 0.19293212890625, 0.287841796875, 0.38275146484375, 0.4776611328125, 0.57257080078125, 0.66748046875, 0.76239013671875, 0.8572998046875, 0.95220947265625, 1.047119140625, 1.14202880859375, 1.2369384765625, 1.33184814453125, 1.4267578125, 1.52166748046875, 1.6165771484375, 1.71148681640625, 1.806396484375, 1.90130615234375, 1.9962158203125, 2.09112548828125, 2.18603515625, 2.28094482421875, 2.3758544921875, 2.47076416015625, 2.565673828125, 2.66058349609375, 2.7554931640625, 2.85040283203125, 2.9453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 0.0, 9.0, 13.0, 9.0, 12.0, 14.0, 17.0, 18.0, 19.0, 21.0, 24.0, 21.0, 33.0, 23.0, 26.0, 36.0, 41.0, 44.0, 51.0, 45.0, 44.0, 46.0, 34.0, 49.0, 46.0, 24.0, 42.0, 30.0, 29.0, 25.0, 22.0, 17.0, 19.0, 12.0, 15.0, 12.0, 10.0, 9.0, 11.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.0003902912139892578, -0.0003788881003856659, -0.000367484986782074, -0.00035608187317848206, -0.00034467875957489014, -0.0003332756459712982, -0.0003218725323677063, -0.0003104694187641144, -0.00029906630516052246, -0.00028766319155693054, -0.0002762600779533386, -0.0002648569643497467, -0.0002534538507461548, -0.00024205073714256287, -0.00023064762353897095, -0.00021924450993537903, -0.0002078413963317871, -0.0001964382827281952, -0.00018503516912460327, -0.00017363205552101135, -0.00016222894191741943, -0.00015082582831382751, -0.0001394227147102356, -0.00012801960110664368, -0.00011661648750305176, -0.00010521337389945984, -9.381026029586792e-05, -8.2407146692276e-05, -7.100403308868408e-05, -5.960091948509216e-05, -4.8197805881500244e-05, -3.6794692277908325e-05, -2.5391578674316406e-05, -1.3988465070724487e-05, -2.5853514671325684e-06, 8.81776213645935e-06, 2.022087574005127e-05, 3.162398934364319e-05, 4.302710294723511e-05, 5.4430216550827026e-05, 6.583333015441895e-05, 7.723644375801086e-05, 8.863955736160278e-05, 0.0001000426709651947, 0.00011144578456878662, 0.00012284889817237854, 0.00013425201177597046, 0.00014565512537956238, 0.0001570582389831543, 0.00016846135258674622, 0.00017986446619033813, 0.00019126757979393005, 0.00020267069339752197, 0.0002140738070011139, 0.0002254769206047058, 0.00023688003420829773, 0.00024828314781188965, 0.00025968626141548157, 0.0002710893750190735, 0.0002824924886226654, 0.0002938956022262573, 0.00030529871582984924, 0.00031670182943344116, 0.0003281049430370331, 0.000339508056640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 21.0, 31.0, 52.0, 84.0, 130.0, 187.0, 287.0, 504.0, 843.0, 1265.0, 2015.0, 3281.0, 5461.0, 8546.0, 13491.0, 20840.0, 31454.0, 45915.0, 63888.0, 82679.0, 100772.0, 111874.0, 115004.0, 107935.0, 92634.0, 73972.0, 54492.0, 38883.0, 25966.0, 16896.0, 10962.0, 6819.0, 4261.0, 2705.0, 1634.0, 1030.0, 663.0, 406.0, 251.0, 153.0, 98.0, 60.0, 36.0, 23.0, 14.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.486328125, -3.3671875, -3.248046875, -3.12890625, -3.009765625, -2.890625, -2.771484375, -2.65234375, -2.533203125, -2.4140625, -2.294921875, -2.17578125, -2.056640625, -1.9375, -1.818359375, -1.69921875, -1.580078125, -1.4609375, -1.341796875, -1.22265625, -1.103515625, -0.984375, -0.865234375, -0.74609375, -0.626953125, -0.5078125, -0.388671875, -0.26953125, -0.150390625, -0.03125, 0.087890625, 0.20703125, 0.326171875, 0.4453125, 0.564453125, 0.68359375, 0.802734375, 0.921875, 1.041015625, 1.16015625, 1.279296875, 1.3984375, 1.517578125, 1.63671875, 1.755859375, 1.875, 1.994140625, 2.11328125, 2.232421875, 2.3515625, 2.470703125, 2.58984375, 2.708984375, 2.828125, 2.947265625, 3.06640625, 3.185546875, 3.3046875, 3.423828125, 3.54296875, 3.662109375, 3.78125, 3.900390625, 4.01953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 10.0, 7.0, 8.0, 20.0, 21.0, 24.0, 25.0, 31.0, 47.0, 56.0, 54.0, 48.0, 44.0, 56.0, 57.0, 49.0, 66.0, 39.0, 57.0, 54.0, 42.0, 37.0, 30.0, 20.0, 26.0, 16.0, 14.0, 11.0, 12.0, 3.0, 6.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.830078125, -2.753265380859375, -2.67645263671875, -2.599639892578125, -2.5228271484375, -2.446014404296875, -2.36920166015625, -2.292388916015625, -2.215576171875, -2.138763427734375, -2.06195068359375, -1.985137939453125, -1.9083251953125, -1.831512451171875, -1.75469970703125, -1.677886962890625, -1.60107421875, -1.524261474609375, -1.44744873046875, -1.370635986328125, -1.2938232421875, -1.217010498046875, -1.14019775390625, -1.063385009765625, -0.986572265625, -0.909759521484375, -0.83294677734375, -0.756134033203125, -0.6793212890625, -0.602508544921875, -0.52569580078125, -0.448883056640625, -0.3720703125, -0.295257568359375, -0.21844482421875, -0.141632080078125, -0.0648193359375, 0.011993408203125, 0.08880615234375, 0.165618896484375, 0.242431640625, 0.319244384765625, 0.39605712890625, 0.472869873046875, 0.5496826171875, 0.626495361328125, 0.70330810546875, 0.780120849609375, 0.85693359375, 0.933746337890625, 1.01055908203125, 1.087371826171875, 1.1641845703125, 1.240997314453125, 1.31781005859375, 1.394622802734375, 1.471435546875, 1.548248291015625, 1.62506103515625, 1.701873779296875, 1.7786865234375, 1.855499267578125, 1.93231201171875, 2.009124755859375, 2.0859375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 5.0, 2.0, 11.0, 9.0, 16.0, 20.0, 28.0, 14.0, 18.0, 39.0, 30.0, 34.0, 52.0, 45.0, 52.0, 61.0, 48.0, 47.0, 53.0, 63.0, 40.0, 49.0, 39.0, 36.0, 42.0, 26.0, 29.0, 26.0, 16.0, 14.0, 9.0, 7.0, 1.0, 2.0, 8.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.092493057250977, -15.434326171875, -14.776158332824707, -14.11799144744873, -13.459823608398438, -12.801656723022461, -12.143489837646484, -11.485321998596191, -10.827154159545898, -10.168987274169922, -9.510819435119629, -8.852652549743652, -8.19448471069336, -7.536317825317383, -6.878150463104248, -6.219983100891113, -5.561816215515137, -4.903648853302002, -4.245481491088867, -3.5873143672943115, -2.9291470050811768, -2.270979642868042, -1.6128125190734863, -0.9546451568603516, -0.2964777946472168, 0.3616895079612732, 1.0198568105697632, 1.6780240535736084, 2.336191415786743, 2.994358777999878, 3.6525259017944336, 4.310693264007568, 4.968860626220703, 5.627027988433838, 6.285195350646973, 6.943362236022949, 7.601530075073242, 8.259696960449219, 8.917863845825195, 9.576031684875488, 10.234199523925781, 10.892366409301758, 11.55053424835205, 12.208701133728027, 12.86686897277832, 13.525035858154297, 14.183202743530273, 14.841370582580566, 15.499537467956543, 16.157705307006836, 16.815872192382812, 17.47403907775879, 18.132205963134766, 18.790374755859375, 19.44854164123535, 20.106708526611328, 20.764875411987305, 21.42304229736328, 22.081209182739258, 22.739377975463867, 23.397544860839844, 24.05571174621582, 24.713878631591797, 25.372047424316406, 26.030214309692383]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 3.0, 4.0, 9.0, 4.0, 11.0, 8.0, 9.0, 14.0, 18.0, 17.0, 17.0, 20.0, 23.0, 23.0, 15.0, 35.0, 31.0, 39.0, 30.0, 45.0, 39.0, 41.0, 48.0, 40.0, 39.0, 43.0, 25.0, 36.0, 30.0, 33.0, 43.0, 21.0, 25.0, 23.0, 14.0, 18.0, 14.0, 15.0, 8.0, 9.0, 11.0, 7.0, 7.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-20.20684242248535, -19.571300506591797, -18.935758590698242, -18.300216674804688, -17.664674758911133, -17.029132843017578, -16.393590927124023, -15.758048057556152, -15.122506141662598, -14.486964225769043, -13.851422309875488, -13.215880393981934, -12.580337524414062, -11.944795608520508, -11.309253692626953, -10.673711776733398, -10.038169860839844, -9.402627944946289, -8.767086029052734, -8.13154411315918, -7.496001720428467, -6.860459804534912, -6.224917411804199, -5.5893754959106445, -4.95383358001709, -4.318291664123535, -3.6827495098114014, -3.0472073554992676, -2.411665439605713, -1.7761235237121582, -1.1405813694000244, -0.5050392150878906, 0.13050079345703125, 0.7660428285598755, 1.4015848636627197, 2.0371270179748535, 2.672668933868408, 3.308210849761963, 3.9437530040740967, 4.5792951583862305, 5.214837074279785, 5.85037899017334, 6.4859209060668945, 7.121463298797607, 7.757005214691162, 8.392547607421875, 9.02808952331543, 9.663631439208984, 10.299173355102539, 10.934715270996094, 11.570257186889648, 12.205799102783203, 12.841341018676758, 13.476882934570312, 14.112425804138184, 14.747967720031738, 15.383509635925293, 16.019052505493164, 16.65459442138672, 17.290136337280273, 17.925678253173828, 18.561220169067383, 19.196762084960938, 19.832304000854492, 20.467845916748047]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 22.0, 25.0, 52.0, 95.0, 153.0, 228.0, 419.0, 706.0, 1123.0, 1815.0, 3134.0, 4998.0, 8445.0, 13603.0, 21781.0, 34397.0, 54142.0, 81541.0, 121214.0, 171528.0, 235083.0, 302159.0, 365451.0, 413921.0, 433064.0, 420231.0, 376944.0, 314370.0, 246913.0, 183809.0, 130368.0, 89640.0, 59312.0, 38188.0, 24482.0, 15777.0, 9749.0, 5942.0, 3654.0, 2279.0, 1374.0, 843.0, 511.0, 295.0, 185.0, 115.0, 81.0, 38.0, 32.0, 22.0, 14.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.28125, -12.8472900390625, -12.413330078125, -11.9793701171875, -11.54541015625, -11.1114501953125, -10.677490234375, -10.2435302734375, -9.8095703125, -9.3756103515625, -8.941650390625, -8.5076904296875, -8.07373046875, -7.6397705078125, -7.205810546875, -6.7718505859375, -6.337890625, -5.9039306640625, -5.469970703125, -5.0360107421875, -4.60205078125, -4.1680908203125, -3.734130859375, -3.3001708984375, -2.8662109375, -2.4322509765625, -1.998291015625, -1.5643310546875, -1.13037109375, -0.6964111328125, -0.262451171875, 0.1715087890625, 0.60546875, 1.0394287109375, 1.473388671875, 1.9073486328125, 2.34130859375, 2.7752685546875, 3.209228515625, 3.6431884765625, 4.0771484375, 4.5111083984375, 4.945068359375, 5.3790283203125, 5.81298828125, 6.2469482421875, 6.680908203125, 7.1148681640625, 7.548828125, 7.9827880859375, 8.416748046875, 8.8507080078125, 9.28466796875, 9.7186279296875, 10.152587890625, 10.5865478515625, 11.0205078125, 11.4544677734375, 11.888427734375, 12.3223876953125, 12.75634765625, 13.1903076171875, 13.624267578125, 14.0582275390625, 14.4921875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 4.0, 7.0, 7.0, 7.0, 6.0, 6.0, 15.0, 11.0, 17.0, 24.0, 17.0, 21.0, 21.0, 22.0, 27.0, 27.0, 33.0, 36.0, 44.0, 44.0, 50.0, 49.0, 36.0, 35.0, 47.0, 41.0, 39.0, 47.0, 23.0, 25.0, 26.0, 22.0, 23.0, 23.0, 19.0, 18.0, 10.0, 7.0, 9.0, 9.0, 10.0, 5.0, 5.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-17.546875, -17.0029296875, -16.458984375, -15.9150390625, -15.37109375, -14.8271484375, -14.283203125, -13.7392578125, -13.1953125, -12.6513671875, -12.107421875, -11.5634765625, -11.01953125, -10.4755859375, -9.931640625, -9.3876953125, -8.84375, -8.2998046875, -7.755859375, -7.2119140625, -6.66796875, -6.1240234375, -5.580078125, -5.0361328125, -4.4921875, -3.9482421875, -3.404296875, -2.8603515625, -2.31640625, -1.7724609375, -1.228515625, -0.6845703125, -0.140625, 0.4033203125, 0.947265625, 1.4912109375, 2.03515625, 2.5791015625, 3.123046875, 3.6669921875, 4.2109375, 4.7548828125, 5.298828125, 5.8427734375, 6.38671875, 6.9306640625, 7.474609375, 8.0185546875, 8.5625, 9.1064453125, 9.650390625, 10.1943359375, 10.73828125, 11.2822265625, 11.826171875, 12.3701171875, 12.9140625, 13.4580078125, 14.001953125, 14.5458984375, 15.08984375, 15.6337890625, 16.177734375, 16.7216796875, 17.265625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 12.0, 6.0, 10.0, 12.0, 30.0, 44.0, 75.0, 145.0, 253.0, 461.0, 711.0, 1240.0, 2006.0, 3374.0, 5666.0, 8992.0, 14350.0, 22364.0, 34651.0, 51911.0, 76191.0, 108684.0, 147979.0, 196053.0, 246734.0, 296992.0, 340954.0, 368607.0, 379691.0, 366623.0, 335312.0, 292259.0, 242078.0, 189852.0, 143470.0, 103404.0, 73172.0, 50098.0, 33017.0, 21632.0, 13600.0, 8372.0, 5248.0, 3146.0, 1967.0, 1153.0, 686.0, 428.0, 244.0, 136.0, 81.0, 55.0, 44.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-13.15625, -12.750732421875, -12.34521484375, -11.939697265625, -11.5341796875, -11.128662109375, -10.72314453125, -10.317626953125, -9.912109375, -9.506591796875, -9.10107421875, -8.695556640625, -8.2900390625, -7.884521484375, -7.47900390625, -7.073486328125, -6.66796875, -6.262451171875, -5.85693359375, -5.451416015625, -5.0458984375, -4.640380859375, -4.23486328125, -3.829345703125, -3.423828125, -3.018310546875, -2.61279296875, -2.207275390625, -1.8017578125, -1.396240234375, -0.99072265625, -0.585205078125, -0.1796875, 0.225830078125, 0.63134765625, 1.036865234375, 1.4423828125, 1.847900390625, 2.25341796875, 2.658935546875, 3.064453125, 3.469970703125, 3.87548828125, 4.281005859375, 4.6865234375, 5.092041015625, 5.49755859375, 5.903076171875, 6.30859375, 6.714111328125, 7.11962890625, 7.525146484375, 7.9306640625, 8.336181640625, 8.74169921875, 9.147216796875, 9.552734375, 9.958251953125, 10.36376953125, 10.769287109375, 11.1748046875, 11.580322265625, 11.98583984375, 12.391357421875, 12.796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 4.0, 8.0, 9.0, 4.0, 12.0, 17.0, 25.0, 38.0, 38.0, 50.0, 65.0, 68.0, 77.0, 97.0, 127.0, 131.0, 158.0, 183.0, 169.0, 179.0, 201.0, 227.0, 219.0, 207.0, 183.0, 195.0, 210.0, 168.0, 143.0, 129.0, 120.0, 103.0, 88.0, 76.0, 65.0, 66.0, 45.0, 39.0, 24.0, 27.0, 16.0, 13.0, 13.0, 11.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.421875, -8.1485595703125, -7.875244140625, -7.6019287109375, -7.32861328125, -7.0552978515625, -6.781982421875, -6.5086669921875, -6.2353515625, -5.9620361328125, -5.688720703125, -5.4154052734375, -5.14208984375, -4.8687744140625, -4.595458984375, -4.3221435546875, -4.048828125, -3.7755126953125, -3.502197265625, -3.2288818359375, -2.95556640625, -2.6822509765625, -2.408935546875, -2.1356201171875, -1.8623046875, -1.5889892578125, -1.315673828125, -1.0423583984375, -0.76904296875, -0.4957275390625, -0.222412109375, 0.0509033203125, 0.32421875, 0.5975341796875, 0.870849609375, 1.1441650390625, 1.41748046875, 1.6907958984375, 1.964111328125, 2.2374267578125, 2.5107421875, 2.7840576171875, 3.057373046875, 3.3306884765625, 3.60400390625, 3.8773193359375, 4.150634765625, 4.4239501953125, 4.697265625, 4.9705810546875, 5.243896484375, 5.5172119140625, 5.79052734375, 6.0638427734375, 6.337158203125, 6.6104736328125, 6.8837890625, 7.1571044921875, 7.430419921875, 7.7037353515625, 7.97705078125, 8.2503662109375, 8.523681640625, 8.7969970703125, 9.0703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 1.0, 6.0, 7.0, 12.0, 14.0, 9.0, 16.0, 30.0, 28.0, 27.0, 31.0, 27.0, 40.0, 39.0, 52.0, 54.0, 53.0, 60.0, 50.0, 56.0, 58.0, 44.0, 32.0, 45.0, 33.0, 37.0, 21.0, 22.0, 24.0, 20.0, 14.0, 8.0, 6.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.79474449157715, -19.080846786499023, -18.3669490814209, -17.653051376342773, -16.93915367126465, -16.225257873535156, -15.511359214782715, -14.797462463378906, -14.083564758300781, -13.369667053222656, -12.655769348144531, -11.941871643066406, -11.227974891662598, -10.514077186584473, -9.800179481506348, -9.086282730102539, -8.372384071350098, -7.658486366271973, -6.944589138031006, -6.230691432952881, -5.516794204711914, -4.802896499633789, -4.088998794555664, -3.3751015663146973, -2.6612038612365723, -1.9473063945770264, -1.233408808708191, -0.5195112228393555, 0.19438624382019043, 0.9082837104797363, 1.6221814155578613, 2.336078643798828, 3.049976348876953, 3.763873815536499, 4.477771282196045, 5.19166898727417, 5.905566215515137, 6.619463920593262, 7.333361625671387, 8.047258377075195, 8.76115608215332, 9.475053787231445, 10.18895149230957, 10.902849197387695, 11.616745948791504, 12.330643653869629, 13.044541358947754, 13.758438110351562, 14.472336769104004, 15.186234474182129, 15.900132179260254, 16.614028930664062, 17.327926635742188, 18.041824340820312, 18.755722045898438, 19.469619750976562, 20.183517456054688, 20.897415161132812, 21.611312866210938, 22.325210571289062, 23.039108276367188, 23.753005981445312, 24.466903686523438, 25.18079948425293, 25.894697189331055]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 2.0, 13.0, 8.0, 10.0, 5.0, 15.0, 12.0, 17.0, 18.0, 20.0, 21.0, 26.0, 26.0, 43.0, 22.0, 23.0, 25.0, 34.0, 23.0, 32.0, 48.0, 35.0, 33.0, 39.0, 37.0, 40.0, 35.0, 29.0, 29.0, 25.0, 26.0, 27.0, 16.0, 22.0, 21.0, 13.0, 11.0, 13.0, 14.0, 12.0, 15.0, 12.0, 14.0, 11.0, 6.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.253223419189453, -18.640270233154297, -18.027318954467773, -17.414365768432617, -16.801414489746094, -16.188461303710938, -15.575508117675781, -14.962555885314941, -14.349603652954102, -13.736651420593262, -13.123699188232422, -12.510746002197266, -11.897793769836426, -11.284841537475586, -10.67188835144043, -10.05893611907959, -9.44598388671875, -8.83303165435791, -8.22007942199707, -7.607126235961914, -6.994174003601074, -6.381221771240234, -5.768269062042236, -5.155316352844238, -4.542364120483398, -3.9294116497039795, -3.3164591789245605, -2.7035067081451416, -2.0905542373657227, -1.4776017665863037, -0.8646492958068848, -0.2516965866088867, 0.36125755310058594, 0.9742100238800049, 1.5871624946594238, 2.2001149654388428, 2.8130674362182617, 3.4260199069976807, 4.0389723777771, 4.651925086975098, 5.2648773193359375, 5.877829551696777, 6.490782260894775, 7.103734970092773, 7.716687202453613, 8.329639434814453, 8.94259262084961, 9.55554485321045, 10.168497085571289, 10.781449317932129, 11.394401550292969, 12.007354736328125, 12.620306968688965, 13.233259201049805, 13.846212387084961, 14.4591646194458, 15.07211685180664, 15.68506908416748, 16.29802131652832, 16.910974502563477, 17.52392578125, 18.136878967285156, 18.749832153320312, 19.36278533935547, 19.975736618041992]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 8.0, 3.0, 12.0, 21.0, 30.0, 35.0, 82.0, 87.0, 135.0, 214.0, 333.0, 511.0, 811.0, 1281.0, 2099.0, 3327.0, 5876.0, 9966.0, 17357.0, 30294.0, 53639.0, 94926.0, 168662.0, 241876.0, 180668.0, 101827.0, 57253.0, 32306.0, 18505.0, 10569.0, 6095.0, 3782.0, 2210.0, 1355.0, 824.0, 551.0, 342.0, 241.0, 166.0, 95.0, 60.0, 40.0, 29.0, 18.0, 12.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.662628173828125, -2.56939697265625, -2.476165771484375, -2.3829345703125, -2.289703369140625, -2.19647216796875, -2.103240966796875, -2.010009765625, -1.916778564453125, -1.82354736328125, -1.730316162109375, -1.6370849609375, -1.543853759765625, -1.45062255859375, -1.357391357421875, -1.26416015625, -1.170928955078125, -1.07769775390625, -0.984466552734375, -0.8912353515625, -0.798004150390625, -0.70477294921875, -0.611541748046875, -0.518310546875, -0.425079345703125, -0.33184814453125, -0.238616943359375, -0.1453857421875, -0.052154541015625, 0.04107666015625, 0.134307861328125, 0.2275390625, 0.320770263671875, 0.41400146484375, 0.507232666015625, 0.6004638671875, 0.693695068359375, 0.78692626953125, 0.880157470703125, 0.973388671875, 1.066619873046875, 1.15985107421875, 1.253082275390625, 1.3463134765625, 1.439544677734375, 1.53277587890625, 1.626007080078125, 1.71923828125, 1.812469482421875, 1.90570068359375, 1.998931884765625, 2.0921630859375, 2.185394287109375, 2.27862548828125, 2.371856689453125, 2.465087890625, 2.558319091796875, 2.65155029296875, 2.744781494140625, 2.8380126953125, 2.931243896484375, 3.02447509765625, 3.117706298828125, 3.2109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 3.0, 5.0, 8.0, 9.0, 6.0, 15.0, 12.0, 17.0, 25.0, 25.0, 24.0, 24.0, 21.0, 28.0, 31.0, 30.0, 34.0, 31.0, 33.0, 40.0, 46.0, 31.0, 32.0, 40.0, 36.0, 29.0, 37.0, 29.0, 27.0, 33.0, 26.0, 27.0, 22.0, 19.0, 17.0, 13.0, 15.0, 13.0, 16.0, 17.0, 8.0, 8.0, 8.0, 5.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-21.0, -20.345703125, -19.69140625, -19.037109375, -18.3828125, -17.728515625, -17.07421875, -16.419921875, -15.765625, -15.111328125, -14.45703125, -13.802734375, -13.1484375, -12.494140625, -11.83984375, -11.185546875, -10.53125, -9.876953125, -9.22265625, -8.568359375, -7.9140625, -7.259765625, -6.60546875, -5.951171875, -5.296875, -4.642578125, -3.98828125, -3.333984375, -2.6796875, -2.025390625, -1.37109375, -0.716796875, -0.0625, 0.591796875, 1.24609375, 1.900390625, 2.5546875, 3.208984375, 3.86328125, 4.517578125, 5.171875, 5.826171875, 6.48046875, 7.134765625, 7.7890625, 8.443359375, 9.09765625, 9.751953125, 10.40625, 11.060546875, 11.71484375, 12.369140625, 13.0234375, 13.677734375, 14.33203125, 14.986328125, 15.640625, 16.294921875, 16.94921875, 17.603515625, 18.2578125, 18.912109375, 19.56640625, 20.220703125, 20.875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 9.0, 6.0, 15.0, 10.0, 32.0, 38.0, 62.0, 78.0, 138.0, 177.0, 301.0, 425.0, 593.0, 941.0, 1374.0, 1993.0, 3035.0, 4517.0, 6800.0, 10697.0, 17230.0, 27475.0, 44968.0, 73212.0, 117045.0, 174351.0, 194071.0, 137562.0, 88249.0, 53340.0, 32592.0, 20358.0, 12876.0, 8211.0, 5343.0, 3393.0, 2261.0, 1549.0, 1024.0, 682.0, 486.0, 299.0, 263.0, 157.0, 111.0, 67.0, 51.0, 28.0, 27.0, 16.0, 9.0, 2.0, 8.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.728515625, -2.64373779296875, -2.5589599609375, -2.47418212890625, -2.389404296875, -2.30462646484375, -2.2198486328125, -2.13507080078125, -2.05029296875, -1.96551513671875, -1.8807373046875, -1.79595947265625, -1.711181640625, -1.62640380859375, -1.5416259765625, -1.45684814453125, -1.3720703125, -1.28729248046875, -1.2025146484375, -1.11773681640625, -1.032958984375, -0.94818115234375, -0.8634033203125, -0.77862548828125, -0.69384765625, -0.60906982421875, -0.5242919921875, -0.43951416015625, -0.354736328125, -0.26995849609375, -0.1851806640625, -0.10040283203125, -0.015625, 0.06915283203125, 0.1539306640625, 0.23870849609375, 0.323486328125, 0.40826416015625, 0.4930419921875, 0.57781982421875, 0.66259765625, 0.74737548828125, 0.8321533203125, 0.91693115234375, 1.001708984375, 1.08648681640625, 1.1712646484375, 1.25604248046875, 1.3408203125, 1.42559814453125, 1.5103759765625, 1.59515380859375, 1.679931640625, 1.76470947265625, 1.8494873046875, 1.93426513671875, 2.01904296875, 2.10382080078125, 2.1885986328125, 2.27337646484375, 2.358154296875, 2.44293212890625, 2.5277099609375, 2.61248779296875, 2.697265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 10.0, 9.0, 16.0, 15.0, 13.0, 28.0, 26.0, 14.0, 24.0, 30.0, 24.0, 38.0, 30.0, 30.0, 43.0, 46.0, 40.0, 54.0, 37.0, 44.0, 43.0, 40.0, 24.0, 37.0, 38.0, 35.0, 28.0, 25.0, 20.0, 17.0, 13.0, 17.0, 15.0, 12.0, 7.0, 12.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.3515625, -12.8795166015625, -12.407470703125, -11.9354248046875, -11.46337890625, -10.9913330078125, -10.519287109375, -10.0472412109375, -9.5751953125, -9.1031494140625, -8.631103515625, -8.1590576171875, -7.68701171875, -7.2149658203125, -6.742919921875, -6.2708740234375, -5.798828125, -5.3267822265625, -4.854736328125, -4.3826904296875, -3.91064453125, -3.4385986328125, -2.966552734375, -2.4945068359375, -2.0224609375, -1.5504150390625, -1.078369140625, -0.6063232421875, -0.13427734375, 0.3377685546875, 0.809814453125, 1.2818603515625, 1.75390625, 2.2259521484375, 2.697998046875, 3.1700439453125, 3.64208984375, 4.1141357421875, 4.586181640625, 5.0582275390625, 5.5302734375, 6.0023193359375, 6.474365234375, 6.9464111328125, 7.41845703125, 7.8905029296875, 8.362548828125, 8.8345947265625, 9.306640625, 9.7786865234375, 10.250732421875, 10.7227783203125, 11.19482421875, 11.6668701171875, 12.138916015625, 12.6109619140625, 13.0830078125, 13.5550537109375, 14.027099609375, 14.4991455078125, 14.97119140625, 15.4432373046875, 15.915283203125, 16.3873291015625, 16.859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 17.0, 16.0, 20.0, 38.0, 59.0, 81.0, 125.0, 177.0, 266.0, 392.0, 626.0, 940.0, 1305.0, 1870.0, 2811.0, 4377.0, 6488.0, 10176.0, 15861.0, 25042.0, 42447.0, 74419.0, 141607.0, 249225.0, 208624.0, 108956.0, 59184.0, 34275.0, 20934.0, 13076.0, 8446.0, 5400.0, 3703.0, 2447.0, 1656.0, 1161.0, 756.0, 493.0, 382.0, 225.0, 135.0, 108.0, 76.0, 50.0, 31.0, 23.0, 10.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.08306884765625, -0.0806112289428711, -0.07815361022949219, -0.07569599151611328, -0.07323837280273438, -0.07078075408935547, -0.06832313537597656, -0.06586551666259766, -0.06340789794921875, -0.060950279235839844, -0.05849266052246094, -0.05603504180908203, -0.053577423095703125, -0.05111980438232422, -0.04866218566894531, -0.046204566955566406, -0.0437469482421875, -0.041289329528808594, -0.03883171081542969, -0.03637409210205078, -0.033916473388671875, -0.03145885467529297, -0.029001235961914062, -0.026543617248535156, -0.02408599853515625, -0.021628379821777344, -0.019170761108398438, -0.01671314239501953, -0.014255523681640625, -0.011797904968261719, -0.009340286254882812, -0.006882667541503906, -0.004425048828125, -0.0019674301147460938, 0.0004901885986328125, 0.0029478073120117188, 0.005405426025390625, 0.007863044738769531, 0.010320663452148438, 0.012778282165527344, 0.01523590087890625, 0.017693519592285156, 0.020151138305664062, 0.02260875701904297, 0.025066375732421875, 0.02752399444580078, 0.029981613159179688, 0.032439231872558594, 0.0348968505859375, 0.037354469299316406, 0.03981208801269531, 0.04226970672607422, 0.044727325439453125, 0.04718494415283203, 0.04964256286621094, 0.052100181579589844, 0.05455780029296875, 0.057015419006347656, 0.05947303771972656, 0.06193065643310547, 0.06438827514648438, 0.06684589385986328, 0.06930351257324219, 0.0717611312866211, 0.07421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 8.0, 9.0, 7.0, 10.0, 8.0, 13.0, 20.0, 14.0, 28.0, 23.0, 36.0, 26.0, 25.0, 27.0, 39.0, 50.0, 38.0, 50.0, 55.0, 56.0, 48.0, 49.0, 35.0, 39.0, 34.0, 40.0, 34.0, 32.0, 18.0, 28.0, 18.0, 10.0, 9.0, 11.0, 8.0, 7.0, 11.0, 3.0, 4.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.519918441772461e-05, -1.4706514775753021e-05, -1.4213845133781433e-05, -1.3721175491809845e-05, -1.3228505849838257e-05, -1.2735836207866669e-05, -1.224316656589508e-05, -1.1750496923923492e-05, -1.1257827281951904e-05, -1.0765157639980316e-05, -1.0272487998008728e-05, -9.77981835603714e-06, -9.287148714065552e-06, -8.794479072093964e-06, -8.301809430122375e-06, -7.809139788150787e-06, -7.316470146179199e-06, -6.823800504207611e-06, -6.331130862236023e-06, -5.838461220264435e-06, -5.345791578292847e-06, -4.8531219363212585e-06, -4.36045229434967e-06, -3.867782652378082e-06, -3.375113010406494e-06, -2.882443368434906e-06, -2.389773726463318e-06, -1.8971040844917297e-06, -1.4044344425201416e-06, -9.117648005485535e-07, -4.1909515857696533e-07, 7.35744833946228e-08, 5.662441253662109e-07, 1.058913767337799e-06, 1.5515834093093872e-06, 2.0442530512809753e-06, 2.5369226932525635e-06, 3.0295923352241516e-06, 3.5222619771957397e-06, 4.014931619167328e-06, 4.507601261138916e-06, 5.000270903110504e-06, 5.492940545082092e-06, 5.98561018705368e-06, 6.4782798290252686e-06, 6.970949470996857e-06, 7.463619112968445e-06, 7.956288754940033e-06, 8.448958396911621e-06, 8.94162803888321e-06, 9.434297680854797e-06, 9.926967322826385e-06, 1.0419636964797974e-05, 1.0912306606769562e-05, 1.140497624874115e-05, 1.1897645890712738e-05, 1.2390315532684326e-05, 1.2882985174655914e-05, 1.3375654816627502e-05, 1.386832445859909e-05, 1.4360994100570679e-05, 1.4853663742542267e-05, 1.5346333384513855e-05, 1.5839003026485443e-05, 1.633167266845703e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 13.0, 15.0, 19.0, 33.0, 55.0, 59.0, 97.0, 136.0, 206.0, 319.0, 461.0, 681.0, 1040.0, 1506.0, 2295.0, 3293.0, 4904.0, 7147.0, 11057.0, 16984.0, 26695.0, 42239.0, 69684.0, 124641.0, 238208.0, 213791.0, 110708.0, 63005.0, 38477.0, 24059.0, 15712.0, 10134.0, 6750.0, 4482.0, 3181.0, 2066.0, 1446.0, 936.0, 652.0, 472.0, 321.0, 187.0, 141.0, 81.0, 54.0, 37.0, 29.0, 21.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1513671875, -0.1464691162109375, -0.141571044921875, -0.1366729736328125, -0.13177490234375, -0.1268768310546875, -0.121978759765625, -0.1170806884765625, -0.1121826171875, -0.1072845458984375, -0.102386474609375, -0.0974884033203125, -0.09259033203125, -0.0876922607421875, -0.082794189453125, -0.0778961181640625, -0.072998046875, -0.0680999755859375, -0.063201904296875, -0.0583038330078125, -0.05340576171875, -0.0485076904296875, -0.043609619140625, -0.0387115478515625, -0.0338134765625, -0.0289154052734375, -0.024017333984375, -0.0191192626953125, -0.01422119140625, -0.0093231201171875, -0.004425048828125, 0.0004730224609375, 0.00537109375, 0.0102691650390625, 0.015167236328125, 0.0200653076171875, 0.02496337890625, 0.0298614501953125, 0.034759521484375, 0.0396575927734375, 0.0445556640625, 0.0494537353515625, 0.054351806640625, 0.0592498779296875, 0.06414794921875, 0.0690460205078125, 0.073944091796875, 0.0788421630859375, 0.083740234375, 0.0886383056640625, 0.093536376953125, 0.0984344482421875, 0.10333251953125, 0.1082305908203125, 0.113128662109375, 0.1180267333984375, 0.1229248046875, 0.1278228759765625, 0.132720947265625, 0.1376190185546875, 0.14251708984375, 0.1474151611328125, 0.152313232421875, 0.1572113037109375, 0.162109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 12.0, 11.0, 12.0, 17.0, 18.0, 26.0, 22.0, 30.0, 51.0, 65.0, 85.0, 91.0, 89.0, 93.0, 73.0, 54.0, 45.0, 29.0, 32.0, 19.0, 14.0, 18.0, 9.0, 11.0, 6.0, 5.0, 5.0, 8.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08746337890625, -0.08448028564453125, -0.0814971923828125, -0.07851409912109375, -0.075531005859375, -0.07254791259765625, -0.0695648193359375, -0.06658172607421875, -0.0635986328125, -0.06061553955078125, -0.0576324462890625, -0.05464935302734375, -0.051666259765625, -0.04868316650390625, -0.0457000732421875, -0.04271697998046875, -0.03973388671875, -0.03675079345703125, -0.0337677001953125, -0.03078460693359375, -0.027801513671875, -0.02481842041015625, -0.0218353271484375, -0.01885223388671875, -0.015869140625, -0.01288604736328125, -0.0099029541015625, -0.00691986083984375, -0.003936767578125, -0.00095367431640625, 0.0020294189453125, 0.00501251220703125, 0.00799560546875, 0.01097869873046875, 0.0139617919921875, 0.01694488525390625, 0.019927978515625, 0.02291107177734375, 0.0258941650390625, 0.02887725830078125, 0.0318603515625, 0.03484344482421875, 0.0378265380859375, 0.04080963134765625, 0.043792724609375, 0.04677581787109375, 0.0497589111328125, 0.05274200439453125, 0.05572509765625, 0.05870819091796875, 0.0616912841796875, 0.06467437744140625, 0.067657470703125, 0.07064056396484375, 0.0736236572265625, 0.07660675048828125, 0.07958984375, 0.08257293701171875, 0.0855560302734375, 0.08853912353515625, 0.091522216796875, 0.09450531005859375, 0.0974884033203125, 0.10047149658203125, 0.10345458984375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 15.0, 11.0, 13.0, 13.0, 25.0, 24.0, 27.0, 31.0, 28.0, 34.0, 32.0, 58.0, 57.0, 50.0, 59.0, 43.0, 65.0, 46.0, 56.0, 36.0, 34.0, 38.0, 39.0, 21.0, 26.0, 25.0, 22.0, 11.0, 14.0, 9.0, 10.0, 2.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.748821258544922, -19.04790687561035, -18.34699249267578, -17.646080017089844, -16.945165634155273, -16.244251251220703, -15.54333782196045, -14.842424392700195, -14.141510009765625, -13.440595626831055, -12.7396821975708, -12.038768768310547, -11.337854385375977, -10.636940002441406, -9.936026573181152, -9.235113143920898, -8.534198760986328, -7.833284854888916, -7.132370948791504, -6.431457042694092, -5.73054313659668, -5.029629230499268, -4.3287153244018555, -3.6278014183044434, -2.9268875122070312, -2.225973606109619, -1.525059700012207, -0.8241457939147949, -0.12323188781738281, 0.5776820182800293, 1.2785959243774414, 1.9795098304748535, 2.6804256439208984, 3.3813395500183105, 4.082253456115723, 4.783167362213135, 5.484081268310547, 6.184995174407959, 6.885909080505371, 7.586822986602783, 8.287736892700195, 8.988651275634766, 9.68956470489502, 10.390478134155273, 11.091392517089844, 11.792306900024414, 12.493220329284668, 13.194133758544922, 13.895048141479492, 14.595962524414062, 15.296875953674316, 15.99778938293457, 16.69870376586914, 17.39961814880371, 18.10053253173828, 18.80144500732422, 19.50235939025879, 20.20327377319336, 20.904186248779297, 21.605100631713867, 22.306015014648438, 23.006929397583008, 23.707843780517578, 24.408756256103516, 25.109670639038086]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 11.0, 9.0, 10.0, 5.0, 13.0, 14.0, 17.0, 16.0, 22.0, 20.0, 27.0, 25.0, 44.0, 22.0, 23.0, 25.0, 34.0, 23.0, 33.0, 43.0, 39.0, 32.0, 40.0, 38.0, 39.0, 38.0, 27.0, 28.0, 24.0, 28.0, 27.0, 15.0, 22.0, 21.0, 13.0, 11.0, 13.0, 15.0, 12.0, 14.0, 13.0, 13.0, 12.0, 5.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.268037796020508, -18.65593147277832, -18.043825149536133, -17.431718826293945, -16.819612503051758, -16.20750617980957, -15.595398902893066, -14.983292579650879, -14.371186256408691, -13.759079933166504, -13.146973609924316, -12.534867286682129, -11.922760009765625, -11.310653686523438, -10.69854736328125, -10.086441040039062, -9.474334716796875, -8.862228393554688, -8.2501220703125, -7.638015270233154, -7.025908946990967, -6.413802623748779, -5.801695823669434, -5.189589500427246, -4.577483177185059, -3.965376853942871, -3.3532702922821045, -2.741163730621338, -2.1290574073791504, -1.516951084136963, -0.9048445224761963, -0.2927379608154297, 0.319366455078125, 0.931472897529602, 1.543579339981079, 2.1556859016418457, 2.767792224884033, 3.3798985481262207, 3.9920051097869873, 4.604111671447754, 5.216217994689941, 5.828324317932129, 6.440430641174316, 7.052537441253662, 7.66464376449585, 8.276750564575195, 8.888856887817383, 9.50096321105957, 10.113069534301758, 10.725175857543945, 11.337282180786133, 11.94938850402832, 12.561494827270508, 13.173601150512695, 13.7857084274292, 14.397814750671387, 15.009921073913574, 15.622027397155762, 16.234134674072266, 16.846240997314453, 17.45834732055664, 18.070453643798828, 18.682559967041016, 19.294666290283203, 19.90677261352539]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 13.0, 19.0, 22.0, 51.0, 66.0, 109.0, 160.0, 262.0, 427.0, 602.0, 892.0, 1417.0, 2233.0, 3239.0, 4677.0, 6986.0, 10022.0, 14291.0, 19613.0, 26673.0, 35170.0, 45663.0, 56399.0, 67174.0, 76441.0, 83972.0, 86899.0, 85993.0, 81377.0, 72848.0, 61925.0, 51201.0, 40828.0, 31634.0, 23428.0, 17181.0, 12422.0, 8545.0, 5747.0, 3993.0, 2670.0, 1839.0, 1185.0, 790.0, 521.0, 305.0, 214.0, 138.0, 98.0, 60.0, 43.0, 28.0, 15.0, 16.0, 6.0, 6.0, 4.0, 4.0], "bins": [-9.3515625, -9.0662841796875, -8.781005859375, -8.4957275390625, -8.21044921875, -7.9251708984375, -7.639892578125, -7.3546142578125, -7.0693359375, -6.7840576171875, -6.498779296875, -6.2135009765625, -5.92822265625, -5.6429443359375, -5.357666015625, -5.0723876953125, -4.787109375, -4.5018310546875, -4.216552734375, -3.9312744140625, -3.64599609375, -3.3607177734375, -3.075439453125, -2.7901611328125, -2.5048828125, -2.2196044921875, -1.934326171875, -1.6490478515625, -1.36376953125, -1.0784912109375, -0.793212890625, -0.5079345703125, -0.22265625, 0.0626220703125, 0.347900390625, 0.6331787109375, 0.91845703125, 1.2037353515625, 1.489013671875, 1.7742919921875, 2.0595703125, 2.3448486328125, 2.630126953125, 2.9154052734375, 3.20068359375, 3.4859619140625, 3.771240234375, 4.0565185546875, 4.341796875, 4.6270751953125, 4.912353515625, 5.1976318359375, 5.48291015625, 5.7681884765625, 6.053466796875, 6.3387451171875, 6.6240234375, 6.9093017578125, 7.194580078125, 7.4798583984375, 7.76513671875, 8.0504150390625, 8.335693359375, 8.6209716796875, 8.90625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0, 7.0, 2.0, 9.0, 5.0, 4.0, 12.0, 13.0, 10.0, 13.0, 9.0, 16.0, 28.0, 29.0, 26.0, 34.0, 28.0, 36.0, 24.0, 34.0, 37.0, 36.0, 40.0, 45.0, 32.0, 44.0, 44.0, 34.0, 26.0, 33.0, 30.0, 35.0, 20.0, 22.0, 20.0, 19.0, 23.0, 13.0, 17.0, 23.0, 11.0, 9.0, 6.0, 9.0, 10.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-20.578125, -19.921142578125, -19.26416015625, -18.607177734375, -17.9501953125, -17.293212890625, -16.63623046875, -15.979248046875, -15.322265625, -14.665283203125, -14.00830078125, -13.351318359375, -12.6943359375, -12.037353515625, -11.38037109375, -10.723388671875, -10.06640625, -9.409423828125, -8.75244140625, -8.095458984375, -7.4384765625, -6.781494140625, -6.12451171875, -5.467529296875, -4.810546875, -4.153564453125, -3.49658203125, -2.839599609375, -2.1826171875, -1.525634765625, -0.86865234375, -0.211669921875, 0.4453125, 1.102294921875, 1.75927734375, 2.416259765625, 3.0732421875, 3.730224609375, 4.38720703125, 5.044189453125, 5.701171875, 6.358154296875, 7.01513671875, 7.672119140625, 8.3291015625, 8.986083984375, 9.64306640625, 10.300048828125, 10.95703125, 11.614013671875, 12.27099609375, 12.927978515625, 13.5849609375, 14.241943359375, 14.89892578125, 15.555908203125, 16.212890625, 16.869873046875, 17.52685546875, 18.183837890625, 18.8408203125, 19.497802734375, 20.15478515625, 20.811767578125, 21.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 20.0, 23.0, 28.0, 56.0, 97.0, 138.0, 222.0, 398.0, 638.0, 1031.0, 1637.0, 2465.0, 3905.0, 6024.0, 9010.0, 13195.0, 19352.0, 27121.0, 37533.0, 49538.0, 62508.0, 75973.0, 87246.0, 93800.0, 96200.0, 92685.0, 84133.0, 71661.0, 58162.0, 45509.0, 33676.0, 24253.0, 16944.0, 11508.0, 7896.0, 5045.0, 3320.0, 2112.0, 1345.0, 794.0, 531.0, 310.0, 202.0, 141.0, 69.0, 37.0, 20.0, 15.0, 10.0, 4.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.2396240234375, -8.924560546875, -8.6094970703125, -8.29443359375, -7.9793701171875, -7.664306640625, -7.3492431640625, -7.0341796875, -6.7191162109375, -6.404052734375, -6.0889892578125, -5.77392578125, -5.4588623046875, -5.143798828125, -4.8287353515625, -4.513671875, -4.1986083984375, -3.883544921875, -3.5684814453125, -3.25341796875, -2.9383544921875, -2.623291015625, -2.3082275390625, -1.9931640625, -1.6781005859375, -1.363037109375, -1.0479736328125, -0.73291015625, -0.4178466796875, -0.102783203125, 0.2122802734375, 0.52734375, 0.8424072265625, 1.157470703125, 1.4725341796875, 1.78759765625, 2.1026611328125, 2.417724609375, 2.7327880859375, 3.0478515625, 3.3629150390625, 3.677978515625, 3.9930419921875, 4.30810546875, 4.6231689453125, 4.938232421875, 5.2532958984375, 5.568359375, 5.8834228515625, 6.198486328125, 6.5135498046875, 6.82861328125, 7.1436767578125, 7.458740234375, 7.7738037109375, 8.0888671875, 8.4039306640625, 8.718994140625, 9.0340576171875, 9.34912109375, 9.6641845703125, 9.979248046875, 10.2943115234375, 10.609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 3.0, 3.0, 2.0, 7.0, 1.0, 6.0, 4.0, 8.0, 3.0, 11.0, 8.0, 13.0, 19.0, 16.0, 13.0, 25.0, 27.0, 24.0, 33.0, 27.0, 38.0, 35.0, 34.0, 36.0, 43.0, 44.0, 43.0, 36.0, 54.0, 33.0, 37.0, 38.0, 34.0, 27.0, 27.0, 24.0, 28.0, 14.0, 19.0, 19.0, 12.0, 18.0, 9.0, 14.0, 13.0, 9.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.0703125, -12.64208984375, -12.2138671875, -11.78564453125, -11.357421875, -10.92919921875, -10.5009765625, -10.07275390625, -9.64453125, -9.21630859375, -8.7880859375, -8.35986328125, -7.931640625, -7.50341796875, -7.0751953125, -6.64697265625, -6.21875, -5.79052734375, -5.3623046875, -4.93408203125, -4.505859375, -4.07763671875, -3.6494140625, -3.22119140625, -2.79296875, -2.36474609375, -1.9365234375, -1.50830078125, -1.080078125, -0.65185546875, -0.2236328125, 0.20458984375, 0.6328125, 1.06103515625, 1.4892578125, 1.91748046875, 2.345703125, 2.77392578125, 3.2021484375, 3.63037109375, 4.05859375, 4.48681640625, 4.9150390625, 5.34326171875, 5.771484375, 6.19970703125, 6.6279296875, 7.05615234375, 7.484375, 7.91259765625, 8.3408203125, 8.76904296875, 9.197265625, 9.62548828125, 10.0537109375, 10.48193359375, 10.91015625, 11.33837890625, 11.7666015625, 12.19482421875, 12.623046875, 13.05126953125, 13.4794921875, 13.90771484375, 14.3359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 5.0, 11.0, 23.0, 48.0, 76.0, 108.0, 145.0, 265.0, 378.0, 622.0, 972.0, 1533.0, 2272.0, 3432.0, 5319.0, 7737.0, 11631.0, 16619.0, 23319.0, 31341.0, 42131.0, 53763.0, 65628.0, 76487.0, 85112.0, 90261.0, 90757.0, 86289.0, 77635.0, 67080.0, 54400.0, 43201.0, 32907.0, 24102.0, 16845.0, 12056.0, 8169.0, 5531.0, 3612.0, 2357.0, 1603.0, 1087.0, 593.0, 375.0, 283.0, 147.0, 113.0, 69.0, 50.0, 18.0, 20.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.732421875, -2.63836669921875, -2.5443115234375, -2.45025634765625, -2.356201171875, -2.26214599609375, -2.1680908203125, -2.07403564453125, -1.97998046875, -1.88592529296875, -1.7918701171875, -1.69781494140625, -1.603759765625, -1.50970458984375, -1.4156494140625, -1.32159423828125, -1.2275390625, -1.13348388671875, -1.0394287109375, -0.94537353515625, -0.851318359375, -0.75726318359375, -0.6632080078125, -0.56915283203125, -0.47509765625, -0.38104248046875, -0.2869873046875, -0.19293212890625, -0.098876953125, -0.00482177734375, 0.0892333984375, 0.18328857421875, 0.27734375, 0.37139892578125, 0.4654541015625, 0.55950927734375, 0.653564453125, 0.74761962890625, 0.8416748046875, 0.93572998046875, 1.02978515625, 1.12384033203125, 1.2178955078125, 1.31195068359375, 1.406005859375, 1.50006103515625, 1.5941162109375, 1.68817138671875, 1.7822265625, 1.87628173828125, 1.9703369140625, 2.06439208984375, 2.158447265625, 2.25250244140625, 2.3465576171875, 2.44061279296875, 2.53466796875, 2.62872314453125, 2.7227783203125, 2.81683349609375, 2.910888671875, 3.00494384765625, 3.0989990234375, 3.19305419921875, 3.287109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 9.0, 11.0, 12.0, 16.0, 16.0, 17.0, 29.0, 30.0, 36.0, 28.0, 34.0, 47.0, 40.0, 42.0, 40.0, 38.0, 52.0, 47.0, 49.0, 44.0, 36.0, 35.0, 38.0, 31.0, 26.0, 38.0, 22.0, 23.0, 20.0, 10.0, 7.0, 17.0, 4.0, 8.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00045299530029296875, -0.00043886899948120117, -0.0004247426986694336, -0.000410616397857666, -0.00039649009704589844, -0.00038236379623413086, -0.0003682374954223633, -0.0003541111946105957, -0.0003399848937988281, -0.00032585859298706055, -0.00031173229217529297, -0.0002976059913635254, -0.0002834796905517578, -0.00026935338973999023, -0.00025522708892822266, -0.00024110078811645508, -0.0002269744873046875, -0.00021284818649291992, -0.00019872188568115234, -0.00018459558486938477, -0.0001704692840576172, -0.0001563429832458496, -0.00014221668243408203, -0.00012809038162231445, -0.00011396408081054688, -9.98377799987793e-05, -8.571147918701172e-05, -7.158517837524414e-05, -5.745887756347656e-05, -4.3332576751708984e-05, -2.9206275939941406e-05, -1.5079975128173828e-05, -9.5367431640625e-07, 1.3172626495361328e-05, 2.7298927307128906e-05, 4.1425228118896484e-05, 5.555152893066406e-05, 6.967782974243164e-05, 8.380413055419922e-05, 9.79304313659668e-05, 0.00011205673217773438, 0.00012618303298950195, 0.00014030933380126953, 0.0001544356346130371, 0.0001685619354248047, 0.00018268823623657227, 0.00019681453704833984, 0.00021094083786010742, 0.000225067138671875, 0.00023919343948364258, 0.00025331974029541016, 0.00026744604110717773, 0.0002815723419189453, 0.0002956986427307129, 0.00030982494354248047, 0.00032395124435424805, 0.0003380775451660156, 0.0003522038459777832, 0.0003663301467895508, 0.00038045644760131836, 0.00039458274841308594, 0.0004087090492248535, 0.0004228353500366211, 0.00043696165084838867, 0.00045108795166015625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 24.0, 31.0, 47.0, 63.0, 102.0, 163.0, 270.0, 391.0, 572.0, 888.0, 1402.0, 2272.0, 3365.0, 5470.0, 8483.0, 13083.0, 20077.0, 29604.0, 42121.0, 57924.0, 75349.0, 91402.0, 102988.0, 108582.0, 105483.0, 94744.0, 79732.0, 62362.0, 46253.0, 32631.0, 21896.0, 14455.0, 9389.0, 6077.0, 3885.0, 2480.0, 1570.0, 1062.0, 653.0, 435.0, 255.0, 180.0, 124.0, 87.0, 44.0, 25.0, 22.0, 11.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.611328125, -3.493408203125, -3.37548828125, -3.257568359375, -3.1396484375, -3.021728515625, -2.90380859375, -2.785888671875, -2.66796875, -2.550048828125, -2.43212890625, -2.314208984375, -2.1962890625, -2.078369140625, -1.96044921875, -1.842529296875, -1.724609375, -1.606689453125, -1.48876953125, -1.370849609375, -1.2529296875, -1.135009765625, -1.01708984375, -0.899169921875, -0.78125, -0.663330078125, -0.54541015625, -0.427490234375, -0.3095703125, -0.191650390625, -0.07373046875, 0.044189453125, 0.162109375, 0.280029296875, 0.39794921875, 0.515869140625, 0.6337890625, 0.751708984375, 0.86962890625, 0.987548828125, 1.10546875, 1.223388671875, 1.34130859375, 1.459228515625, 1.5771484375, 1.695068359375, 1.81298828125, 1.930908203125, 2.048828125, 2.166748046875, 2.28466796875, 2.402587890625, 2.5205078125, 2.638427734375, 2.75634765625, 2.874267578125, 2.9921875, 3.110107421875, 3.22802734375, 3.345947265625, 3.4638671875, 3.581787109375, 3.69970703125, 3.817626953125, 3.935546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 13.0, 4.0, 4.0, 8.0, 7.0, 18.0, 15.0, 25.0, 19.0, 23.0, 30.0, 35.0, 41.0, 33.0, 41.0, 40.0, 30.0, 46.0, 48.0, 53.0, 58.0, 41.0, 31.0, 35.0, 38.0, 31.0, 33.0, 32.0, 33.0, 30.0, 19.0, 13.0, 16.0, 12.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.765625, -1.7064208984375, -1.647216796875, -1.5880126953125, -1.52880859375, -1.4696044921875, -1.410400390625, -1.3511962890625, -1.2919921875, -1.2327880859375, -1.173583984375, -1.1143798828125, -1.05517578125, -0.9959716796875, -0.936767578125, -0.8775634765625, -0.818359375, -0.7591552734375, -0.699951171875, -0.6407470703125, -0.58154296875, -0.5223388671875, -0.463134765625, -0.4039306640625, -0.3447265625, -0.2855224609375, -0.226318359375, -0.1671142578125, -0.10791015625, -0.0487060546875, 0.010498046875, 0.0697021484375, 0.12890625, 0.1881103515625, 0.247314453125, 0.3065185546875, 0.36572265625, 0.4249267578125, 0.484130859375, 0.5433349609375, 0.6025390625, 0.6617431640625, 0.720947265625, 0.7801513671875, 0.83935546875, 0.8985595703125, 0.957763671875, 1.0169677734375, 1.076171875, 1.1353759765625, 1.194580078125, 1.2537841796875, 1.31298828125, 1.3721923828125, 1.431396484375, 1.4906005859375, 1.5498046875, 1.6090087890625, 1.668212890625, 1.7274169921875, 1.78662109375, 1.8458251953125, 1.905029296875, 1.9642333984375, 2.0234375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 5.0, 13.0, 14.0, 17.0, 23.0, 21.0, 27.0, 24.0, 22.0, 24.0, 31.0, 36.0, 42.0, 38.0, 47.0, 44.0, 59.0, 61.0, 51.0, 39.0, 39.0, 38.0, 46.0, 22.0, 33.0, 23.0, 22.0, 21.0, 19.0, 21.0, 20.0, 5.0, 6.0, 6.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.6627140045166, -18.03164291381836, -17.400571823120117, -16.769500732421875, -16.138431549072266, -15.507359504699707, -14.876289367675781, -14.245218276977539, -13.614147186279297, -12.983076095581055, -12.352005004882812, -11.720934867858887, -11.089863777160645, -10.458792686462402, -9.827722549438477, -9.196651458740234, -8.565580368041992, -7.93450927734375, -7.303438663482666, -6.672368049621582, -6.04129695892334, -5.410225868225098, -4.779155254364014, -4.14808464050293, -3.5170135498046875, -2.8859426975250244, -2.2548718452453613, -1.6238009929656982, -0.9927301406860352, -0.36165928840637207, 0.269411563873291, 0.900482177734375, 1.53155517578125, 2.162626028060913, 2.793696880340576, 3.4247677326202393, 4.055838584899902, 4.6869096755981445, 5.3179802894592285, 5.9490509033203125, 6.580121994018555, 7.211193084716797, 7.842263698577881, 8.473334312438965, 9.104405403137207, 9.73547649383545, 10.366546630859375, 10.997617721557617, 11.62868881225586, 12.259759902954102, 12.890830993652344, 13.52190113067627, 14.152972221374512, 14.784043312072754, 15.41511344909668, 16.046184539794922, 16.677255630493164, 17.308326721191406, 17.93939781188965, 18.57046890258789, 19.2015380859375, 19.832609176635742, 20.463680267333984, 21.094751358032227, 21.72582244873047]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 13.0, 22.0, 25.0, 23.0, 28.0, 39.0, 31.0, 33.0, 38.0, 29.0, 34.0, 30.0, 42.0, 36.0, 35.0, 54.0, 51.0, 39.0, 27.0, 42.0, 29.0, 34.0, 25.0, 22.0, 33.0, 22.0, 19.0, 16.0, 10.0, 11.0, 10.0, 22.0, 9.0, 7.0, 7.0, 6.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.167316436767578, -23.409618377685547, -22.651920318603516, -21.894222259521484, -21.136524200439453, -20.378826141357422, -19.62112808227539, -18.86343002319336, -18.105731964111328, -17.348033905029297, -16.590335845947266, -15.832637786865234, -15.074939727783203, -14.317241668701172, -13.559542655944824, -12.801844596862793, -12.044145584106445, -11.286447525024414, -10.528749465942383, -9.771051406860352, -9.01335334777832, -8.255655288696289, -7.497956275939941, -6.74025821685791, -5.982560157775879, -5.224862098693848, -4.467164039611816, -3.709465503692627, -2.9517674446105957, -2.1940693855285645, -1.436370849609375, -0.6786727905273438, 0.07902336120605469, 0.8367215394973755, 1.5944197177886963, 2.3521180152893066, 3.109816074371338, 3.867514133453369, 4.625212669372559, 5.38291072845459, 6.140608787536621, 6.898306846618652, 7.656004905700684, 8.413703918457031, 9.171401977539062, 9.929100036621094, 10.686798095703125, 11.444496154785156, 12.202194213867188, 12.959892272949219, 13.71759033203125, 14.475288391113281, 15.232986450195312, 15.990684509277344, 16.748382568359375, 17.506080627441406, 18.263778686523438, 19.02147674560547, 19.7791748046875, 20.53687286376953, 21.294570922851562, 22.052268981933594, 22.809967041015625, 23.567665100097656, 24.32536506652832]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 25.0, 35.0, 58.0, 76.0, 123.0, 220.0, 353.0, 582.0, 950.0, 1544.0, 2632.0, 3996.0, 6860.0, 10734.0, 16630.0, 26367.0, 40185.0, 60060.0, 88233.0, 125649.0, 172424.0, 225683.0, 284417.0, 336911.0, 377955.0, 397213.0, 392290.0, 361244.0, 314139.0, 258213.0, 201367.0, 151175.0, 109125.0, 76292.0, 52514.0, 34787.0, 22998.0, 14741.0, 9525.0, 6138.0, 3689.0, 2363.0, 1439.0, 921.0, 540.0, 327.0, 194.0, 151.0, 65.0, 55.0, 29.0, 12.0, 12.0, 4.0, 6.0, 2.0, 3.0, 1.0], "bins": [-14.328125, -13.87744140625, -13.4267578125, -12.97607421875, -12.525390625, -12.07470703125, -11.6240234375, -11.17333984375, -10.72265625, -10.27197265625, -9.8212890625, -9.37060546875, -8.919921875, -8.46923828125, -8.0185546875, -7.56787109375, -7.1171875, -6.66650390625, -6.2158203125, -5.76513671875, -5.314453125, -4.86376953125, -4.4130859375, -3.96240234375, -3.51171875, -3.06103515625, -2.6103515625, -2.15966796875, -1.708984375, -1.25830078125, -0.8076171875, -0.35693359375, 0.09375, 0.54443359375, 0.9951171875, 1.44580078125, 1.896484375, 2.34716796875, 2.7978515625, 3.24853515625, 3.69921875, 4.14990234375, 4.6005859375, 5.05126953125, 5.501953125, 5.95263671875, 6.4033203125, 6.85400390625, 7.3046875, 7.75537109375, 8.2060546875, 8.65673828125, 9.107421875, 9.55810546875, 10.0087890625, 10.45947265625, 10.91015625, 11.36083984375, 11.8115234375, 12.26220703125, 12.712890625, 13.16357421875, 13.6142578125, 14.06494140625, 14.515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 10.0, 10.0, 11.0, 12.0, 16.0, 16.0, 26.0, 26.0, 27.0, 29.0, 29.0, 43.0, 30.0, 38.0, 45.0, 39.0, 40.0, 36.0, 52.0, 35.0, 46.0, 38.0, 36.0, 38.0, 34.0, 23.0, 22.0, 31.0, 25.0, 18.0, 14.0, 25.0, 11.0, 16.0, 11.0, 6.0, 7.0, 4.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.953125, -20.30029296875, -19.6474609375, -18.99462890625, -18.341796875, -17.68896484375, -17.0361328125, -16.38330078125, -15.73046875, -15.07763671875, -14.4248046875, -13.77197265625, -13.119140625, -12.46630859375, -11.8134765625, -11.16064453125, -10.5078125, -9.85498046875, -9.2021484375, -8.54931640625, -7.896484375, -7.24365234375, -6.5908203125, -5.93798828125, -5.28515625, -4.63232421875, -3.9794921875, -3.32666015625, -2.673828125, -2.02099609375, -1.3681640625, -0.71533203125, -0.0625, 0.59033203125, 1.2431640625, 1.89599609375, 2.548828125, 3.20166015625, 3.8544921875, 4.50732421875, 5.16015625, 5.81298828125, 6.4658203125, 7.11865234375, 7.771484375, 8.42431640625, 9.0771484375, 9.72998046875, 10.3828125, 11.03564453125, 11.6884765625, 12.34130859375, 12.994140625, 13.64697265625, 14.2998046875, 14.95263671875, 15.60546875, 16.25830078125, 16.9111328125, 17.56396484375, 18.216796875, 18.86962890625, 19.5224609375, 20.17529296875, 20.828125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 16.0, 21.0, 49.0, 62.0, 143.0, 213.0, 390.0, 678.0, 1245.0, 2126.0, 3567.0, 6167.0, 10526.0, 17259.0, 28611.0, 44955.0, 69613.0, 102398.0, 147043.0, 200973.0, 262494.0, 321046.0, 372496.0, 403169.0, 409187.0, 391368.0, 347984.0, 291735.0, 230534.0, 173377.0, 123918.0, 84598.0, 55825.0, 35360.0, 22051.0, 13562.0, 8132.0, 4759.0, 2727.0, 1685.0, 913.0, 544.0, 346.0, 171.0, 107.0, 60.0, 34.0, 17.0, 13.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.3125, -15.806640625, -15.30078125, -14.794921875, -14.2890625, -13.783203125, -13.27734375, -12.771484375, -12.265625, -11.759765625, -11.25390625, -10.748046875, -10.2421875, -9.736328125, -9.23046875, -8.724609375, -8.21875, -7.712890625, -7.20703125, -6.701171875, -6.1953125, -5.689453125, -5.18359375, -4.677734375, -4.171875, -3.666015625, -3.16015625, -2.654296875, -2.1484375, -1.642578125, -1.13671875, -0.630859375, -0.125, 0.380859375, 0.88671875, 1.392578125, 1.8984375, 2.404296875, 2.91015625, 3.416015625, 3.921875, 4.427734375, 4.93359375, 5.439453125, 5.9453125, 6.451171875, 6.95703125, 7.462890625, 7.96875, 8.474609375, 8.98046875, 9.486328125, 9.9921875, 10.498046875, 11.00390625, 11.509765625, 12.015625, 12.521484375, 13.02734375, 13.533203125, 14.0390625, 14.544921875, 15.05078125, 15.556640625, 16.0625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 3.0, 13.0, 13.0, 17.0, 17.0, 32.0, 53.0, 58.0, 63.0, 70.0, 87.0, 99.0, 118.0, 132.0, 147.0, 159.0, 196.0, 168.0, 211.0, 221.0, 226.0, 226.0, 179.0, 187.0, 184.0, 154.0, 167.0, 149.0, 108.0, 127.0, 106.0, 84.0, 62.0, 46.0, 42.0, 40.0, 25.0, 18.0, 13.0, 18.0, 12.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.7578125, -8.4412841796875, -8.124755859375, -7.8082275390625, -7.49169921875, -7.1751708984375, -6.858642578125, -6.5421142578125, -6.2255859375, -5.9090576171875, -5.592529296875, -5.2760009765625, -4.95947265625, -4.6429443359375, -4.326416015625, -4.0098876953125, -3.693359375, -3.3768310546875, -3.060302734375, -2.7437744140625, -2.42724609375, -2.1107177734375, -1.794189453125, -1.4776611328125, -1.1611328125, -0.8446044921875, -0.528076171875, -0.2115478515625, 0.10498046875, 0.4215087890625, 0.738037109375, 1.0545654296875, 1.37109375, 1.6876220703125, 2.004150390625, 2.3206787109375, 2.63720703125, 2.9537353515625, 3.270263671875, 3.5867919921875, 3.9033203125, 4.2198486328125, 4.536376953125, 4.8529052734375, 5.16943359375, 5.4859619140625, 5.802490234375, 6.1190185546875, 6.435546875, 6.7520751953125, 7.068603515625, 7.3851318359375, 7.70166015625, 8.0181884765625, 8.334716796875, 8.6512451171875, 8.9677734375, 9.2843017578125, 9.600830078125, 9.9173583984375, 10.23388671875, 10.5504150390625, 10.866943359375, 11.1834716796875, 11.5]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 7.0, 10.0, 15.0, 7.0, 9.0, 18.0, 12.0, 20.0, 20.0, 29.0, 26.0, 37.0, 38.0, 49.0, 51.0, 54.0, 42.0, 43.0, 49.0, 47.0, 54.0, 42.0, 39.0, 39.0, 44.0, 35.0, 20.0, 33.0, 26.0, 11.0, 10.0, 8.0, 10.0, 3.0, 5.0, 10.0, 6.0, 5.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.613582611083984, -23.887020111083984, -23.160457611083984, -22.43389320373535, -21.70733070373535, -20.98076820373535, -20.25420379638672, -19.52764129638672, -18.80107879638672, -18.07451629638672, -17.34795379638672, -16.621389389038086, -15.894826889038086, -15.168264389038086, -14.44170093536377, -13.715137481689453, -12.988574981689453, -12.262012481689453, -11.535449028015137, -10.80888557434082, -10.08232307434082, -9.35576057434082, -8.629197120666504, -7.902634143829346, -7.1760711669921875, -6.449508190155029, -5.722945213317871, -4.996382236480713, -4.269819259643555, -3.5432562828063965, -2.8166933059692383, -2.09013032913208, -1.3635692596435547, -0.6370062828063965, 0.08955669403076172, 0.8161196708679199, 1.5426826477050781, 2.2692456245422363, 2.9958086013793945, 3.7223715782165527, 4.448934555053711, 5.175497531890869, 5.902060508728027, 6.6286234855651855, 7.355186462402344, 8.081748962402344, 8.80831241607666, 9.534875869750977, 10.261438369750977, 10.988000869750977, 11.714564323425293, 12.44112777709961, 13.16769027709961, 13.89425277709961, 14.620816230773926, 15.347379684448242, 16.073942184448242, 16.800504684448242, 17.527069091796875, 18.253631591796875, 18.980194091796875, 19.706756591796875, 20.433319091796875, 21.159883499145508, 21.886445999145508]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 10.0, 10.0, 16.0, 17.0, 29.0, 22.0, 29.0, 28.0, 17.0, 34.0, 26.0, 26.0, 36.0, 36.0, 37.0, 40.0, 35.0, 47.0, 46.0, 43.0, 35.0, 36.0, 30.0, 32.0, 30.0, 40.0, 23.0, 26.0, 17.0, 18.0, 17.0, 17.0, 13.0, 16.0, 11.0, 10.0, 6.0, 5.0, 5.0, 4.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.615243911743164, -24.830129623413086, -24.045015335083008, -23.25990104675293, -22.47478675842285, -21.689672470092773, -20.904560089111328, -20.11944580078125, -19.334331512451172, -18.549217224121094, -17.764102935791016, -16.978988647460938, -16.19387435913086, -15.408760070800781, -14.62364673614502, -13.838532447814941, -13.053417205810547, -12.268302917480469, -11.48318862915039, -10.698074340820312, -9.912960052490234, -9.127845764160156, -8.342732429504395, -7.557618141174316, -6.772503852844238, -5.98738956451416, -5.202275276184082, -4.417161464691162, -3.632047176361084, -2.846932888031006, -2.061819076538086, -1.2767047882080078, -0.4915924072265625, 0.2935217618942261, 1.0786359310150146, 1.8637499809265137, 2.648864269256592, 3.43397855758667, 4.21909236907959, 5.004206657409668, 5.789320945739746, 6.574435234069824, 7.359549522399902, 8.144662857055664, 8.929777145385742, 9.71489143371582, 10.500005722045898, 11.285120010375977, 12.070234298706055, 12.855348587036133, 13.640462875366211, 14.425577163696289, 15.210691452026367, 15.995805740356445, 16.78091812133789, 17.56603240966797, 18.351146697998047, 19.136260986328125, 19.921375274658203, 20.70648956298828, 21.49160385131836, 22.276718139648438, 23.061832427978516, 23.846946716308594, 24.632061004638672]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 12.0, 15.0, 26.0, 20.0, 43.0, 62.0, 91.0, 164.0, 251.0, 385.0, 580.0, 864.0, 1248.0, 2018.0, 3241.0, 5210.0, 8410.0, 13471.0, 21555.0, 34992.0, 58269.0, 94223.0, 149020.0, 199817.0, 168677.0, 109294.0, 68190.0, 41451.0, 25132.0, 15603.0, 9572.0, 6009.0, 3821.0, 2369.0, 1590.0, 984.0, 631.0, 403.0, 285.0, 187.0, 129.0, 73.0, 52.0, 41.0, 26.0, 17.0, 12.0, 12.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.830078125, -2.740692138671875, -2.65130615234375, -2.561920166015625, -2.4725341796875, -2.383148193359375, -2.29376220703125, -2.204376220703125, -2.114990234375, -2.025604248046875, -1.93621826171875, -1.846832275390625, -1.7574462890625, -1.668060302734375, -1.57867431640625, -1.489288330078125, -1.39990234375, -1.310516357421875, -1.22113037109375, -1.131744384765625, -1.0423583984375, -0.952972412109375, -0.86358642578125, -0.774200439453125, -0.684814453125, -0.595428466796875, -0.50604248046875, -0.416656494140625, -0.3272705078125, -0.237884521484375, -0.14849853515625, -0.059112548828125, 0.0302734375, 0.119659423828125, 0.20904541015625, 0.298431396484375, 0.3878173828125, 0.477203369140625, 0.56658935546875, 0.655975341796875, 0.745361328125, 0.834747314453125, 0.92413330078125, 1.013519287109375, 1.1029052734375, 1.192291259765625, 1.28167724609375, 1.371063232421875, 1.46044921875, 1.549835205078125, 1.63922119140625, 1.728607177734375, 1.8179931640625, 1.907379150390625, 1.99676513671875, 2.086151123046875, 2.175537109375, 2.264923095703125, 2.35430908203125, 2.443695068359375, 2.5330810546875, 2.622467041015625, 2.71185302734375, 2.801239013671875, 2.890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 6.0, 14.0, 14.0, 22.0, 29.0, 19.0, 22.0, 32.0, 20.0, 24.0, 43.0, 29.0, 37.0, 37.0, 45.0, 42.0, 36.0, 52.0, 45.0, 49.0, 43.0, 37.0, 35.0, 32.0, 20.0, 30.0, 24.0, 17.0, 14.0, 21.0, 19.0, 21.0, 9.0, 7.0, 9.0, 6.0, 3.0, 2.0, 10.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.453125, -26.599853515625, -25.74658203125, -24.893310546875, -24.0400390625, -23.186767578125, -22.33349609375, -21.480224609375, -20.626953125, -19.773681640625, -18.92041015625, -18.067138671875, -17.2138671875, -16.360595703125, -15.50732421875, -14.654052734375, -13.80078125, -12.947509765625, -12.09423828125, -11.240966796875, -10.3876953125, -9.534423828125, -8.68115234375, -7.827880859375, -6.974609375, -6.121337890625, -5.26806640625, -4.414794921875, -3.5615234375, -2.708251953125, -1.85498046875, -1.001708984375, -0.1484375, 0.704833984375, 1.55810546875, 2.411376953125, 3.2646484375, 4.117919921875, 4.97119140625, 5.824462890625, 6.677734375, 7.531005859375, 8.38427734375, 9.237548828125, 10.0908203125, 10.944091796875, 11.79736328125, 12.650634765625, 13.50390625, 14.357177734375, 15.21044921875, 16.063720703125, 16.9169921875, 17.770263671875, 18.62353515625, 19.476806640625, 20.330078125, 21.183349609375, 22.03662109375, 22.889892578125, 23.7431640625, 24.596435546875, 25.44970703125, 26.302978515625, 27.15625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 4.0, 4.0, 13.0, 11.0, 22.0, 30.0, 42.0, 63.0, 90.0, 161.0, 179.0, 273.0, 406.0, 572.0, 784.0, 1092.0, 1532.0, 2102.0, 3084.0, 4444.0, 6628.0, 9629.0, 14619.0, 21747.0, 32931.0, 51203.0, 78019.0, 115358.0, 159933.0, 167497.0, 125082.0, 85731.0, 55596.0, 36086.0, 23551.0, 15885.0, 10661.0, 7186.0, 4927.0, 3428.0, 2302.0, 1639.0, 1137.0, 851.0, 569.0, 421.0, 325.0, 217.0, 139.0, 124.0, 85.0, 41.0, 37.0, 27.0, 16.0, 14.0, 10.0, 2.0, 1.0, 3.0, 2.0], "bins": [-2.642578125, -2.560272216796875, -2.47796630859375, -2.395660400390625, -2.3133544921875, -2.231048583984375, -2.14874267578125, -2.066436767578125, -1.984130859375, -1.901824951171875, -1.81951904296875, -1.737213134765625, -1.6549072265625, -1.572601318359375, -1.49029541015625, -1.407989501953125, -1.32568359375, -1.243377685546875, -1.16107177734375, -1.078765869140625, -0.9964599609375, -0.914154052734375, -0.83184814453125, -0.749542236328125, -0.667236328125, -0.584930419921875, -0.50262451171875, -0.420318603515625, -0.3380126953125, -0.255706787109375, -0.17340087890625, -0.091094970703125, -0.0087890625, 0.073516845703125, 0.15582275390625, 0.238128662109375, 0.3204345703125, 0.402740478515625, 0.48504638671875, 0.567352294921875, 0.649658203125, 0.731964111328125, 0.81427001953125, 0.896575927734375, 0.9788818359375, 1.061187744140625, 1.14349365234375, 1.225799560546875, 1.30810546875, 1.390411376953125, 1.47271728515625, 1.555023193359375, 1.6373291015625, 1.719635009765625, 1.80194091796875, 1.884246826171875, 1.966552734375, 2.048858642578125, 2.13116455078125, 2.213470458984375, 2.2957763671875, 2.378082275390625, 2.46038818359375, 2.542694091796875, 2.625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 9.0, 10.0, 16.0, 8.0, 17.0, 14.0, 24.0, 17.0, 25.0, 29.0, 30.0, 34.0, 26.0, 32.0, 31.0, 32.0, 28.0, 40.0, 33.0, 29.0, 42.0, 35.0, 31.0, 32.0, 29.0, 38.0, 35.0, 30.0, 24.0, 33.0, 26.0, 27.0, 21.0, 14.0, 18.0, 11.0, 13.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 5.0, 5.0, 6.0, 0.0, 0.0, 1.0], "bins": [-16.34375, -15.8681640625, -15.392578125, -14.9169921875, -14.44140625, -13.9658203125, -13.490234375, -13.0146484375, -12.5390625, -12.0634765625, -11.587890625, -11.1123046875, -10.63671875, -10.1611328125, -9.685546875, -9.2099609375, -8.734375, -8.2587890625, -7.783203125, -7.3076171875, -6.83203125, -6.3564453125, -5.880859375, -5.4052734375, -4.9296875, -4.4541015625, -3.978515625, -3.5029296875, -3.02734375, -2.5517578125, -2.076171875, -1.6005859375, -1.125, -0.6494140625, -0.173828125, 0.3017578125, 0.77734375, 1.2529296875, 1.728515625, 2.2041015625, 2.6796875, 3.1552734375, 3.630859375, 4.1064453125, 4.58203125, 5.0576171875, 5.533203125, 6.0087890625, 6.484375, 6.9599609375, 7.435546875, 7.9111328125, 8.38671875, 8.8623046875, 9.337890625, 9.8134765625, 10.2890625, 10.7646484375, 11.240234375, 11.7158203125, 12.19140625, 12.6669921875, 13.142578125, 13.6181640625, 14.09375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 12.0, 19.0, 16.0, 30.0, 43.0, 66.0, 89.0, 137.0, 208.0, 302.0, 454.0, 646.0, 985.0, 1504.0, 2183.0, 3327.0, 4950.0, 7618.0, 12255.0, 19416.0, 31987.0, 54819.0, 98731.0, 188241.0, 255512.0, 158853.0, 83971.0, 46461.0, 27557.0, 17016.0, 10642.0, 7018.0, 4419.0, 2981.0, 2000.0, 1339.0, 879.0, 624.0, 373.0, 280.0, 161.0, 131.0, 84.0, 61.0, 44.0, 39.0, 29.0, 10.0, 13.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0933837890625, -0.09040641784667969, -0.08742904663085938, -0.08445167541503906, -0.08147430419921875, -0.07849693298339844, -0.07551956176757812, -0.07254219055175781, -0.0695648193359375, -0.06658744812011719, -0.06361007690429688, -0.06063270568847656, -0.05765533447265625, -0.05467796325683594, -0.051700592041015625, -0.04872322082519531, -0.045745849609375, -0.04276847839355469, -0.039791107177734375, -0.03681373596191406, -0.03383636474609375, -0.030858993530273438, -0.027881622314453125, -0.024904251098632812, -0.0219268798828125, -0.018949508666992188, -0.015972137451171875, -0.012994766235351562, -0.01001739501953125, -0.0070400238037109375, -0.004062652587890625, -0.0010852813720703125, 0.00189208984375, 0.0048694610595703125, 0.007846832275390625, 0.010824203491210938, 0.01380157470703125, 0.016778945922851562, 0.019756317138671875, 0.022733688354492188, 0.0257110595703125, 0.028688430786132812, 0.031665802001953125, 0.03464317321777344, 0.03762054443359375, 0.04059791564941406, 0.043575286865234375, 0.04655265808105469, 0.049530029296875, 0.05250740051269531, 0.055484771728515625, 0.05846214294433594, 0.06143951416015625, 0.06441688537597656, 0.06739425659179688, 0.07037162780761719, 0.0733489990234375, 0.07632637023925781, 0.07930374145507812, 0.08228111267089844, 0.08525848388671875, 0.08823585510253906, 0.09121322631835938, 0.09419059753417969, 0.09716796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 13.0, 10.0, 6.0, 7.0, 17.0, 13.0, 18.0, 18.0, 23.0, 23.0, 28.0, 26.0, 36.0, 38.0, 35.0, 34.0, 47.0, 37.0, 48.0, 55.0, 35.0, 39.0, 45.0, 58.0, 31.0, 28.0, 19.0, 23.0, 29.0, 25.0, 16.0, 20.0, 16.0, 15.0, 14.0, 8.0, 9.0, 10.0, 6.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9371509552001953e-05, -1.8822960555553436e-05, -1.827441155910492e-05, -1.7725862562656403e-05, -1.7177313566207886e-05, -1.662876456975937e-05, -1.6080215573310852e-05, -1.5531666576862335e-05, -1.4983117580413818e-05, -1.4434568583965302e-05, -1.3886019587516785e-05, -1.3337470591068268e-05, -1.2788921594619751e-05, -1.2240372598171234e-05, -1.1691823601722717e-05, -1.11432746052742e-05, -1.0594725608825684e-05, -1.0046176612377167e-05, -9.49762761592865e-06, -8.949078619480133e-06, -8.400529623031616e-06, -7.8519806265831e-06, -7.3034316301345825e-06, -6.754882633686066e-06, -6.206333637237549e-06, -5.657784640789032e-06, -5.109235644340515e-06, -4.560686647891998e-06, -4.0121376514434814e-06, -3.4635886549949646e-06, -2.9150396585464478e-06, -2.366490662097931e-06, -1.817941665649414e-06, -1.2693926692008972e-06, -7.208436727523804e-07, -1.7229467630386353e-07, 3.762543201446533e-07, 9.248033165931702e-07, 1.473352313041687e-06, 2.021901309490204e-06, 2.5704503059387207e-06, 3.1189993023872375e-06, 3.6675482988357544e-06, 4.216097295284271e-06, 4.764646291732788e-06, 5.313195288181305e-06, 5.861744284629822e-06, 6.410293281078339e-06, 6.9588422775268555e-06, 7.507391273975372e-06, 8.05594027042389e-06, 8.604489266872406e-06, 9.153038263320923e-06, 9.70158725976944e-06, 1.0250136256217957e-05, 1.0798685252666473e-05, 1.134723424911499e-05, 1.1895783245563507e-05, 1.2444332242012024e-05, 1.299288123846054e-05, 1.3541430234909058e-05, 1.4089979231357574e-05, 1.4638528227806091e-05, 1.5187077224254608e-05, 1.5735626220703125e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 14.0, 32.0, 50.0, 80.0, 140.0, 185.0, 276.0, 438.0, 685.0, 1065.0, 1665.0, 2590.0, 3972.0, 6450.0, 10387.0, 17062.0, 28415.0, 49068.0, 93533.0, 203754.0, 305586.0, 149479.0, 72827.0, 39662.0, 23314.0, 14332.0, 8698.0, 5362.0, 3467.0, 2139.0, 1413.0, 911.0, 517.0, 363.0, 218.0, 170.0, 96.0, 48.0, 34.0, 22.0, 10.0, 9.0, 6.0, 0.0, 3.0, 3.0], "bins": [-0.275634765625, -0.26844024658203125, -0.2612457275390625, -0.25405120849609375, -0.246856689453125, -0.23966217041015625, -0.2324676513671875, -0.22527313232421875, -0.21807861328125, -0.21088409423828125, -0.2036895751953125, -0.19649505615234375, -0.189300537109375, -0.18210601806640625, -0.1749114990234375, -0.16771697998046875, -0.1605224609375, -0.15332794189453125, -0.1461334228515625, -0.13893890380859375, -0.131744384765625, -0.12454986572265625, -0.1173553466796875, -0.11016082763671875, -0.10296630859375, -0.09577178955078125, -0.0885772705078125, -0.08138275146484375, -0.074188232421875, -0.06699371337890625, -0.0597991943359375, -0.05260467529296875, -0.04541015625, -0.03821563720703125, -0.0310211181640625, -0.02382659912109375, -0.016632080078125, -0.00943756103515625, -0.0022430419921875, 0.00495147705078125, 0.01214599609375, 0.01934051513671875, 0.0265350341796875, 0.03372955322265625, 0.040924072265625, 0.04811859130859375, 0.0553131103515625, 0.06250762939453125, 0.0697021484375, 0.07689666748046875, 0.0840911865234375, 0.09128570556640625, 0.098480224609375, 0.10567474365234375, 0.1128692626953125, 0.12006378173828125, 0.12725830078125, 0.13445281982421875, 0.1416473388671875, 0.14884185791015625, 0.156036376953125, 0.16323089599609375, 0.1704254150390625, 0.17761993408203125, 0.184814453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 1.0, 6.0, 10.0, 5.0, 5.0, 7.0, 6.0, 17.0, 10.0, 20.0, 19.0, 21.0, 26.0, 32.0, 37.0, 29.0, 46.0, 43.0, 55.0, 65.0, 73.0, 61.0, 56.0, 40.0, 40.0, 47.0, 30.0, 21.0, 25.0, 22.0, 22.0, 11.0, 11.0, 14.0, 12.0, 6.0, 5.0, 9.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.106201171875, -0.10307502746582031, -0.09994888305664062, -0.09682273864746094, -0.09369659423828125, -0.09057044982910156, -0.08744430541992188, -0.08431816101074219, -0.0811920166015625, -0.07806587219238281, -0.07493972778320312, -0.07181358337402344, -0.06868743896484375, -0.06556129455566406, -0.062435150146484375, -0.05930900573730469, -0.056182861328125, -0.05305671691894531, -0.049930572509765625, -0.04680442810058594, -0.04367828369140625, -0.04055213928222656, -0.037425994873046875, -0.03429985046386719, -0.0311737060546875, -0.028047561645507812, -0.024921417236328125, -0.021795272827148438, -0.01866912841796875, -0.015542984008789062, -0.012416839599609375, -0.009290695190429688, -0.00616455078125, -0.0030384063720703125, 8.7738037109375e-05, 0.0032138824462890625, 0.00634002685546875, 0.009466171264648438, 0.012592315673828125, 0.015718460083007812, 0.0188446044921875, 0.021970748901367188, 0.025096893310546875, 0.028223037719726562, 0.03134918212890625, 0.03447532653808594, 0.037601470947265625, 0.04072761535644531, 0.043853759765625, 0.04697990417480469, 0.050106048583984375, 0.05323219299316406, 0.05635833740234375, 0.05948448181152344, 0.06261062622070312, 0.06573677062988281, 0.0688629150390625, 0.07198905944824219, 0.07511520385742188, 0.07824134826660156, 0.08136749267578125, 0.08449363708496094, 0.08761978149414062, 0.09074592590332031, 0.0938720703125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 4.0, 4.0, 7.0, 16.0, 9.0, 8.0, 16.0, 11.0, 17.0, 17.0, 28.0, 29.0, 34.0, 38.0, 51.0, 38.0, 57.0, 46.0, 43.0, 48.0, 43.0, 58.0, 43.0, 41.0, 42.0, 41.0, 34.0, 33.0, 32.0, 23.0, 17.0, 10.0, 6.0, 11.0, 8.0, 2.0, 10.0, 8.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.042255401611328, -24.314136505126953, -23.58601951599121, -22.85790252685547, -22.129783630371094, -21.40166473388672, -20.673547744750977, -19.945430755615234, -19.21731185913086, -18.489192962646484, -17.761075973510742, -17.032958984375, -16.304840087890625, -15.576722145080566, -14.848604202270508, -14.12048625946045, -13.39236831665039, -12.664250373840332, -11.936132431030273, -11.208014488220215, -10.479896545410156, -9.751778602600098, -9.023660659790039, -8.29554271697998, -7.567424774169922, -6.839306831359863, -6.111188888549805, -5.383070945739746, -4.6549530029296875, -3.926835060119629, -3.1987171173095703, -2.4705991744995117, -1.742483139038086, -1.0143651962280273, -0.28624725341796875, 0.44187068939208984, 1.1699886322021484, 1.898106575012207, 2.6262245178222656, 3.354342460632324, 4.082460403442383, 4.810578346252441, 5.5386962890625, 6.266814231872559, 6.994932174682617, 7.723050117492676, 8.451168060302734, 9.179286003112793, 9.907403945922852, 10.63552188873291, 11.363639831542969, 12.091757774353027, 12.819875717163086, 13.547993659973145, 14.276111602783203, 15.004229545593262, 15.73234748840332, 16.460464477539062, 17.188583374023438, 17.916702270507812, 18.644819259643555, 19.372936248779297, 20.101055145263672, 20.829174041748047, 21.55729103088379]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 10.0, 11.0, 15.0, 17.0, 30.0, 22.0, 28.0, 28.0, 16.0, 36.0, 26.0, 25.0, 36.0, 36.0, 36.0, 41.0, 36.0, 47.0, 45.0, 41.0, 37.0, 37.0, 29.0, 31.0, 32.0, 40.0, 24.0, 23.0, 17.0, 20.0, 16.0, 18.0, 13.0, 15.0, 12.0, 9.0, 6.0, 6.0, 4.0, 4.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.85509490966797, -25.070707321166992, -24.286319732666016, -23.50193214416504, -22.717544555664062, -21.933156967163086, -21.14876937866211, -20.364381790161133, -19.579994201660156, -18.79560661315918, -18.011219024658203, -17.226831436157227, -16.44244384765625, -15.658056259155273, -14.873668670654297, -14.08928108215332, -13.304893493652344, -12.520505905151367, -11.73611831665039, -10.951730728149414, -10.167343139648438, -9.382955551147461, -8.598567962646484, -7.814180374145508, -7.029792785644531, -6.245405197143555, -5.461017608642578, -4.676630020141602, -3.892242431640625, -3.1078548431396484, -2.323467254638672, -1.5390796661376953, -0.7546939849853516, 0.029693603515625, 0.8140811920166016, 1.5984687805175781, 2.3828563690185547, 3.1672439575195312, 3.951631546020508, 4.736019134521484, 5.520406723022461, 6.3047943115234375, 7.089181900024414, 7.873569488525391, 8.657957077026367, 9.442344665527344, 10.22673225402832, 11.011119842529297, 11.795507431030273, 12.57989501953125, 13.364282608032227, 14.148670196533203, 14.93305778503418, 15.717445373535156, 16.501832962036133, 17.28622055053711, 18.070608139038086, 18.854995727539062, 19.63938331604004, 20.423770904541016, 21.208158493041992, 21.99254608154297, 22.776933670043945, 23.561321258544922, 24.3457088470459]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 10.0, 16.0, 26.0, 36.0, 69.0, 116.0, 182.0, 343.0, 542.0, 885.0, 1366.0, 2077.0, 3521.0, 5352.0, 8537.0, 12293.0, 17913.0, 25969.0, 36104.0, 47952.0, 60978.0, 74454.0, 85743.0, 93836.0, 96337.0, 93719.0, 85383.0, 73733.0, 60256.0, 47184.0, 35443.0, 25692.0, 18029.0, 12094.0, 8138.0, 5296.0, 3402.0, 2072.0, 1384.0, 832.0, 491.0, 313.0, 178.0, 106.0, 70.0, 27.0, 24.0, 17.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3046875, -9.966552734375, -9.62841796875, -9.290283203125, -8.9521484375, -8.614013671875, -8.27587890625, -7.937744140625, -7.599609375, -7.261474609375, -6.92333984375, -6.585205078125, -6.2470703125, -5.908935546875, -5.57080078125, -5.232666015625, -4.89453125, -4.556396484375, -4.21826171875, -3.880126953125, -3.5419921875, -3.203857421875, -2.86572265625, -2.527587890625, -2.189453125, -1.851318359375, -1.51318359375, -1.175048828125, -0.8369140625, -0.498779296875, -0.16064453125, 0.177490234375, 0.515625, 0.853759765625, 1.19189453125, 1.530029296875, 1.8681640625, 2.206298828125, 2.54443359375, 2.882568359375, 3.220703125, 3.558837890625, 3.89697265625, 4.235107421875, 4.5732421875, 4.911376953125, 5.24951171875, 5.587646484375, 5.92578125, 6.263916015625, 6.60205078125, 6.940185546875, 7.2783203125, 7.616455078125, 7.95458984375, 8.292724609375, 8.630859375, 8.968994140625, 9.30712890625, 9.645263671875, 9.9833984375, 10.321533203125, 10.65966796875, 10.997802734375, 11.3359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 13.0, 16.0, 13.0, 30.0, 26.0, 30.0, 30.0, 21.0, 34.0, 35.0, 34.0, 41.0, 31.0, 47.0, 45.0, 44.0, 46.0, 36.0, 48.0, 46.0, 27.0, 41.0, 36.0, 32.0, 23.0, 20.0, 19.0, 20.0, 18.0, 13.0, 16.0, 17.0, 10.0, 5.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.9375, -28.05810546875, -27.1787109375, -26.29931640625, -25.419921875, -24.54052734375, -23.6611328125, -22.78173828125, -21.90234375, -21.02294921875, -20.1435546875, -19.26416015625, -18.384765625, -17.50537109375, -16.6259765625, -15.74658203125, -14.8671875, -13.98779296875, -13.1083984375, -12.22900390625, -11.349609375, -10.47021484375, -9.5908203125, -8.71142578125, -7.83203125, -6.95263671875, -6.0732421875, -5.19384765625, -4.314453125, -3.43505859375, -2.5556640625, -1.67626953125, -0.796875, 0.08251953125, 0.9619140625, 1.84130859375, 2.720703125, 3.60009765625, 4.4794921875, 5.35888671875, 6.23828125, 7.11767578125, 7.9970703125, 8.87646484375, 9.755859375, 10.63525390625, 11.5146484375, 12.39404296875, 13.2734375, 14.15283203125, 15.0322265625, 15.91162109375, 16.791015625, 17.67041015625, 18.5498046875, 19.42919921875, 20.30859375, 21.18798828125, 22.0673828125, 22.94677734375, 23.826171875, 24.70556640625, 25.5849609375, 26.46435546875, 27.34375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 9.0, 14.0, 15.0, 33.0, 40.0, 81.0, 96.0, 172.0, 240.0, 429.0, 652.0, 1012.0, 1542.0, 2438.0, 3622.0, 5541.0, 8310.0, 12013.0, 17286.0, 24413.0, 32866.0, 43691.0, 54914.0, 66543.0, 77582.0, 85413.0, 90327.0, 89510.0, 84564.0, 76325.0, 65325.0, 53752.0, 42145.0, 32106.0, 23383.0, 16673.0, 11863.0, 8124.0, 5340.0, 3597.0, 2335.0, 1544.0, 1001.0, 587.0, 398.0, 250.0, 155.0, 109.0, 58.0, 53.0, 24.0, 17.0, 15.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.3125, -9.98974609375, -9.6669921875, -9.34423828125, -9.021484375, -8.69873046875, -8.3759765625, -8.05322265625, -7.73046875, -7.40771484375, -7.0849609375, -6.76220703125, -6.439453125, -6.11669921875, -5.7939453125, -5.47119140625, -5.1484375, -4.82568359375, -4.5029296875, -4.18017578125, -3.857421875, -3.53466796875, -3.2119140625, -2.88916015625, -2.56640625, -2.24365234375, -1.9208984375, -1.59814453125, -1.275390625, -0.95263671875, -0.6298828125, -0.30712890625, 0.015625, 0.33837890625, 0.6611328125, 0.98388671875, 1.306640625, 1.62939453125, 1.9521484375, 2.27490234375, 2.59765625, 2.92041015625, 3.2431640625, 3.56591796875, 3.888671875, 4.21142578125, 4.5341796875, 4.85693359375, 5.1796875, 5.50244140625, 5.8251953125, 6.14794921875, 6.470703125, 6.79345703125, 7.1162109375, 7.43896484375, 7.76171875, 8.08447265625, 8.4072265625, 8.72998046875, 9.052734375, 9.37548828125, 9.6982421875, 10.02099609375, 10.34375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 15.0, 18.0, 15.0, 17.0, 19.0, 25.0, 29.0, 18.0, 37.0, 40.0, 39.0, 28.0, 24.0, 49.0, 56.0, 43.0, 57.0, 36.0, 48.0, 49.0, 45.0, 26.0, 37.0, 35.0, 37.0, 26.0, 17.0, 24.0, 20.0, 17.0, 10.0, 8.0, 9.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.208251953125, -15.60400390625, -14.999755859375, -14.3955078125, -13.791259765625, -13.18701171875, -12.582763671875, -11.978515625, -11.374267578125, -10.77001953125, -10.165771484375, -9.5615234375, -8.957275390625, -8.35302734375, -7.748779296875, -7.14453125, -6.540283203125, -5.93603515625, -5.331787109375, -4.7275390625, -4.123291015625, -3.51904296875, -2.914794921875, -2.310546875, -1.706298828125, -1.10205078125, -0.497802734375, 0.1064453125, 0.710693359375, 1.31494140625, 1.919189453125, 2.5234375, 3.127685546875, 3.73193359375, 4.336181640625, 4.9404296875, 5.544677734375, 6.14892578125, 6.753173828125, 7.357421875, 7.961669921875, 8.56591796875, 9.170166015625, 9.7744140625, 10.378662109375, 10.98291015625, 11.587158203125, 12.19140625, 12.795654296875, 13.39990234375, 14.004150390625, 14.6083984375, 15.212646484375, 15.81689453125, 16.421142578125, 17.025390625, 17.629638671875, 18.23388671875, 18.838134765625, 19.4423828125, 20.046630859375, 20.65087890625, 21.255126953125, 21.859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 10.0, 15.0, 22.0, 29.0, 41.0, 82.0, 128.0, 252.0, 351.0, 578.0, 1047.0, 1687.0, 2844.0, 4905.0, 7755.0, 12535.0, 19481.0, 29299.0, 41941.0, 57225.0, 74204.0, 89198.0, 101029.0, 106255.0, 104127.0, 95746.0, 81612.0, 66352.0, 49463.0, 35529.0, 24039.0, 15714.0, 9996.0, 6055.0, 3579.0, 2235.0, 1261.0, 792.0, 436.0, 281.0, 156.0, 97.0, 66.0, 36.0, 31.0, 14.0, 11.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.0078125, -3.88543701171875, -3.7630615234375, -3.64068603515625, -3.518310546875, -3.39593505859375, -3.2735595703125, -3.15118408203125, -3.02880859375, -2.90643310546875, -2.7840576171875, -2.66168212890625, -2.539306640625, -2.41693115234375, -2.2945556640625, -2.17218017578125, -2.0498046875, -1.92742919921875, -1.8050537109375, -1.68267822265625, -1.560302734375, -1.43792724609375, -1.3155517578125, -1.19317626953125, -1.07080078125, -0.94842529296875, -0.8260498046875, -0.70367431640625, -0.581298828125, -0.45892333984375, -0.3365478515625, -0.21417236328125, -0.091796875, 0.03057861328125, 0.1529541015625, 0.27532958984375, 0.397705078125, 0.52008056640625, 0.6424560546875, 0.76483154296875, 0.88720703125, 1.00958251953125, 1.1319580078125, 1.25433349609375, 1.376708984375, 1.49908447265625, 1.6214599609375, 1.74383544921875, 1.8662109375, 1.98858642578125, 2.1109619140625, 2.23333740234375, 2.355712890625, 2.47808837890625, 2.6004638671875, 2.72283935546875, 2.84521484375, 2.96759033203125, 3.0899658203125, 3.21234130859375, 3.334716796875, 3.45709228515625, 3.5794677734375, 3.70184326171875, 3.82421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 12.0, 8.0, 12.0, 11.0, 12.0, 14.0, 10.0, 27.0, 11.0, 25.0, 34.0, 38.0, 37.0, 33.0, 49.0, 37.0, 31.0, 47.0, 50.0, 51.0, 32.0, 49.0, 47.0, 30.0, 34.0, 37.0, 27.0, 27.0, 26.0, 18.0, 17.0, 13.0, 9.0, 10.0, 9.0, 15.0, 5.0, 10.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00044083595275878906, -0.0004268437623977661, -0.00041285157203674316, -0.0003988593816757202, -0.00038486719131469727, -0.0003708750009536743, -0.00035688281059265137, -0.0003428906202316284, -0.00032889842987060547, -0.0003149062395095825, -0.00030091404914855957, -0.0002869218587875366, -0.00027292966842651367, -0.0002589374780654907, -0.0002449452877044678, -0.00023095309734344482, -0.00021696090698242188, -0.00020296871662139893, -0.00018897652626037598, -0.00017498433589935303, -0.00016099214553833008, -0.00014699995517730713, -0.00013300776481628418, -0.00011901557445526123, -0.00010502338409423828, -9.103119373321533e-05, -7.703900337219238e-05, -6.304681301116943e-05, -4.9054622650146484e-05, -3.5062432289123535e-05, -2.1070241928100586e-05, -7.078051567077637e-06, 6.9141387939453125e-06, 2.0906329154968262e-05, 3.489851951599121e-05, 4.889070987701416e-05, 6.288290023803711e-05, 7.687509059906006e-05, 9.086728096008301e-05, 0.00010485947132110596, 0.0001188516616821289, 0.00013284385204315186, 0.0001468360424041748, 0.00016082823276519775, 0.0001748204231262207, 0.00018881261348724365, 0.0002028048038482666, 0.00021679699420928955, 0.0002307891845703125, 0.00024478137493133545, 0.0002587735652923584, 0.00027276575565338135, 0.0002867579460144043, 0.00030075013637542725, 0.0003147423267364502, 0.00032873451709747314, 0.0003427267074584961, 0.00035671889781951904, 0.000370711088180542, 0.00038470327854156494, 0.0003986954689025879, 0.00041268765926361084, 0.0004266798496246338, 0.00044067203998565674, 0.0004546642303466797]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 8.0, 12.0, 14.0, 22.0, 24.0, 49.0, 85.0, 123.0, 177.0, 317.0, 502.0, 733.0, 1257.0, 2094.0, 3463.0, 5720.0, 9661.0, 15390.0, 24832.0, 38024.0, 54360.0, 73719.0, 93306.0, 108417.0, 115994.0, 114644.0, 102980.0, 85164.0, 66177.0, 46756.0, 31776.0, 20581.0, 12736.0, 7647.0, 4735.0, 2831.0, 1636.0, 927.0, 618.0, 385.0, 223.0, 162.0, 94.0, 64.0, 36.0, 30.0, 21.0, 17.0, 9.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.4375, -4.29791259765625, -4.1583251953125, -4.01873779296875, -3.879150390625, -3.73956298828125, -3.5999755859375, -3.46038818359375, -3.32080078125, -3.18121337890625, -3.0416259765625, -2.90203857421875, -2.762451171875, -2.62286376953125, -2.4832763671875, -2.34368896484375, -2.2041015625, -2.06451416015625, -1.9249267578125, -1.78533935546875, -1.645751953125, -1.50616455078125, -1.3665771484375, -1.22698974609375, -1.08740234375, -0.94781494140625, -0.8082275390625, -0.66864013671875, -0.529052734375, -0.38946533203125, -0.2498779296875, -0.11029052734375, 0.029296875, 0.16888427734375, 0.3084716796875, 0.44805908203125, 0.587646484375, 0.72723388671875, 0.8668212890625, 1.00640869140625, 1.14599609375, 1.28558349609375, 1.4251708984375, 1.56475830078125, 1.704345703125, 1.84393310546875, 1.9835205078125, 2.12310791015625, 2.2626953125, 2.40228271484375, 2.5418701171875, 2.68145751953125, 2.821044921875, 2.96063232421875, 3.1002197265625, 3.23980712890625, 3.37939453125, 3.51898193359375, 3.6585693359375, 3.79815673828125, 3.937744140625, 4.07733154296875, 4.2169189453125, 4.35650634765625, 4.49609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 3.0, 11.0, 7.0, 15.0, 22.0, 27.0, 34.0, 40.0, 40.0, 50.0, 61.0, 63.0, 55.0, 74.0, 57.0, 60.0, 58.0, 67.0, 52.0, 31.0, 38.0, 19.0, 27.0, 24.0, 20.0, 9.0, 5.0, 1.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.541015625, -2.455780029296875, -2.37054443359375, -2.285308837890625, -2.2000732421875, -2.114837646484375, -2.02960205078125, -1.944366455078125, -1.859130859375, -1.773895263671875, -1.68865966796875, -1.603424072265625, -1.5181884765625, -1.432952880859375, -1.34771728515625, -1.262481689453125, -1.17724609375, -1.092010498046875, -1.00677490234375, -0.921539306640625, -0.8363037109375, -0.751068115234375, -0.66583251953125, -0.580596923828125, -0.495361328125, -0.410125732421875, -0.32489013671875, -0.239654541015625, -0.1544189453125, -0.069183349609375, 0.01605224609375, 0.101287841796875, 0.1865234375, 0.271759033203125, 0.35699462890625, 0.442230224609375, 0.5274658203125, 0.612701416015625, 0.69793701171875, 0.783172607421875, 0.868408203125, 0.953643798828125, 1.03887939453125, 1.124114990234375, 1.2093505859375, 1.294586181640625, 1.37982177734375, 1.465057373046875, 1.55029296875, 1.635528564453125, 1.72076416015625, 1.805999755859375, 1.8912353515625, 1.976470947265625, 2.06170654296875, 2.146942138671875, 2.232177734375, 2.317413330078125, 2.40264892578125, 2.487884521484375, 2.5731201171875, 2.658355712890625, 2.74359130859375, 2.828826904296875, 2.9140625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 7.0, 2.0, 3.0, 3.0, 8.0, 10.0, 9.0, 11.0, 15.0, 18.0, 16.0, 15.0, 29.0, 32.0, 31.0, 28.0, 48.0, 49.0, 42.0, 39.0, 32.0, 44.0, 44.0, 56.0, 56.0, 47.0, 43.0, 33.0, 24.0, 32.0, 37.0, 25.0, 29.0, 16.0, 15.0, 10.0, 8.0, 5.0, 4.0, 7.0, 7.0, 9.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.956127166748047, -23.24897575378418, -22.541824340820312, -21.834674835205078, -21.12752342224121, -20.420372009277344, -19.713220596313477, -19.00606918334961, -18.298919677734375, -17.591768264770508, -16.88461685180664, -16.177467346191406, -15.470315933227539, -14.763164520263672, -14.056013107299805, -13.348862648010254, -12.641711235046387, -11.93455982208252, -11.227409362792969, -10.520257949829102, -9.81310749053955, -9.105956077575684, -8.398805618286133, -7.691654205322266, -6.984503269195557, -6.277352333068848, -5.570201396942139, -4.86305046081543, -4.1558990478515625, -3.4487483501434326, -2.7415971755981445, -2.0344462394714355, -1.3272953033447266, -0.6201443076133728, 0.08700668811798096, 0.7941577434539795, 1.5013086795806885, 2.2084596157073975, 2.9156107902526855, 3.6227617263793945, 4.3299126625061035, 5.0370635986328125, 5.7442145347595215, 6.4513654708862305, 7.158516883850098, 7.865667343139648, 8.572818756103516, 9.279970169067383, 9.987120628356934, 10.6942720413208, 11.401422500610352, 12.108573913574219, 12.81572437286377, 13.522875785827637, 14.230026245117188, 14.937177658081055, 15.644329071044922, 16.35148048400879, 17.058631896972656, 17.76578140258789, 18.472932815551758, 19.180084228515625, 19.887235641479492, 20.59438705444336, 21.301536560058594]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 8.0, 7.0, 9.0, 12.0, 9.0, 15.0, 25.0, 20.0, 31.0, 30.0, 34.0, 28.0, 34.0, 36.0, 31.0, 25.0, 47.0, 45.0, 35.0, 39.0, 41.0, 41.0, 31.0, 36.0, 23.0, 40.0, 30.0, 31.0, 27.0, 25.0, 26.0, 20.0, 15.0, 9.0, 11.0, 14.0, 8.0, 12.0, 6.0, 5.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.08310890197754, -26.21101951599121, -25.338930130004883, -24.466840744018555, -23.594751358032227, -22.72266387939453, -21.850574493408203, -20.978485107421875, -20.106395721435547, -19.23430633544922, -18.36221694946289, -17.490127563476562, -16.618038177490234, -15.745949745178223, -14.873860359191895, -14.001771926879883, -13.129681587219238, -12.25759220123291, -11.385502815246582, -10.51341438293457, -9.641324996948242, -8.769235610961914, -7.897146224975586, -7.025057315826416, -6.152967929840088, -5.28087854385376, -4.40878963470459, -3.5367002487182617, -2.6646111011505127, -1.7925219535827637, -0.9204325675964355, -0.048343658447265625, 0.8237457275390625, 1.6958348751068115, 2.5679240226745605, 3.4400134086608887, 4.312102317810059, 5.184191703796387, 6.056281089782715, 6.928369998931885, 7.800459384918213, 8.672548294067383, 9.544637680053711, 10.416727066040039, 11.288816452026367, 12.160905838012695, 13.032995223999023, 13.905083656311035, 14.777173042297363, 15.649262428283691, 16.521350860595703, 17.39344024658203, 18.26552963256836, 19.137619018554688, 20.009708404541016, 20.881797790527344, 21.753887176513672, 22.6259765625, 23.498065948486328, 24.370155334472656, 25.242244720458984, 26.114334106445312, 26.98642349243164, 27.858510971069336, 28.730600357055664]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 21.0, 59.0, 104.0, 157.0, 304.0, 550.0, 1018.0, 1762.0, 2982.0, 5187.0, 8743.0, 15033.0, 24482.0, 39851.0, 63770.0, 99411.0, 148066.0, 210314.0, 283273.0, 358261.0, 419378.0, 451482.0, 446545.0, 408927.0, 344271.0, 270687.0, 199546.0, 139534.0, 93210.0, 60768.0, 38139.0, 23420.0, 14305.0, 8580.0, 5029.0, 2931.0, 1741.0, 1030.0, 586.0, 372.0, 192.0, 115.0, 57.0, 27.0, 24.0, 18.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.703369140625, -18.07861328125, -17.453857421875, -16.8291015625, -16.204345703125, -15.57958984375, -14.954833984375, -14.330078125, -13.705322265625, -13.08056640625, -12.455810546875, -11.8310546875, -11.206298828125, -10.58154296875, -9.956787109375, -9.33203125, -8.707275390625, -8.08251953125, -7.457763671875, -6.8330078125, -6.208251953125, -5.58349609375, -4.958740234375, -4.333984375, -3.709228515625, -3.08447265625, -2.459716796875, -1.8349609375, -1.210205078125, -0.58544921875, 0.039306640625, 0.6640625, 1.288818359375, 1.91357421875, 2.538330078125, 3.1630859375, 3.787841796875, 4.41259765625, 5.037353515625, 5.662109375, 6.286865234375, 6.91162109375, 7.536376953125, 8.1611328125, 8.785888671875, 9.41064453125, 10.035400390625, 10.66015625, 11.284912109375, 11.90966796875, 12.534423828125, 13.1591796875, 13.783935546875, 14.40869140625, 15.033447265625, 15.658203125, 16.282958984375, 16.90771484375, 17.532470703125, 18.1572265625, 18.781982421875, 19.40673828125, 20.031494140625, 20.65625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 1.0, 5.0, 6.0, 4.0, 3.0, 11.0, 10.0, 15.0, 14.0, 11.0, 16.0, 29.0, 22.0, 21.0, 33.0, 31.0, 37.0, 26.0, 34.0, 36.0, 42.0, 38.0, 34.0, 34.0, 36.0, 41.0, 37.0, 25.0, 32.0, 40.0, 25.0, 21.0, 39.0, 22.0, 20.0, 18.0, 19.0, 19.0, 12.0, 12.0, 11.0, 11.0, 6.0, 9.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-23.578125, -22.855712890625, -22.13330078125, -21.410888671875, -20.6884765625, -19.966064453125, -19.24365234375, -18.521240234375, -17.798828125, -17.076416015625, -16.35400390625, -15.631591796875, -14.9091796875, -14.186767578125, -13.46435546875, -12.741943359375, -12.01953125, -11.297119140625, -10.57470703125, -9.852294921875, -9.1298828125, -8.407470703125, -7.68505859375, -6.962646484375, -6.240234375, -5.517822265625, -4.79541015625, -4.072998046875, -3.3505859375, -2.628173828125, -1.90576171875, -1.183349609375, -0.4609375, 0.261474609375, 0.98388671875, 1.706298828125, 2.4287109375, 3.151123046875, 3.87353515625, 4.595947265625, 5.318359375, 6.040771484375, 6.76318359375, 7.485595703125, 8.2080078125, 8.930419921875, 9.65283203125, 10.375244140625, 11.09765625, 11.820068359375, 12.54248046875, 13.264892578125, 13.9873046875, 14.709716796875, 15.43212890625, 16.154541015625, 16.876953125, 17.599365234375, 18.32177734375, 19.044189453125, 19.7666015625, 20.489013671875, 21.21142578125, 21.933837890625, 22.65625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 11.0, 17.0, 29.0, 48.0, 82.0, 153.0, 237.0, 432.0, 657.0, 1046.0, 1823.0, 3252.0, 5338.0, 8809.0, 14470.0, 23970.0, 37332.0, 58328.0, 88078.0, 128398.0, 178496.0, 238227.0, 299969.0, 357312.0, 398994.0, 415457.0, 405786.0, 366649.0, 313454.0, 251700.0, 190159.0, 138586.0, 94907.0, 64015.0, 41352.0, 26057.0, 16287.0, 9740.0, 5884.0, 3465.0, 2180.0, 1269.0, 720.0, 449.0, 278.0, 141.0, 104.0, 63.0, 31.0, 19.0, 8.0, 8.0, 6.0, 3.0, 2.0], "bins": [-21.796875, -21.1669921875, -20.537109375, -19.9072265625, -19.27734375, -18.6474609375, -18.017578125, -17.3876953125, -16.7578125, -16.1279296875, -15.498046875, -14.8681640625, -14.23828125, -13.6083984375, -12.978515625, -12.3486328125, -11.71875, -11.0888671875, -10.458984375, -9.8291015625, -9.19921875, -8.5693359375, -7.939453125, -7.3095703125, -6.6796875, -6.0498046875, -5.419921875, -4.7900390625, -4.16015625, -3.5302734375, -2.900390625, -2.2705078125, -1.640625, -1.0107421875, -0.380859375, 0.2490234375, 0.87890625, 1.5087890625, 2.138671875, 2.7685546875, 3.3984375, 4.0283203125, 4.658203125, 5.2880859375, 5.91796875, 6.5478515625, 7.177734375, 7.8076171875, 8.4375, 9.0673828125, 9.697265625, 10.3271484375, 10.95703125, 11.5869140625, 12.216796875, 12.8466796875, 13.4765625, 14.1064453125, 14.736328125, 15.3662109375, 15.99609375, 16.6259765625, 17.255859375, 17.8857421875, 18.515625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 18.0, 23.0, 21.0, 37.0, 44.0, 58.0, 67.0, 80.0, 102.0, 112.0, 125.0, 160.0, 177.0, 202.0, 214.0, 222.0, 234.0, 207.0, 210.0, 212.0, 187.0, 193.0, 168.0, 176.0, 146.0, 123.0, 116.0, 80.0, 74.0, 61.0, 41.0, 39.0, 30.0, 22.0, 19.0, 15.0, 17.0, 6.0, 6.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.90625, -12.4854736328125, -12.064697265625, -11.6439208984375, -11.22314453125, -10.8023681640625, -10.381591796875, -9.9608154296875, -9.5400390625, -9.1192626953125, -8.698486328125, -8.2777099609375, -7.85693359375, -7.4361572265625, -7.015380859375, -6.5946044921875, -6.173828125, -5.7530517578125, -5.332275390625, -4.9114990234375, -4.49072265625, -4.0699462890625, -3.649169921875, -3.2283935546875, -2.8076171875, -2.3868408203125, -1.966064453125, -1.5452880859375, -1.12451171875, -0.7037353515625, -0.282958984375, 0.1378173828125, 0.55859375, 0.9793701171875, 1.400146484375, 1.8209228515625, 2.24169921875, 2.6624755859375, 3.083251953125, 3.5040283203125, 3.9248046875, 4.3455810546875, 4.766357421875, 5.1871337890625, 5.60791015625, 6.0286865234375, 6.449462890625, 6.8702392578125, 7.291015625, 7.7117919921875, 8.132568359375, 8.5533447265625, 8.97412109375, 9.3948974609375, 9.815673828125, 10.2364501953125, 10.6572265625, 11.0780029296875, 11.498779296875, 11.9195556640625, 12.34033203125, 12.7611083984375, 13.181884765625, 13.6026611328125, 14.0234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 10.0, 5.0, 12.0, 10.0, 14.0, 19.0, 25.0, 29.0, 40.0, 37.0, 44.0, 44.0, 55.0, 51.0, 62.0, 56.0, 50.0, 61.0, 59.0, 49.0, 45.0, 34.0, 36.0, 32.0, 18.0, 18.0, 23.0, 8.0, 9.0, 13.0, 8.0, 1.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.709590911865234, -33.64313888549805, -32.57668685913086, -31.510234832763672, -30.443784713745117, -29.37733268737793, -28.310880661010742, -27.244428634643555, -26.177978515625, -25.111526489257812, -24.045074462890625, -22.978622436523438, -21.912172317504883, -20.845720291137695, -19.779268264770508, -18.71281623840332, -17.646364212036133, -16.579912185668945, -15.513461112976074, -14.447009086608887, -13.380558013916016, -12.314105987548828, -11.24765396118164, -10.181201934814453, -9.114750862121582, -8.048298835754395, -6.981847763061523, -5.915395736694336, -4.848944187164307, -3.7824926376342773, -2.71604061126709, -1.6495890617370605, -0.5831375122070312, 0.4833141565322876, 1.5497658252716064, 2.616217613220215, 3.682669162750244, 4.749120712280273, 5.815572738647461, 6.88202428817749, 7.9484758377075195, 9.014927864074707, 10.081378936767578, 11.147830963134766, 12.214282989501953, 13.280734062194824, 14.347186088562012, 15.413637161254883, 16.48008918762207, 17.546541213989258, 18.612993240356445, 19.679443359375, 20.745895385742188, 21.812347412109375, 22.878799438476562, 23.94525146484375, 25.011703491210938, 26.078155517578125, 27.144607543945312, 28.2110595703125, 29.277509689331055, 30.343961715698242, 31.41041374206543, 32.476863861083984, 33.54331588745117]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 9.0, 16.0, 13.0, 12.0, 16.0, 11.0, 22.0, 28.0, 30.0, 20.0, 33.0, 27.0, 32.0, 36.0, 39.0, 43.0, 26.0, 39.0, 45.0, 37.0, 46.0, 35.0, 26.0, 39.0, 33.0, 24.0, 25.0, 30.0, 22.0, 22.0, 19.0, 15.0, 17.0, 22.0, 11.0, 12.0, 8.0, 5.0, 6.0, 7.0, 2.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-31.980066299438477, -30.99169158935547, -30.003314971923828, -29.01494026184082, -28.026565551757812, -27.038188934326172, -26.049814224243164, -25.061439514160156, -24.073062896728516, -23.084688186645508, -22.096311569213867, -21.10793685913086, -20.11956214904785, -19.131187438964844, -18.142810821533203, -17.154436111450195, -16.166061401367188, -15.177685737609863, -14.189311027526855, -13.200935363769531, -12.212560653686523, -11.2241849899292, -10.235809326171875, -9.247434616088867, -8.259058952331543, -7.270683765411377, -6.282308578491211, -5.293932914733887, -4.305557727813721, -3.3171825408935547, -2.3288068771362305, -1.3404316902160645, -0.35205841064453125, 0.6363168954849243, 1.6246922016143799, 2.613067626953125, 3.601442813873291, 4.589818000793457, 5.578193664550781, 6.566568851470947, 7.554944038391113, 8.543319702148438, 9.531694412231445, 10.52007007598877, 11.508445739746094, 12.496820449829102, 13.485196113586426, 14.47357177734375, 15.461946487426758, 16.450321197509766, 17.438697814941406, 18.427072525024414, 19.415447235107422, 20.403823852539062, 21.39219856262207, 22.380573272705078, 23.36894989013672, 24.357324600219727, 25.345701217651367, 26.334075927734375, 27.322450637817383, 28.31082534790039, 29.29920196533203, 30.28757667541504, 31.275951385498047]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 11.0, 10.0, 22.0, 28.0, 33.0, 47.0, 72.0, 151.0, 233.0, 314.0, 504.0, 740.0, 1321.0, 1948.0, 3129.0, 4961.0, 8449.0, 13930.0, 23484.0, 39217.0, 67090.0, 113082.0, 181086.0, 213717.0, 150940.0, 90591.0, 53603.0, 31949.0, 18774.0, 11212.0, 6703.0, 4181.0, 2551.0, 1572.0, 994.0, 657.0, 420.0, 312.0, 173.0, 129.0, 81.0, 47.0, 38.0, 18.0, 12.0, 8.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33984375, -3.229583740234375, -3.11932373046875, -3.009063720703125, -2.8988037109375, -2.788543701171875, -2.67828369140625, -2.568023681640625, -2.457763671875, -2.347503662109375, -2.23724365234375, -2.126983642578125, -2.0167236328125, -1.906463623046875, -1.79620361328125, -1.685943603515625, -1.57568359375, -1.465423583984375, -1.35516357421875, -1.244903564453125, -1.1346435546875, -1.024383544921875, -0.91412353515625, -0.803863525390625, -0.693603515625, -0.583343505859375, -0.47308349609375, -0.362823486328125, -0.2525634765625, -0.142303466796875, -0.03204345703125, 0.078216552734375, 0.1884765625, 0.298736572265625, 0.40899658203125, 0.519256591796875, 0.6295166015625, 0.739776611328125, 0.85003662109375, 0.960296630859375, 1.070556640625, 1.180816650390625, 1.29107666015625, 1.401336669921875, 1.5115966796875, 1.621856689453125, 1.73211669921875, 1.842376708984375, 1.95263671875, 2.062896728515625, 2.17315673828125, 2.283416748046875, 2.3936767578125, 2.503936767578125, 2.61419677734375, 2.724456787109375, 2.834716796875, 2.944976806640625, 3.05523681640625, 3.165496826171875, 3.2757568359375, 3.386016845703125, 3.49627685546875, 3.606536865234375, 3.716796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 6.0, 8.0, 16.0, 12.0, 12.0, 13.0, 11.0, 16.0, 19.0, 31.0, 28.0, 38.0, 32.0, 37.0, 39.0, 43.0, 33.0, 39.0, 37.0, 46.0, 33.0, 53.0, 34.0, 41.0, 40.0, 30.0, 36.0, 31.0, 22.0, 25.0, 22.0, 20.0, 16.0, 16.0, 15.0, 12.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.1875, -33.05859375, -31.9296875, -30.80078125, -29.671875, -28.54296875, -27.4140625, -26.28515625, -25.15625, -24.02734375, -22.8984375, -21.76953125, -20.640625, -19.51171875, -18.3828125, -17.25390625, -16.125, -14.99609375, -13.8671875, -12.73828125, -11.609375, -10.48046875, -9.3515625, -8.22265625, -7.09375, -5.96484375, -4.8359375, -3.70703125, -2.578125, -1.44921875, -0.3203125, 0.80859375, 1.9375, 3.06640625, 4.1953125, 5.32421875, 6.453125, 7.58203125, 8.7109375, 9.83984375, 10.96875, 12.09765625, 13.2265625, 14.35546875, 15.484375, 16.61328125, 17.7421875, 18.87109375, 20.0, 21.12890625, 22.2578125, 23.38671875, 24.515625, 25.64453125, 26.7734375, 27.90234375, 29.03125, 30.16015625, 31.2890625, 32.41796875, 33.546875, 34.67578125, 35.8046875, 36.93359375, 38.0625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 10.0, 11.0, 17.0, 29.0, 38.0, 44.0, 67.0, 94.0, 133.0, 188.0, 321.0, 453.0, 646.0, 989.0, 1451.0, 2197.0, 3475.0, 5602.0, 8905.0, 14347.0, 23160.0, 38332.0, 62848.0, 101035.0, 156368.0, 199579.0, 158780.0, 102869.0, 63858.0, 39327.0, 23908.0, 14395.0, 9024.0, 5665.0, 3550.0, 2251.0, 1462.0, 1019.0, 692.0, 438.0, 302.0, 207.0, 127.0, 106.0, 65.0, 39.0, 43.0, 22.0, 22.0, 15.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.71875, -3.60076904296875, -3.4827880859375, -3.36480712890625, -3.246826171875, -3.12884521484375, -3.0108642578125, -2.89288330078125, -2.77490234375, -2.65692138671875, -2.5389404296875, -2.42095947265625, -2.302978515625, -2.18499755859375, -2.0670166015625, -1.94903564453125, -1.8310546875, -1.71307373046875, -1.5950927734375, -1.47711181640625, -1.359130859375, -1.24114990234375, -1.1231689453125, -1.00518798828125, -0.88720703125, -0.76922607421875, -0.6512451171875, -0.53326416015625, -0.415283203125, -0.29730224609375, -0.1793212890625, -0.06134033203125, 0.056640625, 0.17462158203125, 0.2926025390625, 0.41058349609375, 0.528564453125, 0.64654541015625, 0.7645263671875, 0.88250732421875, 1.00048828125, 1.11846923828125, 1.2364501953125, 1.35443115234375, 1.472412109375, 1.59039306640625, 1.7083740234375, 1.82635498046875, 1.9443359375, 2.06231689453125, 2.1802978515625, 2.29827880859375, 2.416259765625, 2.53424072265625, 2.6522216796875, 2.77020263671875, 2.88818359375, 3.00616455078125, 3.1241455078125, 3.24212646484375, 3.360107421875, 3.47808837890625, 3.5960693359375, 3.71405029296875, 3.83203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 9.0, 6.0, 12.0, 17.0, 10.0, 16.0, 16.0, 25.0, 26.0, 37.0, 20.0, 23.0, 27.0, 34.0, 42.0, 31.0, 41.0, 36.0, 45.0, 49.0, 36.0, 24.0, 37.0, 36.0, 35.0, 39.0, 37.0, 32.0, 30.0, 21.0, 15.0, 22.0, 13.0, 9.0, 10.0, 19.0, 12.0, 7.0, 7.0, 8.0, 3.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-22.71875, -22.06005859375, -21.4013671875, -20.74267578125, -20.083984375, -19.42529296875, -18.7666015625, -18.10791015625, -17.44921875, -16.79052734375, -16.1318359375, -15.47314453125, -14.814453125, -14.15576171875, -13.4970703125, -12.83837890625, -12.1796875, -11.52099609375, -10.8623046875, -10.20361328125, -9.544921875, -8.88623046875, -8.2275390625, -7.56884765625, -6.91015625, -6.25146484375, -5.5927734375, -4.93408203125, -4.275390625, -3.61669921875, -2.9580078125, -2.29931640625, -1.640625, -0.98193359375, -0.3232421875, 0.33544921875, 0.994140625, 1.65283203125, 2.3115234375, 2.97021484375, 3.62890625, 4.28759765625, 4.9462890625, 5.60498046875, 6.263671875, 6.92236328125, 7.5810546875, 8.23974609375, 8.8984375, 9.55712890625, 10.2158203125, 10.87451171875, 11.533203125, 12.19189453125, 12.8505859375, 13.50927734375, 14.16796875, 14.82666015625, 15.4853515625, 16.14404296875, 16.802734375, 17.46142578125, 18.1201171875, 18.77880859375, 19.4375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 13.0, 13.0, 15.0, 25.0, 35.0, 47.0, 93.0, 119.0, 186.0, 295.0, 410.0, 648.0, 966.0, 1495.0, 2197.0, 3411.0, 5557.0, 9309.0, 15294.0, 26141.0, 46025.0, 85157.0, 165816.0, 267319.0, 192081.0, 99200.0, 52805.0, 29358.0, 16817.0, 10026.0, 6392.0, 4097.0, 2544.0, 1588.0, 1068.0, 641.0, 429.0, 303.0, 166.0, 143.0, 104.0, 65.0, 49.0, 30.0, 21.0, 15.0, 7.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10355091094970703, -0.10016822814941406, -0.0967855453491211, -0.09340286254882812, -0.09002017974853516, -0.08663749694824219, -0.08325481414794922, -0.07987213134765625, -0.07648944854736328, -0.07310676574707031, -0.06972408294677734, -0.06634140014648438, -0.0629587173461914, -0.05957603454589844, -0.05619335174560547, -0.0528106689453125, -0.04942798614501953, -0.04604530334472656, -0.042662620544433594, -0.039279937744140625, -0.035897254943847656, -0.03251457214355469, -0.02913188934326172, -0.02574920654296875, -0.02236652374267578, -0.018983840942382812, -0.015601158142089844, -0.012218475341796875, -0.008835792541503906, -0.0054531097412109375, -0.0020704269409179688, 0.001312255859375, 0.004694938659667969, 0.008077621459960938, 0.011460304260253906, 0.014842987060546875, 0.018225669860839844, 0.021608352661132812, 0.02499103546142578, 0.02837371826171875, 0.03175640106201172, 0.03513908386230469, 0.038521766662597656, 0.041904449462890625, 0.045287132263183594, 0.04866981506347656, 0.05205249786376953, 0.0554351806640625, 0.05881786346435547, 0.06220054626464844, 0.0655832290649414, 0.06896591186523438, 0.07234859466552734, 0.07573127746582031, 0.07911396026611328, 0.08249664306640625, 0.08587932586669922, 0.08926200866699219, 0.09264469146728516, 0.09602737426757812, 0.0994100570678711, 0.10279273986816406, 0.10617542266845703, 0.10955810546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 8.0, 12.0, 11.0, 20.0, 11.0, 17.0, 27.0, 23.0, 39.0, 38.0, 25.0, 43.0, 36.0, 42.0, 36.0, 48.0, 38.0, 72.0, 49.0, 44.0, 44.0, 50.0, 50.0, 37.0, 33.0, 30.0, 22.0, 15.0, 14.0, 12.0, 12.0, 10.0, 9.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.014636993408203e-05, -1.9420869648456573e-05, -1.8695369362831116e-05, -1.7969869077205658e-05, -1.72443687915802e-05, -1.6518868505954742e-05, -1.5793368220329285e-05, -1.5067867934703827e-05, -1.4342367649078369e-05, -1.3616867363452911e-05, -1.2891367077827454e-05, -1.2165866792201996e-05, -1.1440366506576538e-05, -1.071486622095108e-05, -9.989365935325623e-06, -9.263865649700165e-06, -8.538365364074707e-06, -7.81286507844925e-06, -7.0873647928237915e-06, -6.361864507198334e-06, -5.636364221572876e-06, -4.910863935947418e-06, -4.1853636503219604e-06, -3.4598633646965027e-06, -2.734363079071045e-06, -2.008862793445587e-06, -1.2833625078201294e-06, -5.578622221946716e-07, 1.6763806343078613e-07, 8.931383490562439e-07, 1.6186386346817017e-06, 2.3441389203071594e-06, 3.069639205932617e-06, 3.795139491558075e-06, 4.520639777183533e-06, 5.2461400628089905e-06, 5.971640348434448e-06, 6.697140634059906e-06, 7.422640919685364e-06, 8.148141205310822e-06, 8.87364149093628e-06, 9.599141776561737e-06, 1.0324642062187195e-05, 1.1050142347812653e-05, 1.177564263343811e-05, 1.2501142919063568e-05, 1.3226643204689026e-05, 1.3952143490314484e-05, 1.4677643775939941e-05, 1.54031440615654e-05, 1.6128644347190857e-05, 1.6854144632816315e-05, 1.7579644918441772e-05, 1.830514520406723e-05, 1.9030645489692688e-05, 1.9756145775318146e-05, 2.0481646060943604e-05, 2.120714634656906e-05, 2.193264663219452e-05, 2.2658146917819977e-05, 2.3383647203445435e-05, 2.4109147489070892e-05, 2.483464777469635e-05, 2.5560148060321808e-05, 2.6285648345947266e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 11.0, 9.0, 9.0, 14.0, 27.0, 53.0, 72.0, 84.0, 160.0, 226.0, 357.0, 577.0, 843.0, 1302.0, 1834.0, 2833.0, 4054.0, 6375.0, 9344.0, 14303.0, 21926.0, 35116.0, 56797.0, 99546.0, 195624.0, 262268.0, 136738.0, 74039.0, 44202.0, 27525.0, 17843.0, 11398.0, 7671.0, 5118.0, 3502.0, 2286.0, 1472.0, 1035.0, 670.0, 439.0, 309.0, 200.0, 124.0, 86.0, 56.0, 31.0, 24.0, 11.0, 9.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.2342529296875, -0.22720718383789062, -0.22016143798828125, -0.21311569213867188, -0.2060699462890625, -0.19902420043945312, -0.19197845458984375, -0.18493270874023438, -0.177886962890625, -0.17084121704101562, -0.16379547119140625, -0.15674972534179688, -0.1497039794921875, -0.14265823364257812, -0.13561248779296875, -0.12856674194335938, -0.12152099609375, -0.11447525024414062, -0.10742950439453125, -0.10038375854492188, -0.0933380126953125, -0.08629226684570312, -0.07924652099609375, -0.07220077514648438, -0.065155029296875, -0.058109283447265625, -0.05106353759765625, -0.044017791748046875, -0.0369720458984375, -0.029926300048828125, -0.02288055419921875, -0.015834808349609375, -0.0087890625, -0.001743316650390625, 0.00530242919921875, 0.012348175048828125, 0.0193939208984375, 0.026439666748046875, 0.03348541259765625, 0.040531158447265625, 0.047576904296875, 0.054622650146484375, 0.06166839599609375, 0.06871414184570312, 0.0757598876953125, 0.08280563354492188, 0.08985137939453125, 0.09689712524414062, 0.10394287109375, 0.11098861694335938, 0.11803436279296875, 0.12508010864257812, 0.1321258544921875, 0.13917160034179688, 0.14621734619140625, 0.15326309204101562, 0.160308837890625, 0.16735458374023438, 0.17440032958984375, 0.18144607543945312, 0.1884918212890625, 0.19553756713867188, 0.20258331298828125, 0.20962905883789062, 0.2166748046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 5.0, 7.0, 9.0, 8.0, 9.0, 17.0, 8.0, 15.0, 21.0, 18.0, 26.0, 28.0, 39.0, 69.0, 99.0, 176.0, 115.0, 89.0, 48.0, 34.0, 18.0, 24.0, 18.0, 19.0, 14.0, 17.0, 7.0, 8.0, 8.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10791587829589844, -0.10401535034179688, -0.10011482238769531, -0.09621429443359375, -0.09231376647949219, -0.08841323852539062, -0.08451271057128906, -0.0806121826171875, -0.07671165466308594, -0.07281112670898438, -0.06891059875488281, -0.06501007080078125, -0.06110954284667969, -0.057209014892578125, -0.05330848693847656, -0.049407958984375, -0.04550743103027344, -0.041606903076171875, -0.03770637512207031, -0.03380584716796875, -0.029905319213867188, -0.026004791259765625, -0.022104263305664062, -0.0182037353515625, -0.014303207397460938, -0.010402679443359375, -0.0065021514892578125, -0.00260162353515625, 0.0012989044189453125, 0.005199432373046875, 0.009099960327148438, 0.01300048828125, 0.016901016235351562, 0.020801544189453125, 0.024702072143554688, 0.02860260009765625, 0.03250312805175781, 0.036403656005859375, 0.04030418395996094, 0.0442047119140625, 0.04810523986816406, 0.052005767822265625, 0.05590629577636719, 0.05980682373046875, 0.06370735168457031, 0.06760787963867188, 0.07150840759277344, 0.075408935546875, 0.07930946350097656, 0.08320999145507812, 0.08711051940917969, 0.09101104736328125, 0.09491157531738281, 0.09881210327148438, 0.10271263122558594, 0.1066131591796875, 0.11051368713378906, 0.11441421508789062, 0.11831474304199219, 0.12221527099609375, 0.1261157989501953, 0.13001632690429688, 0.13391685485839844, 0.1378173828125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 2.0, 15.0, 9.0, 15.0, 14.0, 33.0, 25.0, 41.0, 33.0, 47.0, 44.0, 56.0, 57.0, 58.0, 58.0, 53.0, 59.0, 59.0, 46.0, 44.0, 39.0, 34.0, 33.0, 14.0, 21.0, 18.0, 14.0, 8.0, 11.0, 7.0, 2.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.00875473022461, -33.93449401855469, -32.860233306884766, -31.785972595214844, -30.711711883544922, -29.637451171875, -28.563190460205078, -27.488929748535156, -26.414669036865234, -25.340408325195312, -24.26614761352539, -23.19188690185547, -22.117626190185547, -21.043365478515625, -19.969104766845703, -18.89484405517578, -17.82058334350586, -16.746322631835938, -15.672061920166016, -14.597801208496094, -13.523540496826172, -12.44927978515625, -11.375019073486328, -10.300758361816406, -9.226497650146484, -8.152236938476562, -7.077976226806641, -6.003715515136719, -4.929454803466797, -3.855194091796875, -2.780933380126953, -1.7066726684570312, -0.6324119567871094, 0.4418487548828125, 1.5161094665527344, 2.5903701782226562, 3.664630889892578, 4.7388916015625, 5.813152313232422, 6.887413024902344, 7.961673736572266, 9.035934448242188, 10.11019515991211, 11.184455871582031, 12.258716583251953, 13.332977294921875, 14.407238006591797, 15.481498718261719, 16.55575942993164, 17.630020141601562, 18.704280853271484, 19.778541564941406, 20.852802276611328, 21.92706298828125, 23.001323699951172, 24.075584411621094, 25.149845123291016, 26.224105834960938, 27.29836654663086, 28.37262725830078, 29.446887969970703, 30.521148681640625, 31.595409393310547, 32.66967010498047, 33.74393081665039]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 8.0, 8.0, 11.0, 8.0, 16.0, 14.0, 11.0, 16.0, 11.0, 23.0, 27.0, 29.0, 23.0, 30.0, 28.0, 33.0, 36.0, 37.0, 44.0, 28.0, 40.0, 41.0, 40.0, 45.0, 34.0, 29.0, 37.0, 33.0, 25.0, 24.0, 31.0, 22.0, 23.0, 18.0, 15.0, 18.0, 20.0, 11.0, 11.0, 9.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-31.977569580078125, -30.98874855041504, -29.999929428100586, -29.0111083984375, -28.022289276123047, -27.03346824645996, -26.044647216796875, -25.055828094482422, -24.067007064819336, -23.07818603515625, -22.089366912841797, -21.10054588317871, -20.111726760864258, -19.122905731201172, -18.13408660888672, -17.145265579223633, -16.156444549560547, -15.167624473571777, -14.178804397583008, -13.189983367919922, -12.201163291931152, -11.212343215942383, -10.223523139953613, -9.234703063964844, -8.24588394165039, -7.257063865661621, -6.268243312835693, -5.279423236846924, -4.290602684020996, -3.3017826080322266, -2.312962532043457, -1.3241419792175293, -0.33532142639160156, 0.6534988284111023, 1.6423190832138062, 2.6311392784118652, 3.619959592819214, 4.6087799072265625, 5.597599983215332, 6.58642053604126, 7.575240612030029, 8.564061164855957, 9.552881240844727, 10.541701316833496, 11.530521392822266, 12.519342422485352, 13.508161544799805, 14.49698257446289, 15.48580265045166, 16.47462272644043, 17.463443756103516, 18.45226287841797, 19.441083908081055, 20.42990493774414, 21.418724060058594, 22.40754508972168, 23.396364212036133, 24.38518524169922, 25.374004364013672, 26.362825393676758, 27.35164451599121, 28.340465545654297, 29.32928466796875, 30.318105697631836, 31.306926727294922]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 19.0, 34.0, 39.0, 74.0, 133.0, 194.0, 301.0, 514.0, 806.0, 1257.0, 2074.0, 3368.0, 5091.0, 8117.0, 12402.0, 18308.0, 27098.0, 38227.0, 51872.0, 66952.0, 82201.0, 94042.0, 101037.0, 101200.0, 95985.0, 84438.0, 69959.0, 55008.0, 40737.0, 29190.0, 20193.0, 13505.0, 8840.0, 5651.0, 3613.0, 2291.0, 1406.0, 925.0, 580.0, 338.0, 187.0, 116.0, 93.0, 39.0, 31.0, 26.0, 15.0, 14.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.421875, -13.0037841796875, -12.585693359375, -12.1676025390625, -11.74951171875, -11.3314208984375, -10.913330078125, -10.4952392578125, -10.0771484375, -9.6590576171875, -9.240966796875, -8.8228759765625, -8.40478515625, -7.9866943359375, -7.568603515625, -7.1505126953125, -6.732421875, -6.3143310546875, -5.896240234375, -5.4781494140625, -5.06005859375, -4.6419677734375, -4.223876953125, -3.8057861328125, -3.3876953125, -2.9696044921875, -2.551513671875, -2.1334228515625, -1.71533203125, -1.2972412109375, -0.879150390625, -0.4610595703125, -0.04296875, 0.3751220703125, 0.793212890625, 1.2113037109375, 1.62939453125, 2.0474853515625, 2.465576171875, 2.8836669921875, 3.3017578125, 3.7198486328125, 4.137939453125, 4.5560302734375, 4.97412109375, 5.3922119140625, 5.810302734375, 6.2283935546875, 6.646484375, 7.0645751953125, 7.482666015625, 7.9007568359375, 8.31884765625, 8.7369384765625, 9.155029296875, 9.5731201171875, 9.9912109375, 10.4093017578125, 10.827392578125, 11.2454833984375, 11.66357421875, 12.0816650390625, 12.499755859375, 12.9178466796875, 13.3359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 7.0, 4.0, 12.0, 11.0, 13.0, 17.0, 16.0, 10.0, 24.0, 25.0, 25.0, 33.0, 31.0, 31.0, 44.0, 38.0, 28.0, 49.0, 49.0, 45.0, 53.0, 44.0, 45.0, 34.0, 25.0, 37.0, 31.0, 34.0, 24.0, 23.0, 19.0, 21.0, 22.0, 19.0, 15.0, 12.0, 6.0, 5.0, 5.0, 3.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -35.92578125, -34.7890625, -33.65234375, -32.515625, -31.37890625, -30.2421875, -29.10546875, -27.96875, -26.83203125, -25.6953125, -24.55859375, -23.421875, -22.28515625, -21.1484375, -20.01171875, -18.875, -17.73828125, -16.6015625, -15.46484375, -14.328125, -13.19140625, -12.0546875, -10.91796875, -9.78125, -8.64453125, -7.5078125, -6.37109375, -5.234375, -4.09765625, -2.9609375, -1.82421875, -0.6875, 0.44921875, 1.5859375, 2.72265625, 3.859375, 4.99609375, 6.1328125, 7.26953125, 8.40625, 9.54296875, 10.6796875, 11.81640625, 12.953125, 14.08984375, 15.2265625, 16.36328125, 17.5, 18.63671875, 19.7734375, 20.91015625, 22.046875, 23.18359375, 24.3203125, 25.45703125, 26.59375, 27.73046875, 28.8671875, 30.00390625, 31.140625, 32.27734375, 33.4140625, 34.55078125, 35.6875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 19.0, 20.0, 35.0, 57.0, 83.0, 121.0, 207.0, 320.0, 504.0, 773.0, 1243.0, 2052.0, 3124.0, 4717.0, 7047.0, 10915.0, 15641.0, 22365.0, 30727.0, 41619.0, 53389.0, 66370.0, 78724.0, 88020.0, 93264.0, 93518.0, 88688.0, 79080.0, 66990.0, 54658.0, 42158.0, 31387.0, 22777.0, 15984.0, 10913.0, 7346.0, 4952.0, 3089.0, 2026.0, 1311.0, 829.0, 569.0, 347.0, 207.0, 129.0, 83.0, 58.0, 39.0, 25.0, 11.0, 5.0, 5.0, 8.0, 5.0, 1.0, 1.0], "bins": [-13.2890625, -12.88671875, -12.484375, -12.08203125, -11.6796875, -11.27734375, -10.875, -10.47265625, -10.0703125, -9.66796875, -9.265625, -8.86328125, -8.4609375, -8.05859375, -7.65625, -7.25390625, -6.8515625, -6.44921875, -6.046875, -5.64453125, -5.2421875, -4.83984375, -4.4375, -4.03515625, -3.6328125, -3.23046875, -2.828125, -2.42578125, -2.0234375, -1.62109375, -1.21875, -0.81640625, -0.4140625, -0.01171875, 0.390625, 0.79296875, 1.1953125, 1.59765625, 2.0, 2.40234375, 2.8046875, 3.20703125, 3.609375, 4.01171875, 4.4140625, 4.81640625, 5.21875, 5.62109375, 6.0234375, 6.42578125, 6.828125, 7.23046875, 7.6328125, 8.03515625, 8.4375, 8.83984375, 9.2421875, 9.64453125, 10.046875, 10.44921875, 10.8515625, 11.25390625, 11.65625, 12.05859375, 12.4609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 8.0, 2.0, 9.0, 5.0, 11.0, 14.0, 13.0, 15.0, 24.0, 24.0, 18.0, 22.0, 34.0, 37.0, 41.0, 36.0, 49.0, 37.0, 43.0, 41.0, 46.0, 41.0, 25.0, 34.0, 52.0, 37.0, 37.0, 25.0, 35.0, 28.0, 30.0, 16.0, 21.0, 11.0, 14.0, 18.0, 9.0, 9.0, 3.0, 12.0, 1.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.859375, -20.1533203125, -19.447265625, -18.7412109375, -18.03515625, -17.3291015625, -16.623046875, -15.9169921875, -15.2109375, -14.5048828125, -13.798828125, -13.0927734375, -12.38671875, -11.6806640625, -10.974609375, -10.2685546875, -9.5625, -8.8564453125, -8.150390625, -7.4443359375, -6.73828125, -6.0322265625, -5.326171875, -4.6201171875, -3.9140625, -3.2080078125, -2.501953125, -1.7958984375, -1.08984375, -0.3837890625, 0.322265625, 1.0283203125, 1.734375, 2.4404296875, 3.146484375, 3.8525390625, 4.55859375, 5.2646484375, 5.970703125, 6.6767578125, 7.3828125, 8.0888671875, 8.794921875, 9.5009765625, 10.20703125, 10.9130859375, 11.619140625, 12.3251953125, 13.03125, 13.7373046875, 14.443359375, 15.1494140625, 15.85546875, 16.5615234375, 17.267578125, 17.9736328125, 18.6796875, 19.3857421875, 20.091796875, 20.7978515625, 21.50390625, 22.2099609375, 22.916015625, 23.6220703125, 24.328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 16.0, 16.0, 26.0, 36.0, 63.0, 105.0, 174.0, 268.0, 443.0, 683.0, 1165.0, 1910.0, 3173.0, 4831.0, 7921.0, 12156.0, 18099.0, 26837.0, 37353.0, 50313.0, 64637.0, 78492.0, 89566.0, 96863.0, 98521.0, 94657.0, 85255.0, 72748.0, 58752.0, 44892.0, 32798.0, 22990.0, 15397.0, 10231.0, 6430.0, 4068.0, 2542.0, 1597.0, 953.0, 601.0, 367.0, 251.0, 118.0, 87.0, 47.0, 43.0, 25.0, 16.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.8984375, -4.74676513671875, -4.5950927734375, -4.44342041015625, -4.291748046875, -4.14007568359375, -3.9884033203125, -3.83673095703125, -3.68505859375, -3.53338623046875, -3.3817138671875, -3.23004150390625, -3.078369140625, -2.92669677734375, -2.7750244140625, -2.62335205078125, -2.4716796875, -2.32000732421875, -2.1683349609375, -2.01666259765625, -1.864990234375, -1.71331787109375, -1.5616455078125, -1.40997314453125, -1.25830078125, -1.10662841796875, -0.9549560546875, -0.80328369140625, -0.651611328125, -0.49993896484375, -0.3482666015625, -0.19659423828125, -0.044921875, 0.10675048828125, 0.2584228515625, 0.41009521484375, 0.561767578125, 0.71343994140625, 0.8651123046875, 1.01678466796875, 1.16845703125, 1.32012939453125, 1.4718017578125, 1.62347412109375, 1.775146484375, 1.92681884765625, 2.0784912109375, 2.23016357421875, 2.3818359375, 2.53350830078125, 2.6851806640625, 2.83685302734375, 2.988525390625, 3.14019775390625, 3.2918701171875, 3.44354248046875, 3.59521484375, 3.74688720703125, 3.8985595703125, 4.05023193359375, 4.201904296875, 4.35357666015625, 4.5052490234375, 4.65692138671875, 4.80859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 4.0, 8.0, 4.0, 10.0, 10.0, 11.0, 19.0, 17.0, 18.0, 22.0, 30.0, 25.0, 28.0, 19.0, 30.0, 38.0, 28.0, 34.0, 39.0, 48.0, 39.0, 39.0, 34.0, 37.0, 43.0, 42.0, 38.0, 38.0, 27.0, 20.0, 22.0, 27.0, 20.0, 18.0, 10.0, 13.0, 19.0, 18.0, 8.0, 5.0, 4.0, 7.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.0006222724914550781, -0.0006042718887329102, -0.0005862712860107422, -0.0005682706832885742, -0.0005502700805664062, -0.0005322694778442383, -0.0005142688751220703, -0.0004962682723999023, -0.0004782676696777344, -0.0004602670669555664, -0.00044226646423339844, -0.00042426586151123047, -0.0004062652587890625, -0.00038826465606689453, -0.00037026405334472656, -0.0003522634506225586, -0.0003342628479003906, -0.00031626224517822266, -0.0002982616424560547, -0.0002802610397338867, -0.00026226043701171875, -0.0002442598342895508, -0.0002262592315673828, -0.00020825862884521484, -0.00019025802612304688, -0.0001722574234008789, -0.00015425682067871094, -0.00013625621795654297, -0.000118255615234375, -0.00010025501251220703, -8.225440979003906e-05, -6.42538070678711e-05, -4.6253204345703125e-05, -2.8252601623535156e-05, -1.0251998901367188e-05, 7.748603820800781e-06, 2.574920654296875e-05, 4.374980926513672e-05, 6.175041198730469e-05, 7.975101470947266e-05, 9.775161743164062e-05, 0.0001157522201538086, 0.00013375282287597656, 0.00015175342559814453, 0.0001697540283203125, 0.00018775463104248047, 0.00020575523376464844, 0.0002237558364868164, 0.00024175643920898438, 0.00025975704193115234, 0.0002777576446533203, 0.0002957582473754883, 0.00031375885009765625, 0.0003317594528198242, 0.0003497600555419922, 0.00036776065826416016, 0.0003857612609863281, 0.0004037618637084961, 0.00042176246643066406, 0.00043976306915283203, 0.000457763671875, 0.00047576427459716797, 0.0004937648773193359, 0.0005117654800415039, 0.0005297660827636719]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 16.0, 16.0, 30.0, 41.0, 85.0, 113.0, 169.0, 306.0, 473.0, 697.0, 1163.0, 1894.0, 3047.0, 5241.0, 8184.0, 13226.0, 20747.0, 31492.0, 45651.0, 63095.0, 81437.0, 97597.0, 108033.0, 111929.0, 106316.0, 93811.0, 76008.0, 58564.0, 41577.0, 28594.0, 18312.0, 11876.0, 7285.0, 4377.0, 2772.0, 1658.0, 1040.0, 644.0, 392.0, 217.0, 175.0, 100.0, 63.0, 40.0, 22.0, 16.0, 6.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.83984375, -5.659423828125, -5.47900390625, -5.298583984375, -5.1181640625, -4.937744140625, -4.75732421875, -4.576904296875, -4.396484375, -4.216064453125, -4.03564453125, -3.855224609375, -3.6748046875, -3.494384765625, -3.31396484375, -3.133544921875, -2.953125, -2.772705078125, -2.59228515625, -2.411865234375, -2.2314453125, -2.051025390625, -1.87060546875, -1.690185546875, -1.509765625, -1.329345703125, -1.14892578125, -0.968505859375, -0.7880859375, -0.607666015625, -0.42724609375, -0.246826171875, -0.06640625, 0.114013671875, 0.29443359375, 0.474853515625, 0.6552734375, 0.835693359375, 1.01611328125, 1.196533203125, 1.376953125, 1.557373046875, 1.73779296875, 1.918212890625, 2.0986328125, 2.279052734375, 2.45947265625, 2.639892578125, 2.8203125, 3.000732421875, 3.18115234375, 3.361572265625, 3.5419921875, 3.722412109375, 3.90283203125, 4.083251953125, 4.263671875, 4.444091796875, 4.62451171875, 4.804931640625, 4.9853515625, 5.165771484375, 5.34619140625, 5.526611328125, 5.70703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 4.0, 10.0, 12.0, 8.0, 15.0, 18.0, 17.0, 28.0, 25.0, 31.0, 30.0, 33.0, 46.0, 55.0, 46.0, 44.0, 47.0, 54.0, 41.0, 41.0, 47.0, 52.0, 33.0, 42.0, 23.0, 23.0, 27.0, 21.0, 18.0, 21.0, 9.0, 12.0, 8.0, 11.0, 2.0, 5.0, 6.0, 1.0, 4.0, 9.0, 1.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-3.060546875, -2.9644775390625, -2.868408203125, -2.7723388671875, -2.67626953125, -2.5802001953125, -2.484130859375, -2.3880615234375, -2.2919921875, -2.1959228515625, -2.099853515625, -2.0037841796875, -1.90771484375, -1.8116455078125, -1.715576171875, -1.6195068359375, -1.5234375, -1.4273681640625, -1.331298828125, -1.2352294921875, -1.13916015625, -1.0430908203125, -0.947021484375, -0.8509521484375, -0.7548828125, -0.6588134765625, -0.562744140625, -0.4666748046875, -0.37060546875, -0.2745361328125, -0.178466796875, -0.0823974609375, 0.013671875, 0.1097412109375, 0.205810546875, 0.3018798828125, 0.39794921875, 0.4940185546875, 0.590087890625, 0.6861572265625, 0.7822265625, 0.8782958984375, 0.974365234375, 1.0704345703125, 1.16650390625, 1.2625732421875, 1.358642578125, 1.4547119140625, 1.55078125, 1.6468505859375, 1.742919921875, 1.8389892578125, 1.93505859375, 2.0311279296875, 2.127197265625, 2.2232666015625, 2.3193359375, 2.4154052734375, 2.511474609375, 2.6075439453125, 2.70361328125, 2.7996826171875, 2.895751953125, 2.9918212890625, 3.087890625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 16.0, 11.0, 16.0, 25.0, 20.0, 25.0, 36.0, 39.0, 44.0, 49.0, 42.0, 46.0, 51.0, 48.0, 62.0, 57.0, 54.0, 46.0, 48.0, 40.0, 33.0, 35.0, 33.0, 15.0, 19.0, 18.0, 11.0, 13.0, 7.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.38981628417969, -33.34634780883789, -32.302879333496094, -31.25940704345703, -30.215938568115234, -29.172470092773438, -28.128999710083008, -27.085529327392578, -26.04206085205078, -24.998592376708984, -23.955121994018555, -22.911651611328125, -21.868183135986328, -20.82471466064453, -19.7812442779541, -18.737773895263672, -17.694305419921875, -16.650836944580078, -15.607366561889648, -14.563897132873535, -13.520427703857422, -12.476958274841309, -11.433488845825195, -10.390019416809082, -9.346549987792969, -8.303080558776855, -7.259611129760742, -6.216141700744629, -5.172672271728516, -4.129202842712402, -3.085733413696289, -2.042263984680176, -0.9987983703613281, 0.044671058654785156, 1.0881404876708984, 2.1316099166870117, 3.175079345703125, 4.218548774719238, 5.262018203735352, 6.305487632751465, 7.348957061767578, 8.392426490783691, 9.435895919799805, 10.479365348815918, 11.522834777832031, 12.566304206848145, 13.609773635864258, 14.653243064880371, 15.696712493896484, 16.74018096923828, 17.78365135192871, 18.82712173461914, 19.870590209960938, 20.914058685302734, 21.957529067993164, 23.000999450683594, 24.04446792602539, 25.087936401367188, 26.131406784057617, 27.174877166748047, 28.218345642089844, 29.26181411743164, 30.30528450012207, 31.3487548828125, 32.3922233581543]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 8.0, 14.0, 17.0, 14.0, 26.0, 18.0, 16.0, 29.0, 25.0, 31.0, 33.0, 45.0, 35.0, 39.0, 43.0, 38.0, 44.0, 56.0, 37.0, 45.0, 42.0, 29.0, 36.0, 37.0, 32.0, 29.0, 23.0, 23.0, 20.0, 19.0, 13.0, 13.0, 9.0, 15.0, 9.0, 9.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.09646224975586, -42.79240417480469, -41.488346099853516, -40.184288024902344, -38.88023376464844, -37.576175689697266, -36.272117614746094, -34.96805953979492, -33.66400146484375, -32.35994338989258, -31.055885314941406, -29.751829147338867, -28.447771072387695, -27.143712997436523, -25.839656829833984, -24.535598754882812, -23.23154067993164, -21.92748260498047, -20.623424530029297, -19.319368362426758, -18.015310287475586, -16.711252212524414, -15.407195091247559, -14.103137969970703, -12.799079895019531, -11.49502182006836, -10.190964698791504, -8.886907577514648, -7.582849502563477, -6.278791904449463, -4.974734306335449, -3.6706771850585938, -2.3666152954101562, -1.0625576972961426, 0.2414999008178711, 1.5455574989318848, 2.8496150970458984, 4.153672695159912, 5.457730293273926, 6.761787414550781, 8.065845489501953, 9.369903564453125, 10.67396068572998, 11.978017807006836, 13.282075881958008, 14.58613395690918, 15.890191078186035, 17.19424819946289, 18.498306274414062, 19.802364349365234, 21.106422424316406, 22.410478591918945, 23.714536666870117, 25.01859474182129, 26.322650909423828, 27.626708984375, 28.930767059326172, 30.234825134277344, 31.538883209228516, 32.84294128417969, 34.146995544433594, 35.451053619384766, 36.75511169433594, 38.05916976928711, 39.36322784423828]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 12.0, 14.0, 28.0, 40.0, 66.0, 120.0, 155.0, 258.0, 434.0, 678.0, 1046.0, 1699.0, 2582.0, 4253.0, 6704.0, 10714.0, 16490.0, 25650.0, 39476.0, 59770.0, 88193.0, 126751.0, 176667.0, 236538.0, 301726.0, 360497.0, 403562.0, 420144.0, 406825.0, 364230.0, 307038.0, 241676.0, 182192.0, 132353.0, 92761.0, 63300.0, 42078.0, 27462.0, 18109.0, 11595.0, 7555.0, 4814.0, 2978.0, 1905.0, 1179.0, 733.0, 442.0, 304.0, 185.0, 111.0, 73.0, 60.0, 23.0, 18.0, 8.0, 12.0, 6.0, 2.0], "bins": [-25.828125, -25.058837890625, -24.28955078125, -23.520263671875, -22.7509765625, -21.981689453125, -21.21240234375, -20.443115234375, -19.673828125, -18.904541015625, -18.13525390625, -17.365966796875, -16.5966796875, -15.827392578125, -15.05810546875, -14.288818359375, -13.51953125, -12.750244140625, -11.98095703125, -11.211669921875, -10.4423828125, -9.673095703125, -8.90380859375, -8.134521484375, -7.365234375, -6.595947265625, -5.82666015625, -5.057373046875, -4.2880859375, -3.518798828125, -2.74951171875, -1.980224609375, -1.2109375, -0.441650390625, 0.32763671875, 1.096923828125, 1.8662109375, 2.635498046875, 3.40478515625, 4.174072265625, 4.943359375, 5.712646484375, 6.48193359375, 7.251220703125, 8.0205078125, 8.789794921875, 9.55908203125, 10.328369140625, 11.09765625, 11.866943359375, 12.63623046875, 13.405517578125, 14.1748046875, 14.944091796875, 15.71337890625, 16.482666015625, 17.251953125, 18.021240234375, 18.79052734375, 19.559814453125, 20.3291015625, 21.098388671875, 21.86767578125, 22.636962890625, 23.40625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 11.0, 6.0, 9.0, 9.0, 14.0, 20.0, 18.0, 18.0, 18.0, 22.0, 19.0, 20.0, 38.0, 25.0, 29.0, 37.0, 36.0, 44.0, 39.0, 39.0, 41.0, 53.0, 36.0, 30.0, 33.0, 26.0, 35.0, 34.0, 32.0, 27.0, 22.0, 22.0, 15.0, 22.0, 15.0, 15.0, 13.0, 11.0, 6.0, 7.0, 10.0, 9.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-35.15625, -34.078125, -33.0, -31.921875, -30.84375, -29.765625, -28.6875, -27.609375, -26.53125, -25.453125, -24.375, -23.296875, -22.21875, -21.140625, -20.0625, -18.984375, -17.90625, -16.828125, -15.75, -14.671875, -13.59375, -12.515625, -11.4375, -10.359375, -9.28125, -8.203125, -7.125, -6.046875, -4.96875, -3.890625, -2.8125, -1.734375, -0.65625, 0.421875, 1.5, 2.578125, 3.65625, 4.734375, 5.8125, 6.890625, 7.96875, 9.046875, 10.125, 11.203125, 12.28125, 13.359375, 14.4375, 15.515625, 16.59375, 17.671875, 18.75, 19.828125, 20.90625, 21.984375, 23.0625, 24.140625, 25.21875, 26.296875, 27.375, 28.453125, 29.53125, 30.609375, 31.6875, 32.765625, 33.84375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 11.0, 7.0, 30.0, 43.0, 72.0, 114.0, 196.0, 317.0, 504.0, 877.0, 1462.0, 2360.0, 3945.0, 6330.0, 10304.0, 16790.0, 26721.0, 41941.0, 64373.0, 96580.0, 140106.0, 195467.0, 259375.0, 325622.0, 382360.0, 418656.0, 426410.0, 403447.0, 354188.0, 291336.0, 225636.0, 164738.0, 116133.0, 78285.0, 51922.0, 33115.0, 20798.0, 13028.0, 8046.0, 5061.0, 2951.0, 1852.0, 1083.0, 693.0, 367.0, 220.0, 146.0, 101.0, 56.0, 40.0, 25.0, 12.0, 12.0, 6.0, 5.0, 0.0, 3.0, 2.0], "bins": [-28.46875, -27.585693359375, -26.70263671875, -25.819580078125, -24.9365234375, -24.053466796875, -23.17041015625, -22.287353515625, -21.404296875, -20.521240234375, -19.63818359375, -18.755126953125, -17.8720703125, -16.989013671875, -16.10595703125, -15.222900390625, -14.33984375, -13.456787109375, -12.57373046875, -11.690673828125, -10.8076171875, -9.924560546875, -9.04150390625, -8.158447265625, -7.275390625, -6.392333984375, -5.50927734375, -4.626220703125, -3.7431640625, -2.860107421875, -1.97705078125, -1.093994140625, -0.2109375, 0.672119140625, 1.55517578125, 2.438232421875, 3.3212890625, 4.204345703125, 5.08740234375, 5.970458984375, 6.853515625, 7.736572265625, 8.61962890625, 9.502685546875, 10.3857421875, 11.268798828125, 12.15185546875, 13.034912109375, 13.91796875, 14.801025390625, 15.68408203125, 16.567138671875, 17.4501953125, 18.333251953125, 19.21630859375, 20.099365234375, 20.982421875, 21.865478515625, 22.74853515625, 23.631591796875, 24.5146484375, 25.397705078125, 26.28076171875, 27.163818359375, 28.046875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 6.0, 4.0, 12.0, 15.0, 20.0, 17.0, 34.0, 41.0, 45.0, 48.0, 73.0, 94.0, 94.0, 118.0, 118.0, 146.0, 140.0, 161.0, 179.0, 199.0, 211.0, 199.0, 230.0, 183.0, 209.0, 198.0, 154.0, 159.0, 153.0, 119.0, 113.0, 102.0, 81.0, 76.0, 70.0, 56.0, 38.0, 33.0, 29.0, 29.0, 23.0, 10.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-17.328125, -16.766845703125, -16.20556640625, -15.644287109375, -15.0830078125, -14.521728515625, -13.96044921875, -13.399169921875, -12.837890625, -12.276611328125, -11.71533203125, -11.154052734375, -10.5927734375, -10.031494140625, -9.47021484375, -8.908935546875, -8.34765625, -7.786376953125, -7.22509765625, -6.663818359375, -6.1025390625, -5.541259765625, -4.97998046875, -4.418701171875, -3.857421875, -3.296142578125, -2.73486328125, -2.173583984375, -1.6123046875, -1.051025390625, -0.48974609375, 0.071533203125, 0.6328125, 1.194091796875, 1.75537109375, 2.316650390625, 2.8779296875, 3.439208984375, 4.00048828125, 4.561767578125, 5.123046875, 5.684326171875, 6.24560546875, 6.806884765625, 7.3681640625, 7.929443359375, 8.49072265625, 9.052001953125, 9.61328125, 10.174560546875, 10.73583984375, 11.297119140625, 11.8583984375, 12.419677734375, 12.98095703125, 13.542236328125, 14.103515625, 14.664794921875, 15.22607421875, 15.787353515625, 16.3486328125, 16.909912109375, 17.47119140625, 18.032470703125, 18.59375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 6.0, 10.0, 18.0, 22.0, 24.0, 29.0, 40.0, 48.0, 54.0, 54.0, 63.0, 69.0, 76.0, 65.0, 67.0, 66.0, 59.0, 47.0, 32.0, 29.0, 23.0, 18.0, 15.0, 18.0, 15.0, 10.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.15007781982422, -63.26443862915039, -61.37879943847656, -59.49315643310547, -57.60751724243164, -55.72187805175781, -53.836238861083984, -51.950599670410156, -50.06495666503906, -48.179317474365234, -46.293678283691406, -44.40803527832031, -42.522396087646484, -40.636756896972656, -38.75111770629883, -36.865478515625, -34.97983932495117, -33.094200134277344, -31.208559036254883, -29.322919845581055, -27.437278747558594, -25.551639556884766, -23.666000366210938, -21.78036117553711, -19.89472007751465, -18.00908088684082, -16.12343978881836, -14.237800598144531, -12.352160453796387, -10.466520309448242, -8.580881118774414, -6.6952409744262695, -4.809597015380859, -2.923957109451294, -1.0383172035217285, 0.8473224639892578, 2.7329626083374023, 4.618602752685547, 6.504241943359375, 8.38988208770752, 10.275522232055664, 12.161162376403809, 14.046802520751953, 15.932441711425781, 17.81808090209961, 19.70372200012207, 21.5893611907959, 23.47500228881836, 25.360641479492188, 27.246280670166016, 29.131921768188477, 31.017560958862305, 32.903202056884766, 34.788841247558594, 36.67448043823242, 38.56011962890625, 40.445762634277344, 42.33140182495117, 44.217041015625, 46.102684020996094, 47.98832321166992, 49.87396240234375, 51.75960159301758, 53.645240783691406, 55.530879974365234]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 8.0, 0.0, 11.0, 9.0, 17.0, 10.0, 10.0, 14.0, 27.0, 27.0, 22.0, 27.0, 30.0, 41.0, 42.0, 33.0, 42.0, 51.0, 40.0, 31.0, 31.0, 40.0, 40.0, 39.0, 37.0, 45.0, 33.0, 47.0, 21.0, 22.0, 26.0, 18.0, 16.0, 23.0, 11.0, 10.0, 9.0, 13.0, 10.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.76868438720703, -51.064918518066406, -49.361148834228516, -47.65738296508789, -45.95361328125, -44.249847412109375, -42.54608154296875, -40.842315673828125, -39.138545989990234, -37.43478012084961, -35.73101043701172, -34.027244567871094, -32.32347869873047, -30.619709014892578, -28.915943145751953, -27.212175369262695, -25.508407592773438, -23.80463981628418, -22.100872039794922, -20.397106170654297, -18.69333839416504, -16.98957061767578, -15.28580379486084, -13.582036972045898, -11.87826919555664, -10.174501419067383, -8.470734596252441, -6.766967296600342, -5.063199996948242, -3.3594322204589844, -1.655665397644043, 0.04810142517089844, 1.7518692016601562, 3.455636501312256, 5.1594038009643555, 6.863171100616455, 8.566938400268555, 10.270706176757812, 11.974472999572754, 13.678239822387695, 15.382007598876953, 17.08577537536621, 18.78954315185547, 20.493309020996094, 22.19707679748535, 23.90084457397461, 25.604610443115234, 27.308378219604492, 29.01214599609375, 30.715913772583008, 32.419681549072266, 34.12344741821289, 35.82721710205078, 37.530982971191406, 39.23474884033203, 40.938514709472656, 42.64228439331055, 44.34605026245117, 46.04981994628906, 47.75358581542969, 49.45735168457031, 51.1611213684082, 52.86488723754883, 54.56865692138672, 56.272422790527344]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 13.0, 18.0, 19.0, 36.0, 47.0, 97.0, 147.0, 217.0, 378.0, 648.0, 1088.0, 1877.0, 3134.0, 5627.0, 9568.0, 16687.0, 29597.0, 52634.0, 93312.0, 160563.0, 232146.0, 185785.0, 110371.0, 62543.0, 35311.0, 19897.0, 11242.0, 6521.0, 3724.0, 2151.0, 1295.0, 741.0, 436.0, 249.0, 175.0, 90.0, 58.0, 47.0, 21.0, 11.0, 12.0, 6.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.59173583984375, -4.4256591796875, -4.25958251953125, -4.093505859375, -3.92742919921875, -3.7613525390625, -3.59527587890625, -3.42919921875, -3.26312255859375, -3.0970458984375, -2.93096923828125, -2.764892578125, -2.59881591796875, -2.4327392578125, -2.26666259765625, -2.1005859375, -1.93450927734375, -1.7684326171875, -1.60235595703125, -1.436279296875, -1.27020263671875, -1.1041259765625, -0.93804931640625, -0.77197265625, -0.60589599609375, -0.4398193359375, -0.27374267578125, -0.107666015625, 0.05841064453125, 0.2244873046875, 0.39056396484375, 0.556640625, 0.72271728515625, 0.8887939453125, 1.05487060546875, 1.220947265625, 1.38702392578125, 1.5531005859375, 1.71917724609375, 1.88525390625, 2.05133056640625, 2.2174072265625, 2.38348388671875, 2.549560546875, 2.71563720703125, 2.8817138671875, 3.04779052734375, 3.2138671875, 3.37994384765625, 3.5460205078125, 3.71209716796875, 3.878173828125, 4.04425048828125, 4.2103271484375, 4.37640380859375, 4.54248046875, 4.70855712890625, 4.8746337890625, 5.04071044921875, 5.206787109375, 5.37286376953125, 5.5389404296875, 5.70501708984375, 5.87109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 11.0, 8.0, 5.0, 15.0, 16.0, 17.0, 18.0, 29.0, 38.0, 33.0, 35.0, 41.0, 28.0, 46.0, 33.0, 51.0, 43.0, 50.0, 46.0, 35.0, 32.0, 41.0, 42.0, 35.0, 38.0, 26.0, 27.0, 24.0, 17.0, 12.0, 20.0, 18.0, 16.0, 5.0, 16.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.90625, -52.07958984375, -50.2529296875, -48.42626953125, -46.599609375, -44.77294921875, -42.9462890625, -41.11962890625, -39.29296875, -37.46630859375, -35.6396484375, -33.81298828125, -31.986328125, -30.15966796875, -28.3330078125, -26.50634765625, -24.6796875, -22.85302734375, -21.0263671875, -19.19970703125, -17.373046875, -15.54638671875, -13.7197265625, -11.89306640625, -10.06640625, -8.23974609375, -6.4130859375, -4.58642578125, -2.759765625, -0.93310546875, 0.8935546875, 2.72021484375, 4.546875, 6.37353515625, 8.2001953125, 10.02685546875, 11.853515625, 13.68017578125, 15.5068359375, 17.33349609375, 19.16015625, 20.98681640625, 22.8134765625, 24.64013671875, 26.466796875, 28.29345703125, 30.1201171875, 31.94677734375, 33.7734375, 35.60009765625, 37.4267578125, 39.25341796875, 41.080078125, 42.90673828125, 44.7333984375, 46.56005859375, 48.38671875, 50.21337890625, 52.0400390625, 53.86669921875, 55.693359375, 57.52001953125, 59.3466796875, 61.17333984375, 63.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 17.0, 16.0, 27.0, 30.0, 52.0, 72.0, 105.0, 153.0, 197.0, 285.0, 430.0, 697.0, 1001.0, 1474.0, 2272.0, 3230.0, 4933.0, 7635.0, 11790.0, 17889.0, 27723.0, 43167.0, 67090.0, 101481.0, 146042.0, 179393.0, 144119.0, 99916.0, 65997.0, 42475.0, 27345.0, 17687.0, 11575.0, 7390.0, 4867.0, 3244.0, 2130.0, 1484.0, 959.0, 686.0, 491.0, 318.0, 219.0, 126.0, 103.0, 75.0, 38.0, 26.0, 32.0, 18.0, 13.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.26171875, -4.1263427734375, -3.990966796875, -3.8555908203125, -3.72021484375, -3.5848388671875, -3.449462890625, -3.3140869140625, -3.1787109375, -3.0433349609375, -2.907958984375, -2.7725830078125, -2.63720703125, -2.5018310546875, -2.366455078125, -2.2310791015625, -2.095703125, -1.9603271484375, -1.824951171875, -1.6895751953125, -1.55419921875, -1.4188232421875, -1.283447265625, -1.1480712890625, -1.0126953125, -0.8773193359375, -0.741943359375, -0.6065673828125, -0.47119140625, -0.3358154296875, -0.200439453125, -0.0650634765625, 0.0703125, 0.2056884765625, 0.341064453125, 0.4764404296875, 0.61181640625, 0.7471923828125, 0.882568359375, 1.0179443359375, 1.1533203125, 1.2886962890625, 1.424072265625, 1.5594482421875, 1.69482421875, 1.8302001953125, 1.965576171875, 2.1009521484375, 2.236328125, 2.3717041015625, 2.507080078125, 2.6424560546875, 2.77783203125, 2.9132080078125, 3.048583984375, 3.1839599609375, 3.3193359375, 3.4547119140625, 3.590087890625, 3.7254638671875, 3.86083984375, 3.9962158203125, 4.131591796875, 4.2669677734375, 4.40234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 7.0, 2.0, 14.0, 5.0, 13.0, 15.0, 16.0, 16.0, 21.0, 18.0, 27.0, 33.0, 29.0, 32.0, 42.0, 26.0, 46.0, 37.0, 43.0, 38.0, 49.0, 44.0, 34.0, 34.0, 40.0, 47.0, 27.0, 34.0, 31.0, 21.0, 18.0, 25.0, 19.0, 17.0, 10.0, 14.0, 16.0, 7.0, 8.0, 6.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.375, -32.31884765625, -31.2626953125, -30.20654296875, -29.150390625, -28.09423828125, -27.0380859375, -25.98193359375, -24.92578125, -23.86962890625, -22.8134765625, -21.75732421875, -20.701171875, -19.64501953125, -18.5888671875, -17.53271484375, -16.4765625, -15.42041015625, -14.3642578125, -13.30810546875, -12.251953125, -11.19580078125, -10.1396484375, -9.08349609375, -8.02734375, -6.97119140625, -5.9150390625, -4.85888671875, -3.802734375, -2.74658203125, -1.6904296875, -0.63427734375, 0.421875, 1.47802734375, 2.5341796875, 3.59033203125, 4.646484375, 5.70263671875, 6.7587890625, 7.81494140625, 8.87109375, 9.92724609375, 10.9833984375, 12.03955078125, 13.095703125, 14.15185546875, 15.2080078125, 16.26416015625, 17.3203125, 18.37646484375, 19.4326171875, 20.48876953125, 21.544921875, 22.60107421875, 23.6572265625, 24.71337890625, 25.76953125, 26.82568359375, 27.8818359375, 28.93798828125, 29.994140625, 31.05029296875, 32.1064453125, 33.16259765625, 34.21875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 12.0, 10.0, 23.0, 36.0, 39.0, 62.0, 74.0, 111.0, 147.0, 196.0, 283.0, 409.0, 639.0, 944.0, 1284.0, 1814.0, 2813.0, 4130.0, 6171.0, 9820.0, 15755.0, 25638.0, 45435.0, 86973.0, 187168.0, 301762.0, 168705.0, 79110.0, 42260.0, 24233.0, 14779.0, 9285.0, 5849.0, 3950.0, 2735.0, 1802.0, 1246.0, 846.0, 598.0, 393.0, 293.0, 200.0, 130.0, 114.0, 90.0, 53.0, 45.0, 28.0, 22.0, 19.0, 10.0, 5.0, 3.0, 7.0, 3.0, 2.0], "bins": [-0.2159423828125, -0.20948410034179688, -0.20302581787109375, -0.19656753540039062, -0.1901092529296875, -0.18365097045898438, -0.17719268798828125, -0.17073440551757812, -0.164276123046875, -0.15781784057617188, -0.15135955810546875, -0.14490127563476562, -0.1384429931640625, -0.13198471069335938, -0.12552642822265625, -0.11906814575195312, -0.11260986328125, -0.10615158081054688, -0.09969329833984375, -0.09323501586914062, -0.0867767333984375, -0.08031845092773438, -0.07386016845703125, -0.06740188598632812, -0.060943603515625, -0.054485321044921875, -0.04802703857421875, -0.041568756103515625, -0.0351104736328125, -0.028652191162109375, -0.02219390869140625, -0.015735626220703125, -0.00927734375, -0.002819061279296875, 0.00363922119140625, 0.010097503662109375, 0.0165557861328125, 0.023014068603515625, 0.02947235107421875, 0.035930633544921875, 0.042388916015625, 0.048847198486328125, 0.05530548095703125, 0.061763763427734375, 0.0682220458984375, 0.07468032836914062, 0.08113861083984375, 0.08759689331054688, 0.09405517578125, 0.10051345825195312, 0.10697174072265625, 0.11343002319335938, 0.1198883056640625, 0.12634658813476562, 0.13280487060546875, 0.13926315307617188, 0.145721435546875, 0.15217971801757812, 0.15863800048828125, 0.16509628295898438, 0.1715545654296875, 0.17801284790039062, 0.18447113037109375, 0.19092941284179688, 0.1973876953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 9.0, 7.0, 23.0, 15.0, 22.0, 26.0, 30.0, 34.0, 40.0, 46.0, 51.0, 54.0, 40.0, 50.0, 56.0, 57.0, 67.0, 48.0, 41.0, 47.0, 37.0, 38.0, 24.0, 25.0, 25.0, 21.0, 9.0, 13.0, 9.0, 4.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.892183303833008e-05, -3.7590041756629944e-05, -3.625825047492981e-05, -3.4926459193229675e-05, -3.359466791152954e-05, -3.226287662982941e-05, -3.093108534812927e-05, -2.9599294066429138e-05, -2.8267502784729004e-05, -2.693571150302887e-05, -2.5603920221328735e-05, -2.42721289396286e-05, -2.2940337657928467e-05, -2.1608546376228333e-05, -2.0276755094528198e-05, -1.8944963812828064e-05, -1.761317253112793e-05, -1.6281381249427795e-05, -1.4949589967727661e-05, -1.3617798686027527e-05, -1.2286007404327393e-05, -1.0954216122627258e-05, -9.622424840927124e-06, -8.29063355922699e-06, -6.9588422775268555e-06, -5.627050995826721e-06, -4.295259714126587e-06, -2.9634684324264526e-06, -1.6316771507263184e-06, -2.998858690261841e-07, 1.0319054126739502e-06, 2.3636966943740845e-06, 3.6954879760742188e-06, 5.027279257774353e-06, 6.359070539474487e-06, 7.690861821174622e-06, 9.022653102874756e-06, 1.035444438457489e-05, 1.1686235666275024e-05, 1.3018026947975159e-05, 1.4349818229675293e-05, 1.5681609511375427e-05, 1.701340079307556e-05, 1.8345192074775696e-05, 1.967698335647583e-05, 2.1008774638175964e-05, 2.23405659198761e-05, 2.3672357201576233e-05, 2.5004148483276367e-05, 2.63359397649765e-05, 2.7667731046676636e-05, 2.899952232837677e-05, 3.0331313610076904e-05, 3.166310489177704e-05, 3.299489617347717e-05, 3.432668745517731e-05, 3.565847873687744e-05, 3.6990270018577576e-05, 3.832206130027771e-05, 3.9653852581977844e-05, 4.098564386367798e-05, 4.231743514537811e-05, 4.364922642707825e-05, 4.498101770877838e-05, 4.6312808990478516e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 13.0, 15.0, 32.0, 30.0, 58.0, 49.0, 91.0, 123.0, 165.0, 256.0, 340.0, 457.0, 626.0, 907.0, 1345.0, 1861.0, 2778.0, 4056.0, 6044.0, 9290.0, 14621.0, 23472.0, 36911.0, 63514.0, 118299.0, 265799.0, 235773.0, 106804.0, 58262.0, 34440.0, 21315.0, 13565.0, 8755.0, 5871.0, 3927.0, 2630.0, 1789.0, 1245.0, 837.0, 615.0, 413.0, 333.0, 244.0, 176.0, 95.0, 91.0, 54.0, 42.0, 39.0, 17.0, 17.0, 14.0, 10.0, 9.0, 6.0, 3.0, 4.0], "bins": [-0.5478515625, -0.5312118530273438, -0.5145721435546875, -0.49793243408203125, -0.481292724609375, -0.46465301513671875, -0.4480133056640625, -0.43137359619140625, -0.41473388671875, -0.39809417724609375, -0.3814544677734375, -0.36481475830078125, -0.348175048828125, -0.33153533935546875, -0.3148956298828125, -0.29825592041015625, -0.2816162109375, -0.26497650146484375, -0.2483367919921875, -0.23169708251953125, -0.215057373046875, -0.19841766357421875, -0.1817779541015625, -0.16513824462890625, -0.14849853515625, -0.13185882568359375, -0.1152191162109375, -0.09857940673828125, -0.081939697265625, -0.06529998779296875, -0.0486602783203125, -0.03202056884765625, -0.015380859375, 0.00125885009765625, 0.0178985595703125, 0.03453826904296875, 0.051177978515625, 0.06781768798828125, 0.0844573974609375, 0.10109710693359375, 0.11773681640625, 0.13437652587890625, 0.1510162353515625, 0.16765594482421875, 0.184295654296875, 0.20093536376953125, 0.2175750732421875, 0.23421478271484375, 0.2508544921875, 0.26749420166015625, 0.2841339111328125, 0.30077362060546875, 0.317413330078125, 0.33405303955078125, 0.3506927490234375, 0.36733245849609375, 0.38397216796875, 0.40061187744140625, 0.4172515869140625, 0.43389129638671875, 0.450531005859375, 0.46717071533203125, 0.4838104248046875, 0.5004501342773438, 0.51708984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 3.0, 9.0, 10.0, 18.0, 12.0, 15.0, 27.0, 20.0, 30.0, 41.0, 38.0, 53.0, 46.0, 54.0, 76.0, 75.0, 92.0, 54.0, 60.0, 35.0, 28.0, 24.0, 27.0, 28.0, 18.0, 14.0, 17.0, 15.0, 9.0, 6.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.42236328125, -0.4100303649902344, -0.39769744873046875, -0.3853645324707031, -0.3730316162109375, -0.3606986999511719, -0.34836578369140625, -0.3360328674316406, -0.323699951171875, -0.3113670349121094, -0.29903411865234375, -0.2867012023925781, -0.2743682861328125, -0.2620353698730469, -0.24970245361328125, -0.23736953735351562, -0.22503662109375, -0.21270370483398438, -0.20037078857421875, -0.18803787231445312, -0.1757049560546875, -0.16337203979492188, -0.15103912353515625, -0.13870620727539062, -0.126373291015625, -0.11404037475585938, -0.10170745849609375, -0.08937454223632812, -0.0770416259765625, -0.06470870971679688, -0.05237579345703125, -0.040042877197265625, -0.0277099609375, -0.015377044677734375, -0.00304412841796875, 0.009288787841796875, 0.0216217041015625, 0.033954620361328125, 0.04628753662109375, 0.058620452880859375, 0.070953369140625, 0.08328628540039062, 0.09561920166015625, 0.10795211791992188, 0.1202850341796875, 0.13261795043945312, 0.14495086669921875, 0.15728378295898438, 0.16961669921875, 0.18194961547851562, 0.19428253173828125, 0.20661544799804688, 0.2189483642578125, 0.23128128051757812, 0.24361419677734375, 0.2559471130371094, 0.268280029296875, 0.2806129455566406, 0.29294586181640625, 0.3052787780761719, 0.3176116943359375, 0.3299446105957031, 0.34227752685546875, 0.3546104431152344, 0.366943359375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 7.0, 10.0, 22.0, 20.0, 24.0, 33.0, 37.0, 49.0, 57.0, 56.0, 66.0, 66.0, 72.0, 68.0, 69.0, 69.0, 48.0, 51.0, 26.0, 32.0, 21.0, 18.0, 13.0, 19.0, 14.0, 11.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.27672576904297, -63.38839340209961, -61.50006103515625, -59.611732482910156, -57.7234001159668, -55.83506774902344, -53.94673538208008, -52.05840301513672, -50.17007064819336, -48.28173828125, -46.39340591430664, -44.50507354736328, -42.61674499511719, -40.72841262817383, -38.84008026123047, -36.95174789428711, -35.06341552734375, -33.17508316040039, -31.286752700805664, -29.398420333862305, -27.510087966918945, -25.62175750732422, -23.73342514038086, -21.8450927734375, -19.956764221191406, -18.068431854248047, -16.18010139465332, -14.291769027709961, -12.403436660766602, -10.515105247497559, -8.626773834228516, -6.738441467285156, -4.850109100341797, -2.9617772102355957, -1.0734455585479736, 0.8148860931396484, 2.7032179832458496, 4.591549873352051, 6.479881286621094, 8.368213653564453, 10.256545066833496, 12.144876480102539, 14.033208847045898, 15.921540260314941, 17.809871673583984, 19.698204040527344, 21.586536407470703, 23.474868774414062, 25.36319923400879, 27.25153160095215, 29.139862060546875, 31.028194427490234, 32.916526794433594, 34.80485916137695, 36.69319152832031, 38.581520080566406, 40.469852447509766, 42.358184814453125, 44.246517181396484, 46.134849548339844, 48.02317810058594, 49.9115104675293, 51.799842834472656, 53.688175201416016, 55.576507568359375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 7.0, 2.0, 10.0, 9.0, 16.0, 12.0, 9.0, 14.0, 26.0, 29.0, 21.0, 28.0, 30.0, 41.0, 41.0, 39.0, 37.0, 52.0, 41.0, 27.0, 31.0, 42.0, 42.0, 37.0, 38.0, 46.0, 33.0, 44.0, 21.0, 24.0, 27.0, 18.0, 15.0, 22.0, 13.0, 8.0, 8.0, 12.0, 11.0, 3.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.08054733276367, -51.367488861083984, -49.6544303894043, -47.94137191772461, -46.22831344604492, -44.515254974365234, -42.80219268798828, -41.089134216308594, -39.376075744628906, -37.66301727294922, -35.94995880126953, -34.236900329589844, -32.523841857910156, -30.81078338623047, -29.09772300720215, -27.38466453552246, -25.671607971191406, -23.95854949951172, -22.24549102783203, -20.532432556152344, -18.819374084472656, -17.10631561279297, -15.393255233764648, -13.680196762084961, -11.967138290405273, -10.254079818725586, -8.541021347045898, -6.8279619216918945, -5.114903450012207, -3.4018449783325195, -1.6887855529785156, 0.024272918701171875, 1.7373275756835938, 3.4503862857818604, 5.163444995880127, 6.876503944396973, 8.58956241607666, 10.302620887756348, 12.015680313110352, 13.728738784790039, 15.441797256469727, 17.154855728149414, 18.8679141998291, 20.580974578857422, 22.29403305053711, 24.007091522216797, 25.720149993896484, 27.433208465576172, 29.14626693725586, 30.859325408935547, 32.572383880615234, 34.28544235229492, 35.99850082397461, 37.7115592956543, 39.42462158203125, 41.13768005371094, 42.850738525390625, 44.56379699707031, 46.27685546875, 47.98991394042969, 49.702972412109375, 51.41603088378906, 53.12908935546875, 54.84214782714844, 56.555206298828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 21.0, 28.0, 41.0, 91.0, 157.0, 166.0, 318.0, 459.0, 741.0, 1132.0, 1765.0, 2841.0, 4360.0, 6856.0, 10604.0, 15942.0, 24131.0, 35836.0, 50087.0, 67493.0, 85575.0, 101329.0, 110274.0, 110864.0, 102100.0, 86894.0, 68967.0, 51010.0, 36746.0, 24783.0, 16635.0, 10747.0, 6957.0, 4536.0, 2836.0, 1829.0, 1155.0, 775.0, 543.0, 339.0, 204.0, 134.0, 74.0, 72.0, 34.0, 20.0, 14.0, 13.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.578125, -18.947265625, -18.31640625, -17.685546875, -17.0546875, -16.423828125, -15.79296875, -15.162109375, -14.53125, -13.900390625, -13.26953125, -12.638671875, -12.0078125, -11.376953125, -10.74609375, -10.115234375, -9.484375, -8.853515625, -8.22265625, -7.591796875, -6.9609375, -6.330078125, -5.69921875, -5.068359375, -4.4375, -3.806640625, -3.17578125, -2.544921875, -1.9140625, -1.283203125, -0.65234375, -0.021484375, 0.609375, 1.240234375, 1.87109375, 2.501953125, 3.1328125, 3.763671875, 4.39453125, 5.025390625, 5.65625, 6.287109375, 6.91796875, 7.548828125, 8.1796875, 8.810546875, 9.44140625, 10.072265625, 10.703125, 11.333984375, 11.96484375, 12.595703125, 13.2265625, 13.857421875, 14.48828125, 15.119140625, 15.75, 16.380859375, 17.01171875, 17.642578125, 18.2734375, 18.904296875, 19.53515625, 20.166015625, 20.796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 15.0, 12.0, 11.0, 12.0, 16.0, 25.0, 25.0, 31.0, 27.0, 35.0, 39.0, 42.0, 49.0, 48.0, 40.0, 45.0, 34.0, 38.0, 41.0, 45.0, 42.0, 45.0, 38.0, 40.0, 26.0, 24.0, 13.0, 19.0, 26.0, 21.0, 11.0, 15.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 6.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.0, -52.2314453125, -50.462890625, -48.6943359375, -46.92578125, -45.1572265625, -43.388671875, -41.6201171875, -39.8515625, -38.0830078125, -36.314453125, -34.5458984375, -32.77734375, -31.0087890625, -29.240234375, -27.4716796875, -25.703125, -23.9345703125, -22.166015625, -20.3974609375, -18.62890625, -16.8603515625, -15.091796875, -13.3232421875, -11.5546875, -9.7861328125, -8.017578125, -6.2490234375, -4.48046875, -2.7119140625, -0.943359375, 0.8251953125, 2.59375, 4.3623046875, 6.130859375, 7.8994140625, 9.66796875, 11.4365234375, 13.205078125, 14.9736328125, 16.7421875, 18.5107421875, 20.279296875, 22.0478515625, 23.81640625, 25.5849609375, 27.353515625, 29.1220703125, 30.890625, 32.6591796875, 34.427734375, 36.1962890625, 37.96484375, 39.7333984375, 41.501953125, 43.2705078125, 45.0390625, 46.8076171875, 48.576171875, 50.3447265625, 52.11328125, 53.8818359375, 55.650390625, 57.4189453125, 59.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 19.0, 16.0, 22.0, 44.0, 60.0, 83.0, 123.0, 145.0, 234.0, 360.0, 551.0, 814.0, 1250.0, 1836.0, 2973.0, 4630.0, 7289.0, 11199.0, 17448.0, 26423.0, 39439.0, 56020.0, 76027.0, 96106.0, 111634.0, 117790.0, 113858.0, 99613.0, 79728.0, 59177.0, 41811.0, 28487.0, 18747.0, 12368.0, 7855.0, 5118.0, 3174.0, 2108.0, 1335.0, 888.0, 600.0, 399.0, 246.0, 168.0, 105.0, 64.0, 54.0, 43.0, 25.0, 13.0, 9.0, 9.0, 6.0, 1.0, 5.0, 0.0, 3.0, 1.0], "bins": [-23.9375, -23.1796875, -22.421875, -21.6640625, -20.90625, -20.1484375, -19.390625, -18.6328125, -17.875, -17.1171875, -16.359375, -15.6015625, -14.84375, -14.0859375, -13.328125, -12.5703125, -11.8125, -11.0546875, -10.296875, -9.5390625, -8.78125, -8.0234375, -7.265625, -6.5078125, -5.75, -4.9921875, -4.234375, -3.4765625, -2.71875, -1.9609375, -1.203125, -0.4453125, 0.3125, 1.0703125, 1.828125, 2.5859375, 3.34375, 4.1015625, 4.859375, 5.6171875, 6.375, 7.1328125, 7.890625, 8.6484375, 9.40625, 10.1640625, 10.921875, 11.6796875, 12.4375, 13.1953125, 13.953125, 14.7109375, 15.46875, 16.2265625, 16.984375, 17.7421875, 18.5, 19.2578125, 20.015625, 20.7734375, 21.53125, 22.2890625, 23.046875, 23.8046875, 24.5625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 4.0, 10.0, 5.0, 9.0, 7.0, 14.0, 11.0, 14.0, 21.0, 31.0, 16.0, 19.0, 35.0, 36.0, 33.0, 35.0, 38.0, 44.0, 45.0, 35.0, 44.0, 47.0, 42.0, 35.0, 34.0, 36.0, 35.0, 31.0, 37.0, 29.0, 26.0, 19.0, 20.0, 15.0, 22.0, 16.0, 11.0, 10.0, 3.0, 4.0, 3.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-34.5, -33.44873046875, -32.3974609375, -31.34619140625, -30.294921875, -29.24365234375, -28.1923828125, -27.14111328125, -26.08984375, -25.03857421875, -23.9873046875, -22.93603515625, -21.884765625, -20.83349609375, -19.7822265625, -18.73095703125, -17.6796875, -16.62841796875, -15.5771484375, -14.52587890625, -13.474609375, -12.42333984375, -11.3720703125, -10.32080078125, -9.26953125, -8.21826171875, -7.1669921875, -6.11572265625, -5.064453125, -4.01318359375, -2.9619140625, -1.91064453125, -0.859375, 0.19189453125, 1.2431640625, 2.29443359375, 3.345703125, 4.39697265625, 5.4482421875, 6.49951171875, 7.55078125, 8.60205078125, 9.6533203125, 10.70458984375, 11.755859375, 12.80712890625, 13.8583984375, 14.90966796875, 15.9609375, 17.01220703125, 18.0634765625, 19.11474609375, 20.166015625, 21.21728515625, 22.2685546875, 23.31982421875, 24.37109375, 25.42236328125, 26.4736328125, 27.52490234375, 28.576171875, 29.62744140625, 30.6787109375, 31.72998046875, 32.78125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 13.0, 16.0, 28.0, 61.0, 81.0, 130.0, 277.0, 400.0, 736.0, 1223.0, 1989.0, 3359.0, 5640.0, 9215.0, 14941.0, 23041.0, 34540.0, 48988.0, 65776.0, 83441.0, 99303.0, 108278.0, 110289.0, 103473.0, 90602.0, 73492.0, 56003.0, 39530.0, 27473.0, 17615.0, 11272.0, 7056.0, 4162.0, 2442.0, 1537.0, 873.0, 513.0, 300.0, 160.0, 115.0, 76.0, 39.0, 17.0, 18.0, 6.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.15625, -8.8885498046875, -8.620849609375, -8.3531494140625, -8.08544921875, -7.8177490234375, -7.550048828125, -7.2823486328125, -7.0146484375, -6.7469482421875, -6.479248046875, -6.2115478515625, -5.94384765625, -5.6761474609375, -5.408447265625, -5.1407470703125, -4.873046875, -4.6053466796875, -4.337646484375, -4.0699462890625, -3.80224609375, -3.5345458984375, -3.266845703125, -2.9991455078125, -2.7314453125, -2.4637451171875, -2.196044921875, -1.9283447265625, -1.66064453125, -1.3929443359375, -1.125244140625, -0.8575439453125, -0.58984375, -0.3221435546875, -0.054443359375, 0.2132568359375, 0.48095703125, 0.7486572265625, 1.016357421875, 1.2840576171875, 1.5517578125, 1.8194580078125, 2.087158203125, 2.3548583984375, 2.62255859375, 2.8902587890625, 3.157958984375, 3.4256591796875, 3.693359375, 3.9610595703125, 4.228759765625, 4.4964599609375, 4.76416015625, 5.0318603515625, 5.299560546875, 5.5672607421875, 5.8349609375, 6.1026611328125, 6.370361328125, 6.6380615234375, 6.90576171875, 7.1734619140625, 7.441162109375, 7.7088623046875, 7.9765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 6.0, 9.0, 10.0, 19.0, 17.0, 23.0, 20.0, 26.0, 24.0, 28.0, 19.0, 34.0, 38.0, 46.0, 47.0, 46.0, 47.0, 45.0, 42.0, 37.0, 49.0, 41.0, 46.0, 23.0, 34.0, 38.0, 21.0, 26.0, 27.0, 26.0, 13.0, 13.0, 13.0, 15.0, 8.0, 3.0, 7.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0010652542114257812, -0.0010346770286560059, -0.0010040998458862305, -0.0009735226631164551, -0.0009429454803466797, -0.0009123682975769043, -0.0008817911148071289, -0.0008512139320373535, -0.0008206367492675781, -0.0007900595664978027, -0.0007594823837280273, -0.000728905200958252, -0.0006983280181884766, -0.0006677508354187012, -0.0006371736526489258, -0.0006065964698791504, -0.000576019287109375, -0.0005454421043395996, -0.0005148649215698242, -0.00048428773880004883, -0.00045371055603027344, -0.00042313337326049805, -0.00039255619049072266, -0.00036197900772094727, -0.0003314018249511719, -0.0003008246421813965, -0.0002702474594116211, -0.0002396702766418457, -0.0002090930938720703, -0.00017851591110229492, -0.00014793872833251953, -0.00011736154556274414, -8.678436279296875e-05, -5.620718002319336e-05, -2.562999725341797e-05, 4.947185516357422e-06, 3.552436828613281e-05, 6.61015510559082e-05, 9.66787338256836e-05, 0.00012725591659545898, 0.00015783309936523438, 0.00018841028213500977, 0.00021898746490478516, 0.00024956464767456055, 0.00028014183044433594, 0.00031071901321411133, 0.0003412961959838867, 0.0003718733787536621, 0.0004024505615234375, 0.0004330277442932129, 0.0004636049270629883, 0.0004941821098327637, 0.0005247592926025391, 0.0005553364753723145, 0.0005859136581420898, 0.0006164908409118652, 0.0006470680236816406, 0.000677645206451416, 0.0007082223892211914, 0.0007387995719909668, 0.0007693767547607422, 0.0007999539375305176, 0.000830531120300293, 0.0008611083030700684, 0.0008916854858398438]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 7.0, 11.0, 13.0, 32.0, 36.0, 50.0, 81.0, 160.0, 233.0, 338.0, 654.0, 1083.0, 1858.0, 3166.0, 5708.0, 9558.0, 16109.0, 26567.0, 41004.0, 60908.0, 83586.0, 105027.0, 120090.0, 125515.0, 117192.0, 100428.0, 78121.0, 55719.0, 37398.0, 23558.0, 14198.0, 8368.0, 4928.0, 2831.0, 1639.0, 926.0, 580.0, 347.0, 197.0, 128.0, 73.0, 56.0, 28.0, 20.0, 12.0, 8.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.620849609375, -9.30419921875, -8.987548828125, -8.6708984375, -8.354248046875, -8.03759765625, -7.720947265625, -7.404296875, -7.087646484375, -6.77099609375, -6.454345703125, -6.1376953125, -5.821044921875, -5.50439453125, -5.187744140625, -4.87109375, -4.554443359375, -4.23779296875, -3.921142578125, -3.6044921875, -3.287841796875, -2.97119140625, -2.654541015625, -2.337890625, -2.021240234375, -1.70458984375, -1.387939453125, -1.0712890625, -0.754638671875, -0.43798828125, -0.121337890625, 0.1953125, 0.511962890625, 0.82861328125, 1.145263671875, 1.4619140625, 1.778564453125, 2.09521484375, 2.411865234375, 2.728515625, 3.045166015625, 3.36181640625, 3.678466796875, 3.9951171875, 4.311767578125, 4.62841796875, 4.945068359375, 5.26171875, 5.578369140625, 5.89501953125, 6.211669921875, 6.5283203125, 6.844970703125, 7.16162109375, 7.478271484375, 7.794921875, 8.111572265625, 8.42822265625, 8.744873046875, 9.0615234375, 9.378173828125, 9.69482421875, 10.011474609375, 10.328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 4.0, 3.0, 9.0, 9.0, 14.0, 16.0, 18.0, 27.0, 28.0, 34.0, 47.0, 43.0, 45.0, 49.0, 46.0, 63.0, 72.0, 74.0, 54.0, 48.0, 45.0, 55.0, 28.0, 25.0, 37.0, 26.0, 15.0, 22.0, 15.0, 9.0, 7.0, 8.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.38671875, -5.2247314453125, -5.062744140625, -4.9007568359375, -4.73876953125, -4.5767822265625, -4.414794921875, -4.2528076171875, -4.0908203125, -3.9288330078125, -3.766845703125, -3.6048583984375, -3.44287109375, -3.2808837890625, -3.118896484375, -2.9569091796875, -2.794921875, -2.6329345703125, -2.470947265625, -2.3089599609375, -2.14697265625, -1.9849853515625, -1.822998046875, -1.6610107421875, -1.4990234375, -1.3370361328125, -1.175048828125, -1.0130615234375, -0.85107421875, -0.6890869140625, -0.527099609375, -0.3651123046875, -0.203125, -0.0411376953125, 0.120849609375, 0.2828369140625, 0.44482421875, 0.6068115234375, 0.768798828125, 0.9307861328125, 1.0927734375, 1.2547607421875, 1.416748046875, 1.5787353515625, 1.74072265625, 1.9027099609375, 2.064697265625, 2.2266845703125, 2.388671875, 2.5506591796875, 2.712646484375, 2.8746337890625, 3.03662109375, 3.1986083984375, 3.360595703125, 3.5225830078125, 3.6845703125, 3.8465576171875, 4.008544921875, 4.1705322265625, 4.33251953125, 4.4945068359375, 4.656494140625, 4.8184814453125, 4.98046875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 5.0, 7.0, 7.0, 12.0, 13.0, 18.0, 16.0, 23.0, 34.0, 44.0, 65.0, 58.0, 63.0, 64.0, 86.0, 70.0, 65.0, 58.0, 59.0, 64.0, 39.0, 30.0, 29.0, 16.0, 20.0, 11.0, 9.0, 11.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.45816802978516, -67.41261291503906, -65.36705780029297, -63.32150650024414, -61.27595138549805, -59.23039627075195, -57.184844970703125, -55.13928985595703, -53.09373474121094, -51.048179626464844, -49.00262451171875, -46.95707321166992, -44.91151809692383, -42.865962982177734, -40.820411682128906, -38.77485656738281, -36.72930145263672, -34.683746337890625, -32.63819122314453, -30.592639923095703, -28.54708480834961, -26.501529693603516, -24.455976486206055, -22.410423278808594, -20.3648681640625, -18.319313049316406, -16.273759841918945, -14.228205680847168, -12.18265151977539, -10.137097358703613, -8.091543197631836, -6.045989036560059, -4.000438690185547, -1.9548845291137695, 0.09066963195800781, 2.136223793029785, 4.1817779541015625, 6.22733211517334, 8.272886276245117, 10.318440437316895, 12.363994598388672, 14.40954875946045, 16.455102920532227, 18.500656127929688, 20.54621124267578, 22.591766357421875, 24.637319564819336, 26.682872772216797, 28.72842788696289, 30.773983001708984, 32.81953430175781, 34.865089416503906, 36.91064453125, 38.956199645996094, 41.00175476074219, 43.047306060791016, 45.09286117553711, 47.1384162902832, 49.18396759033203, 51.229522705078125, 53.27507781982422, 55.32063293457031, 57.366188049316406, 59.411739349365234, 61.45729446411133]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 7.0, 12.0, 5.0, 8.0, 9.0, 17.0, 12.0, 14.0, 23.0, 20.0, 34.0, 32.0, 38.0, 37.0, 33.0, 46.0, 43.0, 39.0, 42.0, 48.0, 44.0, 49.0, 37.0, 39.0, 37.0, 26.0, 37.0, 34.0, 35.0, 14.0, 24.0, 18.0, 24.0, 13.0, 10.0, 10.0, 10.0, 6.0, 3.0, 2.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.278377532958984, -60.16998291015625, -58.061588287353516, -55.95319366455078, -53.84479904174805, -51.73640441894531, -49.628013610839844, -47.519615173339844, -45.411224365234375, -43.30282974243164, -41.194435119628906, -39.08604049682617, -36.97764587402344, -34.8692512512207, -32.76085662841797, -30.652463912963867, -28.5440673828125, -26.435672760009766, -24.32727813720703, -22.218883514404297, -20.110488891601562, -18.002094268798828, -15.893701553344727, -13.785306930541992, -11.676912307739258, -9.568517684936523, -7.460123538970947, -5.351729393005371, -3.2433347702026367, -1.1349401473999023, 0.9734535217285156, 3.08184814453125, 5.19024658203125, 7.298641204833984, 9.407035827636719, 11.515429496765137, 13.623824119567871, 15.732218742370605, 17.840612411499023, 19.949007034301758, 22.057401657104492, 24.165796279907227, 26.27419090270996, 28.382583618164062, 30.490978240966797, 32.59937286376953, 34.707767486572266, 36.816162109375, 38.924556732177734, 41.03295135498047, 43.1413459777832, 45.24974060058594, 47.35813522338867, 49.466529846191406, 51.574920654296875, 53.683319091796875, 55.791709899902344, 57.90010452270508, 60.00849914550781, 62.11689376831055, 64.22528839111328, 66.33367919921875, 68.44207763671875, 70.55046844482422, 72.65886688232422]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 10.0, 19.0, 25.0, 47.0, 47.0, 73.0, 133.0, 147.0, 220.0, 303.0, 410.0, 644.0, 837.0, 1200.0, 1648.0, 2229.0, 2930.0, 3976.0, 5010.0, 6410.0, 1002349.0, 5539.0, 4209.0, 3225.0, 2522.0, 1765.0, 1328.0, 967.0, 673.0, 470.0, 354.0, 253.0, 187.0, 119.0, 92.0, 64.0, 54.0, 37.0, 23.0, 12.0, 8.0, 12.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-445.0298767089844, -431.61474609375, -418.19964599609375, -404.7845153808594, -391.3694152832031, -377.95428466796875, -364.5391845703125, -351.1240539550781, -337.70892333984375, -324.2937927246094, -310.8786926269531, -297.46356201171875, -284.0484619140625, -270.6333312988281, -257.21820068359375, -243.8031005859375, -230.38800048828125, -216.97288513183594, -203.55776977539062, -190.14263916015625, -176.7275390625, -163.31240844726562, -149.8972930908203, -136.482177734375, -123.06706237792969, -109.65194702148438, -96.23683166503906, -82.82170867919922, -69.4065933227539, -55.991477966308594, -42.57635498046875, -29.161239624023438, -15.746124267578125, -2.3310070037841797, 11.084110260009766, 24.499229431152344, 37.914344787597656, 51.32946014404297, 64.74458312988281, 78.15969848632812, 91.57481384277344, 104.98992919921875, 118.40504455566406, 131.82015991210938, 145.23529052734375, 158.650390625, 172.06552124023438, 185.4806365966797, 198.895751953125, 212.3108673095703, 225.72598266601562, 239.14111328125, 252.55621337890625, 265.9713439941406, 279.386474609375, 292.80157470703125, 306.2166748046875, 319.6318054199219, 333.0469055175781, 346.4620361328125, 359.87713623046875, 373.2922668457031, 386.7073974609375, 400.12249755859375, 413.5376281738281]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 3.0, 9.0, 11.0, 16.0, 20.0, 28.0, 27.0, 25.0, 35.0, 50.0, 36.0, 51.0, 55.0, 79.0, 78.0, 131.0, 222.0, 388.0, 667.0, 1119.0, 2091.0, 3698.0, 7303.0, 15105.0, 27565.0, 56314.0, 51245740.0, 53498.0, 27203.0, 14238.0, 7138.0, 3511.0, 1936.0, 1064.0, 655.0, 354.0, 209.0, 148.0, 93.0, 61.0, 60.0, 44.0, 34.0, 38.0, 42.0, 22.0, 36.0, 20.0, 18.0, 10.0, 11.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-858.0, -831.578125, -805.15625, -778.734375, -752.3125, -725.890625, -699.46875, -673.046875, -646.625, -620.203125, -593.78125, -567.359375, -540.9375, -514.515625, -488.09375, -461.671875, -435.25, -408.828125, -382.40625, -355.984375, -329.5625, -303.140625, -276.71875, -250.296875, -223.875, -197.453125, -171.03125, -144.609375, -118.1875, -91.765625, -65.34375, -38.921875, -12.5, 13.921875, 40.34375, 66.765625, 93.1875, 119.609375, 146.03125, 172.453125, 198.875, 225.296875, 251.71875, 278.140625, 304.5625, 330.984375, 357.40625, 383.828125, 410.25, 436.671875, 463.09375, 489.515625, 515.9375, 542.359375, 568.78125, 595.203125, 621.625, 648.046875, 674.46875, 700.890625, 727.3125, 753.734375, 780.15625, 806.578125, 833.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 10.0, 27.0, 38.0, 28.0, 46.0, 70.0, 89.0, 133.0, 186.0, 240.0, 405.0, 543.0, 763.0, 1017.0, 1736.0, 2413.0, 3424.0, 5581.0, 9158.0, 15032.0, 25363.0, 46589.0, 90378.0, 185955.0, 425608.0, 2757793.0, 1945058.0, 399962.0, 177455.0, 86596.0, 45182.0, 25295.0, 14265.0, 8534.0, 5519.0, 3465.0, 2345.0, 1529.0, 1096.0, 743.0, 546.0, 357.0, 221.0, 179.0, 129.0, 94.0, 67.0, 48.0, 34.0, 20.0, 16.0, 22.0, 13.0, 7.0, 3.0, 10.0], "bins": [-9.2265625, -8.9549560546875, -8.683349609375, -8.4117431640625, -8.14013671875, -7.8685302734375, -7.596923828125, -7.3253173828125, -7.0537109375, -6.7821044921875, -6.510498046875, -6.2388916015625, -5.96728515625, -5.6956787109375, -5.424072265625, -5.1524658203125, -4.880859375, -4.6092529296875, -4.337646484375, -4.0660400390625, -3.79443359375, -3.5228271484375, -3.251220703125, -2.9796142578125, -2.7080078125, -2.4364013671875, -2.164794921875, -1.8931884765625, -1.62158203125, -1.3499755859375, -1.078369140625, -0.8067626953125, -0.53515625, -0.2635498046875, 0.008056640625, 0.2796630859375, 0.55126953125, 0.8228759765625, 1.094482421875, 1.3660888671875, 1.6376953125, 1.9093017578125, 2.180908203125, 2.4525146484375, 2.72412109375, 2.9957275390625, 3.267333984375, 3.5389404296875, 3.810546875, 4.0821533203125, 4.353759765625, 4.6253662109375, 4.89697265625, 5.1685791015625, 5.440185546875, 5.7117919921875, 5.9833984375, 6.2550048828125, 6.526611328125, 6.7982177734375, 7.06982421875, 7.3414306640625, 7.613037109375, 7.8846435546875, 8.15625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 11.0, 16.0, 15.0, 28.0, 24.0, 16.0, 23.0, 26.0, 22.0, 51.0, 39.0, 48.0, 41.0, 40.0, 44.0, 378.0, 620.0, 111.0, 78.0, 41.0, 48.0, 29.0, 27.0, 37.0, 28.0, 20.0, 29.0, 20.0, 23.0, 15.0, 12.0, 10.0, 6.0, 3.0, 7.0, 5.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-40.78125, -39.647705078125, -38.51416015625, -37.380615234375, -36.2470703125, -35.113525390625, -33.97998046875, -32.846435546875, -31.712890625, -30.579345703125, -29.44580078125, -28.312255859375, -27.1787109375, -26.045166015625, -24.91162109375, -23.778076171875, -22.64453125, -21.510986328125, -20.37744140625, -19.243896484375, -18.1103515625, -16.976806640625, -15.84326171875, -14.709716796875, -13.576171875, -12.442626953125, -11.30908203125, -10.175537109375, -9.0419921875, -7.908447265625, -6.77490234375, -5.641357421875, -4.5078125, -3.374267578125, -2.24072265625, -1.107177734375, 0.0263671875, 1.159912109375, 2.29345703125, 3.427001953125, 4.560546875, 5.694091796875, 6.82763671875, 7.961181640625, 9.0947265625, 10.228271484375, 11.36181640625, 12.495361328125, 13.62890625, 14.762451171875, 15.89599609375, 17.029541015625, 18.1630859375, 19.296630859375, 20.43017578125, 21.563720703125, 22.697265625, 23.830810546875, 24.96435546875, 26.097900390625, 27.2314453125, 28.364990234375, 29.49853515625, 30.632080078125, 31.765625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 8.0, 8.0, 1.0, 8.0, 19.0, 11.0, 11.0, 20.0, 33.0, 42.0, 73.0, 146.0, 159.0, 236.0, 311.0, 433.0, 623.0, 1058.0, 1552.0, 2384.0, 3692.0, 5738.0, 10076.0, 17485.0, 31531.0, 61108.0, 127712.0, 318995.0, 1881770.0, 3208185.0, 342085.0, 133423.0, 63046.0, 32864.0, 18142.0, 10552.0, 6389.0, 4062.0, 2452.0, 1617.0, 1094.0, 740.0, 503.0, 383.0, 233.0, 145.0, 79.0, 68.0, 37.0, 29.0, 30.0, 17.0, 6.0, 8.0, 9.0, 4.0, 2.0, 0.0, 3.0], "bins": [-15.9609375, -15.491943359375, -15.02294921875, -14.553955078125, -14.0849609375, -13.615966796875, -13.14697265625, -12.677978515625, -12.208984375, -11.739990234375, -11.27099609375, -10.802001953125, -10.3330078125, -9.864013671875, -9.39501953125, -8.926025390625, -8.45703125, -7.988037109375, -7.51904296875, -7.050048828125, -6.5810546875, -6.112060546875, -5.64306640625, -5.174072265625, -4.705078125, -4.236083984375, -3.76708984375, -3.298095703125, -2.8291015625, -2.360107421875, -1.89111328125, -1.422119140625, -0.953125, -0.484130859375, -0.01513671875, 0.453857421875, 0.9228515625, 1.391845703125, 1.86083984375, 2.329833984375, 2.798828125, 3.267822265625, 3.73681640625, 4.205810546875, 4.6748046875, 5.143798828125, 5.61279296875, 6.081787109375, 6.55078125, 7.019775390625, 7.48876953125, 7.957763671875, 8.4267578125, 8.895751953125, 9.36474609375, 9.833740234375, 10.302734375, 10.771728515625, 11.24072265625, 11.709716796875, 12.1787109375, 12.647705078125, 13.11669921875, 13.585693359375, 14.0546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 3.0, 7.0, 9.0, 12.0, 16.0, 15.0, 10.0, 24.0, 14.0, 28.0, 24.0, 35.0, 37.0, 35.0, 36.0, 49.0, 52.0, 49.0, 171.0, 838.0, 161.0, 66.0, 51.0, 49.0, 31.0, 28.0, 20.0, 26.0, 14.0, 27.0, 19.0, 14.0, 14.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.9375, -34.65869140625, -33.3798828125, -32.10107421875, -30.822265625, -29.54345703125, -28.2646484375, -26.98583984375, -25.70703125, -24.42822265625, -23.1494140625, -21.87060546875, -20.591796875, -19.31298828125, -18.0341796875, -16.75537109375, -15.4765625, -14.19775390625, -12.9189453125, -11.64013671875, -10.361328125, -9.08251953125, -7.8037109375, -6.52490234375, -5.24609375, -3.96728515625, -2.6884765625, -1.40966796875, -0.130859375, 1.14794921875, 2.4267578125, 3.70556640625, 4.984375, 6.26318359375, 7.5419921875, 8.82080078125, 10.099609375, 11.37841796875, 12.6572265625, 13.93603515625, 15.21484375, 16.49365234375, 17.7724609375, 19.05126953125, 20.330078125, 21.60888671875, 22.8876953125, 24.16650390625, 25.4453125, 26.72412109375, 28.0029296875, 29.28173828125, 30.560546875, 31.83935546875, 33.1181640625, 34.39697265625, 35.67578125, 36.95458984375, 38.2333984375, 39.51220703125, 40.791015625, 42.06982421875, 43.3486328125, 44.62744140625, 45.90625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 10.0, 6.0, 1.0, 14.0, 13.0, 8.0, 10.0, 28.0, 29.0, 34.0, 35.0, 51.0, 75.0, 82.0, 75.0, 115.0, 126.0, 217.0, 336.0, 488.0, 662.0, 1027.0, 1640.0, 2813.0, 5433.0, 12493.0, 38300.0, 5651095.0, 514611.0, 36406.0, 11924.0, 5330.0, 2806.0, 1699.0, 1019.0, 686.0, 465.0, 335.0, 245.0, 146.0, 123.0, 94.0, 58.0, 71.0, 39.0, 38.0, 27.0, 26.0, 9.0, 13.0, 6.0, 8.0, 12.0, 9.0, 6.0, 6.0, 3.0, 10.0, 1.0], "bins": [-103.0, -99.876953125, -96.75390625, -93.630859375, -90.5078125, -87.384765625, -84.26171875, -81.138671875, -78.015625, -74.892578125, -71.76953125, -68.646484375, -65.5234375, -62.400390625, -59.27734375, -56.154296875, -53.03125, -49.908203125, -46.78515625, -43.662109375, -40.5390625, -37.416015625, -34.29296875, -31.169921875, -28.046875, -24.923828125, -21.80078125, -18.677734375, -15.5546875, -12.431640625, -9.30859375, -6.185546875, -3.0625, 0.060546875, 3.18359375, 6.306640625, 9.4296875, 12.552734375, 15.67578125, 18.798828125, 21.921875, 25.044921875, 28.16796875, 31.291015625, 34.4140625, 37.537109375, 40.66015625, 43.783203125, 46.90625, 50.029296875, 53.15234375, 56.275390625, 59.3984375, 62.521484375, 65.64453125, 68.767578125, 71.890625, 75.013671875, 78.13671875, 81.259765625, 84.3828125, 87.505859375, 90.62890625, 93.751953125, 96.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 1.0, 5.0, 9.0, 7.0, 6.0, 8.0, 7.0, 7.0, 22.0, 28.0, 27.0, 48.0, 31.0, 56.0, 55.0, 61.0, 89.0, 813.0, 274.0, 94.0, 67.0, 48.0, 53.0, 26.0, 41.0, 25.0, 21.0, 17.0, 18.0, 10.0, 7.0, 8.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-54.9375, -53.2509765625, -51.564453125, -49.8779296875, -48.19140625, -46.5048828125, -44.818359375, -43.1318359375, -41.4453125, -39.7587890625, -38.072265625, -36.3857421875, -34.69921875, -33.0126953125, -31.326171875, -29.6396484375, -27.953125, -26.2666015625, -24.580078125, -22.8935546875, -21.20703125, -19.5205078125, -17.833984375, -16.1474609375, -14.4609375, -12.7744140625, -11.087890625, -9.4013671875, -7.71484375, -6.0283203125, -4.341796875, -2.6552734375, -0.96875, 0.7177734375, 2.404296875, 4.0908203125, 5.77734375, 7.4638671875, 9.150390625, 10.8369140625, 12.5234375, 14.2099609375, 15.896484375, 17.5830078125, 19.26953125, 20.9560546875, 22.642578125, 24.3291015625, 26.015625, 27.7021484375, 29.388671875, 31.0751953125, 32.76171875, 34.4482421875, 36.134765625, 37.8212890625, 39.5078125, 41.1943359375, 42.880859375, 44.5673828125, 46.25390625, 47.9404296875, 49.626953125, 51.3134765625, 53.0]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 10.0, 10.0, 36.0, 373.0, 449.0, 50.0, 29.0, 13.0, 8.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.73007202148438, -159.4951171875, -152.2601776123047, -145.0252227783203, -137.79026794433594, -130.55532836914062, -123.32037353515625, -116.0854263305664, -108.85047912597656, -101.61553192138672, -94.38057708740234, -87.1456298828125, -79.91068267822266, -72.67573547363281, -65.44078063964844, -58.205833435058594, -50.97087860107422, -43.73592758178711, -36.500980377197266, -29.266029357910156, -22.03108024597168, -14.796131134033203, -7.561180114746094, -0.32623291015625, 6.908718109130859, 14.143667221069336, 21.378616333007812, 28.613567352294922, 35.84851837158203, 43.083465576171875, 50.318416595458984, 57.55336380004883, 64.78831481933594, 72.02326202392578, 79.25821685791016, 86.4931640625, 93.72811126708984, 100.96305847167969, 108.19801330566406, 115.4329605102539, 122.66790771484375, 129.90286254882812, 137.13780212402344, 144.3727569580078, 151.6077117919922, 158.8426513671875, 166.07760620117188, 173.31256103515625, 180.54751586914062, 187.782470703125, 195.0174102783203, 202.2523651123047, 209.48731994628906, 216.72225952148438, 223.95721435546875, 231.19216918945312, 238.42710876464844, 245.6620635986328, 252.89700317382812, 260.1319580078125, 267.3669128417969, 274.60186767578125, 281.8367919921875, 289.0717468261719, 296.30670166015625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 9.0, 9.0, 11.0, 14.0, 26.0, 30.0, 101.0, 262.0, 312.0, 101.0, 34.0, 24.0, 18.0, 15.0, 9.0, 6.0, 7.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.35198974609375, -267.7244873046875, -259.09698486328125, -250.46946716308594, -241.84194946289062, -233.21444702148438, -224.58694458007812, -215.95944213867188, -207.33192443847656, -198.7044219970703, -190.076904296875, -181.44940185546875, -172.8218994140625, -164.1943817138672, -155.56687927246094, -146.93936157226562, -138.31185913085938, -129.68435668945312, -121.05683898925781, -112.42933654785156, -103.80182647705078, -95.17431640625, -86.54681396484375, -77.91930389404297, -69.29179382324219, -60.664283752441406, -52.03677749633789, -43.409271240234375, -34.781761169433594, -26.154251098632812, -17.526744842529297, -8.899238586425781, -0.271728515625, 8.355779647827148, 16.983287811279297, 25.610795974731445, 34.238304138183594, 42.865814208984375, 51.49332046508789, 60.120826721191406, 68.74833679199219, 77.37584686279297, 86.00335693359375, 94.630859375, 103.25836944580078, 111.88587951660156, 120.51338195800781, 129.14089965820312, 137.76840209960938, 146.39590454101562, 155.02342224121094, 163.6509246826172, 172.2784423828125, 180.90594482421875, 189.533447265625, 198.16094970703125, 206.78846740722656, 215.4159698486328, 224.04348754882812, 232.67098999023438, 241.29849243164062, 249.92601013183594, 258.55352783203125, 267.1810302734375, 275.80853271484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 9.0, 6.0, 15.0, 19.0, 27.0, 34.0, 64.0, 101.0, 190.0, 307.0, 608.0, 1337.0, 3364.0, 10476.0, 55131.0, 4049307.0, 56128.0, 10743.0, 3399.0, 1427.0, 693.0, 332.0, 193.0, 127.0, 68.0, 56.0, 38.0, 15.0, 22.0, 11.0, 10.0, 11.0, 6.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.25958251953125, -2.1773681640625, -2.09515380859375, -2.012939453125, -1.93072509765625, -1.8485107421875, -1.76629638671875, -1.68408203125, -1.60186767578125, -1.5196533203125, -1.43743896484375, -1.355224609375, -1.27301025390625, -1.1907958984375, -1.10858154296875, -1.0263671875, -0.94415283203125, -0.8619384765625, -0.77972412109375, -0.697509765625, -0.61529541015625, -0.5330810546875, -0.45086669921875, -0.36865234375, -0.28643798828125, -0.2042236328125, -0.12200927734375, -0.039794921875, 0.04241943359375, 0.1246337890625, 0.20684814453125, 0.2890625, 0.37127685546875, 0.4534912109375, 0.53570556640625, 0.617919921875, 0.70013427734375, 0.7823486328125, 0.86456298828125, 0.94677734375, 1.02899169921875, 1.1112060546875, 1.19342041015625, 1.275634765625, 1.35784912109375, 1.4400634765625, 1.52227783203125, 1.6044921875, 1.68670654296875, 1.7689208984375, 1.85113525390625, 1.933349609375, 2.01556396484375, 2.0977783203125, 2.17999267578125, 2.26220703125, 2.34442138671875, 2.4266357421875, 2.50885009765625, 2.591064453125, 2.67327880859375, 2.7554931640625, 2.83770751953125, 2.919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 6.0, 3.0, 9.0, 9.0, 12.0, 22.0, 30.0, 787.0, 40.0, 19.0, 22.0, 13.0, 4.0, 10.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3559532165527344, -0.34300994873046875, -0.3300666809082031, -0.3171234130859375, -0.3041801452636719, -0.29123687744140625, -0.2782936096191406, -0.265350341796875, -0.2524070739746094, -0.23946380615234375, -0.22652053833007812, -0.2135772705078125, -0.20063400268554688, -0.18769073486328125, -0.17474746704101562, -0.16180419921875, -0.14886093139648438, -0.13591766357421875, -0.12297439575195312, -0.1100311279296875, -0.09708786010742188, -0.08414459228515625, -0.07120132446289062, -0.058258056640625, -0.045314788818359375, -0.03237152099609375, -0.019428253173828125, -0.0064849853515625, 0.006458282470703125, 0.01940155029296875, 0.032344818115234375, 0.0452880859375, 0.058231353759765625, 0.07117462158203125, 0.08411788940429688, 0.0970611572265625, 0.11000442504882812, 0.12294769287109375, 0.13589096069335938, 0.148834228515625, 0.16177749633789062, 0.17472076416015625, 0.18766403198242188, 0.2006072998046875, 0.21355056762695312, 0.22649383544921875, 0.23943710327148438, 0.25238037109375, 0.2653236389160156, 0.27826690673828125, 0.2912101745605469, 0.3041534423828125, 0.3170967102050781, 0.33003997802734375, 0.3429832458496094, 0.355926513671875, 0.3688697814941406, 0.38181304931640625, 0.3947563171386719, 0.4076995849609375, 0.4206428527832031, 0.43358612060546875, 0.4465293884277344, 0.45947265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 17.0, 8.0, 19.0, 34.0, 24.0, 37.0, 61.0, 79.0, 116.0, 168.0, 262.0, 422.0, 640.0, 1149.0, 1853.0, 3582.0, 6597.0, 13560.0, 30810.0, 84524.0, 358678.0, 3176865.0, 379138.0, 82611.0, 28556.0, 12016.0, 5538.0, 2802.0, 1559.0, 883.0, 497.0, 357.0, 251.0, 156.0, 108.0, 79.0, 57.0, 44.0, 30.0, 24.0, 11.0, 15.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0], "bins": [-1.048828125, -1.0193023681640625, -0.989776611328125, -0.9602508544921875, -0.93072509765625, -0.9011993408203125, -0.871673583984375, -0.8421478271484375, -0.8126220703125, -0.7830963134765625, -0.753570556640625, -0.7240447998046875, -0.69451904296875, -0.6649932861328125, -0.635467529296875, -0.6059417724609375, -0.576416015625, -0.5468902587890625, -0.517364501953125, -0.4878387451171875, -0.45831298828125, -0.4287872314453125, -0.399261474609375, -0.3697357177734375, -0.3402099609375, -0.3106842041015625, -0.281158447265625, -0.2516326904296875, -0.22210693359375, -0.1925811767578125, -0.163055419921875, -0.1335296630859375, -0.10400390625, -0.0744781494140625, -0.044952392578125, -0.0154266357421875, 0.01409912109375, 0.0436248779296875, 0.073150634765625, 0.1026763916015625, 0.1322021484375, 0.1617279052734375, 0.191253662109375, 0.2207794189453125, 0.25030517578125, 0.2798309326171875, 0.309356689453125, 0.3388824462890625, 0.368408203125, 0.3979339599609375, 0.427459716796875, 0.4569854736328125, 0.48651123046875, 0.5160369873046875, 0.545562744140625, 0.5750885009765625, 0.6046142578125, 0.6341400146484375, 0.663665771484375, 0.6931915283203125, 0.72271728515625, 0.7522430419921875, 0.781768798828125, 0.8112945556640625, 0.8408203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 5.0, 9.0, 11.0, 4.0, 8.0, 15.0, 12.0, 20.0, 13.0, 20.0, 31.0, 41.0, 33.0, 59.0, 63.0, 97.0, 121.0, 152.0, 250.0, 429.0, 1044.0, 673.0, 306.0, 202.0, 114.0, 81.0, 69.0, 45.0, 28.0, 23.0, 23.0, 10.0, 14.0, 16.0, 7.0, 2.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36962890625, -0.3586769104003906, -0.34772491455078125, -0.3367729187011719, -0.3258209228515625, -0.3148689270019531, -0.30391693115234375, -0.2929649353027344, -0.282012939453125, -0.2710609436035156, -0.26010894775390625, -0.24915695190429688, -0.2382049560546875, -0.22725296020507812, -0.21630096435546875, -0.20534896850585938, -0.19439697265625, -0.18344497680664062, -0.17249298095703125, -0.16154098510742188, -0.1505889892578125, -0.13963699340820312, -0.12868499755859375, -0.11773300170898438, -0.106781005859375, -0.09582901000976562, -0.08487701416015625, -0.07392501831054688, -0.0629730224609375, -0.052021026611328125, -0.04106903076171875, -0.030117034912109375, -0.0191650390625, -0.008213043212890625, 0.00273895263671875, 0.013690948486328125, 0.0246429443359375, 0.035594940185546875, 0.04654693603515625, 0.057498931884765625, 0.068450927734375, 0.07940292358398438, 0.09035491943359375, 0.10130691528320312, 0.1122589111328125, 0.12321090698242188, 0.13416290283203125, 0.14511489868164062, 0.15606689453125, 0.16701889038085938, 0.17797088623046875, 0.18892288208007812, 0.1998748779296875, 0.21082687377929688, 0.22177886962890625, 0.23273086547851562, 0.243682861328125, 0.2546348571777344, 0.26558685302734375, 0.2765388488769531, 0.2874908447265625, 0.2984428405761719, 0.30939483642578125, 0.3203468322753906, 0.331298828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 8.0, 10.0, 33.0, 47.0, 81.0, 230.0, 415.0, 126.0, 30.0, 15.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.846606254577637, -13.577628135681152, -13.308650016784668, -13.039671897888184, -12.7706937789917, -12.501714706420898, -12.232736587524414, -11.96375846862793, -11.694780349731445, -11.425802230834961, -11.156824111938477, -10.887845993041992, -10.618867874145508, -10.349889755249023, -10.080911636352539, -9.811932563781738, -9.54295539855957, -9.273977279663086, -9.004999160766602, -8.736021041870117, -8.467042922973633, -8.198064804077148, -7.929086208343506, -7.6601080894470215, -7.391129493713379, -7.1221513748168945, -6.85317325592041, -6.584195137023926, -6.315216541290283, -6.046238422393799, -5.7772603034973145, -5.50828218460083, -5.239303112030029, -4.970324993133545, -4.7013468742370605, -4.432368278503418, -4.163390159606934, -3.894412040710449, -3.625433921813965, -3.3564558029174805, -3.087477445602417, -2.8184993267059326, -2.549520969390869, -2.2805428504943848, -2.0115647315979004, -1.742586374282837, -1.4736082553863525, -1.2046300172805786, -0.9356517791748047, -0.6666735410690308, -0.3976953625679016, -0.12871718406677246, 0.14026105403900146, 0.4092392921447754, 0.6782174110412598, 0.9471956491470337, 1.2161738872528076, 1.4851521253585815, 1.7541303634643555, 2.02310848236084, 2.292086601257324, 2.5610649585723877, 2.830043077468872, 3.0990214347839355, 3.36799955368042]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 3.0, 3.0, 9.0, 11.0, 17.0, 14.0, 17.0, 29.0, 32.0, 44.0, 49.0, 44.0, 57.0, 64.0, 72.0, 68.0, 57.0, 57.0, 55.0, 35.0, 45.0, 40.0, 36.0, 34.0, 26.0, 24.0, 14.0, 13.0, 8.0, 7.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.503812551498413, -3.399538040161133, -3.2952632904052734, -3.190988779067993, -3.086714029312134, -2.9824395179748535, -2.878164768218994, -2.773890256881714, -2.6696155071258545, -2.565340995788574, -2.461066246032715, -2.3567917346954346, -2.252516984939575, -2.148242473602295, -2.0439677238464355, -1.9396932125091553, -1.8354185819625854, -1.7311439514160156, -1.6268693208694458, -1.522594690322876, -1.4183200597763062, -1.3140454292297363, -1.209770917892456, -1.1054961681365967, -1.0012216567993164, -0.8969470262527466, -0.7926723957061768, -0.6883977651596069, -0.5841231346130371, -0.47984856367111206, -0.37557393312454224, -0.2712993025779724, -0.1670246124267578, -0.06274998933076859, 0.04152463376522064, 0.14579924941062927, 0.2500738799571991, 0.35434848070144653, 0.45862311124801636, 0.5628977417945862, 0.667172372341156, 0.7714470028877258, 0.8757216334342957, 0.9799962043762207, 1.0842708349227905, 1.1885454654693604, 1.2928200960159302, 1.3970947265625, 1.5013693571090698, 1.6056439876556396, 1.7099186182022095, 1.8141932487487793, 1.9184678792953491, 2.022742509841919, 2.127017021179199, 2.2312917709350586, 2.335566282272339, 2.439840793609619, 2.5441155433654785, 2.648390054702759, 2.752664804458618, 2.8569393157958984, 2.961214065551758, 3.065488576889038, 3.1697633266448975]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 8.0, 9.0, 15.0, 17.0, 26.0, 28.0, 46.0, 67.0, 117.0, 128.0, 201.0, 361.0, 552.0, 1028.0, 2019.0, 4456.0, 12702.0, 85256.0, 894361.0, 32071.0, 8208.0, 3197.0, 1511.0, 786.0, 469.0, 310.0, 180.0, 121.0, 83.0, 57.0, 46.0, 27.0, 21.0, 15.0, 11.0, 8.0, 5.0, 7.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0], "bins": [-2.732421875, -2.65716552734375, -2.5819091796875, -2.50665283203125, -2.431396484375, -2.35614013671875, -2.2808837890625, -2.20562744140625, -2.13037109375, -2.05511474609375, -1.9798583984375, -1.90460205078125, -1.829345703125, -1.75408935546875, -1.6788330078125, -1.60357666015625, -1.5283203125, -1.45306396484375, -1.3778076171875, -1.30255126953125, -1.227294921875, -1.15203857421875, -1.0767822265625, -1.00152587890625, -0.92626953125, -0.85101318359375, -0.7757568359375, -0.70050048828125, -0.625244140625, -0.54998779296875, -0.4747314453125, -0.39947509765625, -0.32421875, -0.24896240234375, -0.1737060546875, -0.09844970703125, -0.023193359375, 0.05206298828125, 0.1273193359375, 0.20257568359375, 0.27783203125, 0.35308837890625, 0.4283447265625, 0.50360107421875, 0.578857421875, 0.65411376953125, 0.7293701171875, 0.80462646484375, 0.8798828125, 0.95513916015625, 1.0303955078125, 1.10565185546875, 1.180908203125, 1.25616455078125, 1.3314208984375, 1.40667724609375, 1.48193359375, 1.55718994140625, 1.6324462890625, 1.70770263671875, 1.782958984375, 1.85821533203125, 1.9334716796875, 2.00872802734375, 2.083984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 3.0, 6.0, 5.0, 11.0, 12.0, 20.0, 88.0, 294.0, 334.0, 119.0, 35.0, 25.0, 9.0, 6.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.36907196044921875, -0.3582611083984375, -0.34745025634765625, -0.336639404296875, -0.32582855224609375, -0.3150177001953125, -0.30420684814453125, -0.29339599609375, -0.28258514404296875, -0.2717742919921875, -0.26096343994140625, -0.250152587890625, -0.23934173583984375, -0.2285308837890625, -0.21772003173828125, -0.2069091796875, -0.19609832763671875, -0.1852874755859375, -0.17447662353515625, -0.163665771484375, -0.15285491943359375, -0.1420440673828125, -0.13123321533203125, -0.12042236328125, -0.10961151123046875, -0.0988006591796875, -0.08798980712890625, -0.077178955078125, -0.06636810302734375, -0.0555572509765625, -0.04474639892578125, -0.033935546875, -0.02312469482421875, -0.0123138427734375, -0.00150299072265625, 0.009307861328125, 0.02011871337890625, 0.0309295654296875, 0.04174041748046875, 0.05255126953125, 0.06336212158203125, 0.0741729736328125, 0.08498382568359375, 0.095794677734375, 0.10660552978515625, 0.1174163818359375, 0.12822723388671875, 0.1390380859375, 0.14984893798828125, 0.1606597900390625, 0.17147064208984375, 0.182281494140625, 0.19309234619140625, 0.2039031982421875, 0.21471405029296875, 0.22552490234375, 0.23633575439453125, 0.2471466064453125, 0.25795745849609375, 0.268768310546875, 0.27957916259765625, 0.2903900146484375, 0.30120086669921875, 0.31201171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 6.0, 14.0, 18.0, 17.0, 34.0, 34.0, 83.0, 136.0, 214.0, 384.0, 765.0, 2068.0, 8886.0, 167181.0, 838591.0, 24328.0, 3476.0, 1077.0, 520.0, 264.0, 145.0, 98.0, 62.0, 26.0, 31.0, 23.0, 20.0, 9.0, 5.0, 4.0, 4.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7734375, -3.6485595703125, -3.523681640625, -3.3988037109375, -3.27392578125, -3.1490478515625, -3.024169921875, -2.8992919921875, -2.7744140625, -2.6495361328125, -2.524658203125, -2.3997802734375, -2.27490234375, -2.1500244140625, -2.025146484375, -1.9002685546875, -1.775390625, -1.6505126953125, -1.525634765625, -1.4007568359375, -1.27587890625, -1.1510009765625, -1.026123046875, -0.9012451171875, -0.7763671875, -0.6514892578125, -0.526611328125, -0.4017333984375, -0.27685546875, -0.1519775390625, -0.027099609375, 0.0977783203125, 0.22265625, 0.3475341796875, 0.472412109375, 0.5972900390625, 0.72216796875, 0.8470458984375, 0.971923828125, 1.0968017578125, 1.2216796875, 1.3465576171875, 1.471435546875, 1.5963134765625, 1.72119140625, 1.8460693359375, 1.970947265625, 2.0958251953125, 2.220703125, 2.3455810546875, 2.470458984375, 2.5953369140625, 2.72021484375, 2.8450927734375, 2.969970703125, 3.0948486328125, 3.2197265625, 3.3446044921875, 3.469482421875, 3.5943603515625, 3.71923828125, 3.8441162109375, 3.968994140625, 4.0938720703125, 4.21875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 5.0, 2.0, 10.0, 6.0, 8.0, 10.0, 12.0, 13.0, 19.0, 19.0, 19.0, 25.0, 21.0, 30.0, 28.0, 32.0, 26.0, 21.0, 31.0, 37.0, 41.0, 28.0, 50.0, 41.0, 43.0, 36.0, 31.0, 35.0, 31.0, 34.0, 30.0, 23.0, 31.0, 27.0, 21.0, 12.0, 12.0, 14.0, 11.0, 13.0, 6.0, 3.0, 10.0, 8.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0], "bins": [-0.96923828125, -0.9406356811523438, -0.9120330810546875, -0.8834304809570312, -0.854827880859375, -0.8262252807617188, -0.7976226806640625, -0.7690200805664062, -0.74041748046875, -0.7118148803710938, -0.6832122802734375, -0.6546096801757812, -0.626007080078125, -0.5974044799804688, -0.5688018798828125, -0.5401992797851562, -0.5115966796875, -0.48299407958984375, -0.4543914794921875, -0.42578887939453125, -0.397186279296875, -0.36858367919921875, -0.3399810791015625, -0.31137847900390625, -0.28277587890625, -0.25417327880859375, -0.2255706787109375, -0.19696807861328125, -0.168365478515625, -0.13976287841796875, -0.1111602783203125, -0.08255767822265625, -0.053955078125, -0.02535247802734375, 0.0032501220703125, 0.03185272216796875, 0.060455322265625, 0.08905792236328125, 0.1176605224609375, 0.14626312255859375, 0.17486572265625, 0.20346832275390625, 0.2320709228515625, 0.26067352294921875, 0.289276123046875, 0.31787872314453125, 0.3464813232421875, 0.37508392333984375, 0.4036865234375, 0.43228912353515625, 0.4608917236328125, 0.48949432373046875, 0.518096923828125, 0.5466995239257812, 0.5753021240234375, 0.6039047241210938, 0.63250732421875, 0.6611099243164062, 0.6897125244140625, 0.7183151245117188, 0.746917724609375, 0.7755203247070312, 0.8041229248046875, 0.8327255249023438, 0.861328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 11.0, 16.0, 20.0, 22.0, 31.0, 55.0, 97.0, 153.0, 341.0, 851.0, 3060.0, 25222.0, 993765.0, 20407.0, 2885.0, 856.0, 311.0, 154.0, 83.0, 59.0, 38.0, 22.0, 20.0, 11.0, 12.0, 7.0, 4.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.16015625, -4.00299072265625, -3.8458251953125, -3.68865966796875, -3.531494140625, -3.37432861328125, -3.2171630859375, -3.05999755859375, -2.90283203125, -2.74566650390625, -2.5885009765625, -2.43133544921875, -2.274169921875, -2.11700439453125, -1.9598388671875, -1.80267333984375, -1.6455078125, -1.48834228515625, -1.3311767578125, -1.17401123046875, -1.016845703125, -0.85968017578125, -0.7025146484375, -0.54534912109375, -0.38818359375, -0.23101806640625, -0.0738525390625, 0.08331298828125, 0.240478515625, 0.39764404296875, 0.5548095703125, 0.71197509765625, 0.869140625, 1.02630615234375, 1.1834716796875, 1.34063720703125, 1.497802734375, 1.65496826171875, 1.8121337890625, 1.96929931640625, 2.12646484375, 2.28363037109375, 2.4407958984375, 2.59796142578125, 2.755126953125, 2.91229248046875, 3.0694580078125, 3.22662353515625, 3.3837890625, 3.54095458984375, 3.6981201171875, 3.85528564453125, 4.012451171875, 4.16961669921875, 4.3267822265625, 4.48394775390625, 4.64111328125, 4.79827880859375, 4.9554443359375, 5.11260986328125, 5.269775390625, 5.42694091796875, 5.5841064453125, 5.74127197265625, 5.8984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 2.0, 6.0, 7.0, 5.0, 13.0, 23.0, 25.0, 67.0, 113.0, 182.0, 203.0, 137.0, 95.0, 41.0, 31.0, 19.0, 12.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00173187255859375, -0.001681312918663025, -0.0016307532787322998, -0.0015801936388015747, -0.0015296339988708496, -0.0014790743589401245, -0.0014285147190093994, -0.0013779550790786743, -0.0013273954391479492, -0.0012768357992172241, -0.001226276159286499, -0.001175716519355774, -0.0011251568794250488, -0.0010745972394943237, -0.0010240375995635986, -0.0009734779596328735, -0.0009229183197021484, -0.0008723586797714233, -0.0008217990398406982, -0.0007712393999099731, -0.000720679759979248, -0.000670120120048523, -0.0006195604801177979, -0.0005690008401870728, -0.0005184412002563477, -0.00046788156032562256, -0.00041732192039489746, -0.00036676228046417236, -0.00031620264053344727, -0.00026564300060272217, -0.00021508336067199707, -0.00016452372074127197, -0.00011396408081054688, -6.340444087982178e-05, -1.284480094909668e-05, 3.771483898162842e-05, 8.827447891235352e-05, 0.0001388341188430786, 0.0001893937587738037, 0.0002399533987045288, 0.0002905130386352539, 0.000341072678565979, 0.0003916323184967041, 0.0004421919584274292, 0.0004927515983581543, 0.0005433112382888794, 0.0005938708782196045, 0.0006444305181503296, 0.0006949901580810547, 0.0007455497980117798, 0.0007961094379425049, 0.00084666907787323, 0.0008972287178039551, 0.0009477883577346802, 0.0009983479976654053, 0.0010489076375961304, 0.0010994672775268555, 0.0011500269174575806, 0.0012005865573883057, 0.0012511461973190308, 0.0013017058372497559, 0.001352265477180481, 0.001402825117111206, 0.0014533847570419312, 0.0015039443969726562]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 7.0, 11.0, 13.0, 21.0, 25.0, 34.0, 57.0, 85.0, 124.0, 201.0, 336.0, 553.0, 995.0, 1966.0, 4840.0, 13859.0, 63337.0, 779833.0, 146771.0, 22733.0, 6858.0, 2842.0, 1275.0, 700.0, 378.0, 238.0, 156.0, 88.0, 62.0, 35.0, 32.0, 23.0, 15.0, 10.0, 8.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9501953125, -1.8845062255859375, -1.818817138671875, -1.7531280517578125, -1.68743896484375, -1.6217498779296875, -1.556060791015625, -1.4903717041015625, -1.4246826171875, -1.3589935302734375, -1.293304443359375, -1.2276153564453125, -1.16192626953125, -1.0962371826171875, -1.030548095703125, -0.9648590087890625, -0.899169921875, -0.8334808349609375, -0.767791748046875, -0.7021026611328125, -0.63641357421875, -0.5707244873046875, -0.505035400390625, -0.4393463134765625, -0.3736572265625, -0.3079681396484375, -0.242279052734375, -0.1765899658203125, -0.11090087890625, -0.0452117919921875, 0.020477294921875, 0.0861663818359375, 0.15185546875, 0.2175445556640625, 0.283233642578125, 0.3489227294921875, 0.41461181640625, 0.4803009033203125, 0.545989990234375, 0.6116790771484375, 0.6773681640625, 0.7430572509765625, 0.808746337890625, 0.8744354248046875, 0.94012451171875, 1.0058135986328125, 1.071502685546875, 1.1371917724609375, 1.202880859375, 1.2685699462890625, 1.334259033203125, 1.3999481201171875, 1.46563720703125, 1.5313262939453125, 1.597015380859375, 1.6627044677734375, 1.7283935546875, 1.7940826416015625, 1.859771728515625, 1.9254608154296875, 1.99114990234375, 2.0568389892578125, 2.122528076171875, 2.1882171630859375, 2.25390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 16.0, 12.0, 18.0, 16.0, 31.0, 24.0, 56.0, 75.0, 111.0, 144.0, 149.0, 88.0, 62.0, 47.0, 37.0, 23.0, 22.0, 11.0, 15.0, 6.0, 4.0, 4.0, 2.0, 5.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8515625, -1.78985595703125, -1.7281494140625, -1.66644287109375, -1.604736328125, -1.54302978515625, -1.4813232421875, -1.41961669921875, -1.35791015625, -1.29620361328125, -1.2344970703125, -1.17279052734375, -1.111083984375, -1.04937744140625, -0.9876708984375, -0.92596435546875, -0.8642578125, -0.80255126953125, -0.7408447265625, -0.67913818359375, -0.617431640625, -0.55572509765625, -0.4940185546875, -0.43231201171875, -0.37060546875, -0.30889892578125, -0.2471923828125, -0.18548583984375, -0.123779296875, -0.06207275390625, -0.0003662109375, 0.06134033203125, 0.123046875, 0.18475341796875, 0.2464599609375, 0.30816650390625, 0.369873046875, 0.43157958984375, 0.4932861328125, 0.55499267578125, 0.61669921875, 0.67840576171875, 0.7401123046875, 0.80181884765625, 0.863525390625, 0.92523193359375, 0.9869384765625, 1.04864501953125, 1.1103515625, 1.17205810546875, 1.2337646484375, 1.29547119140625, 1.357177734375, 1.41888427734375, 1.4805908203125, 1.54229736328125, 1.60400390625, 1.66571044921875, 1.7274169921875, 1.78912353515625, 1.850830078125, 1.91253662109375, 1.9742431640625, 2.03594970703125, 2.09765625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 12.0, 56.0, 229.0, 521.0, 123.0, 28.0, 14.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.99327087402344, -31.83414077758789, -30.675012588500977, -29.515884399414062, -28.356754302978516, -27.19762420654297, -26.038496017456055, -24.87936782836914, -23.720237731933594, -22.561107635498047, -21.401979446411133, -20.24285125732422, -19.083721160888672, -17.924591064453125, -16.76546287536621, -15.60633373260498, -14.44720458984375, -13.28807544708252, -12.128946304321289, -10.969817161560059, -9.810688018798828, -8.651558876037598, -7.492429733276367, -6.333300590515137, -5.174171447753906, -4.015042304992676, -2.8559131622314453, -1.6967840194702148, -0.5376548767089844, 0.6214742660522461, 1.7806034088134766, 2.939732551574707, 4.098865509033203, 5.257994651794434, 6.417123794555664, 7.5762529373168945, 8.735382080078125, 9.894511222839355, 11.053640365600586, 12.212769508361816, 13.371898651123047, 14.531027793884277, 15.690156936645508, 16.849285125732422, 18.00841522216797, 19.167545318603516, 20.32667350769043, 21.485801696777344, 22.64493179321289, 23.804061889648438, 24.96319007873535, 26.122318267822266, 27.281448364257812, 28.44057846069336, 29.599706649780273, 30.758834838867188, 31.917964935302734, 33.07709503173828, 34.23622131347656, 35.39535140991211, 36.554481506347656, 37.7136116027832, 38.87274169921875, 40.03186798095703, 41.19099807739258]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 10.0, 8.0, 13.0, 17.0, 42.0, 39.0, 85.0, 103.0, 144.0, 157.0, 128.0, 88.0, 61.0, 37.0, 24.0, 15.0, 6.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.332351684570312, -19.522924423217773, -18.713499069213867, -17.904071807861328, -17.094646453857422, -16.285219192504883, -15.47579288482666, -14.666366577148438, -13.856939315795898, -13.047513008117676, -12.238086700439453, -11.428659439086914, -10.619233131408691, -9.809806823730469, -9.000380516052246, -8.190954208374023, -7.381527900695801, -6.572101593017578, -5.762674808502197, -4.953248500823975, -4.143821716308594, -3.334395408630371, -2.5249691009521484, -1.7155423164367676, -0.9061160087585449, -0.09668952226638794, 0.712736964225769, 1.5221633911132812, 2.331589937210083, 3.1410164833068848, 3.9504427909851074, 4.759869575500488, 5.569295883178711, 6.378722190856934, 7.1881489753723145, 7.997575283050537, 8.807002067565918, 9.61642837524414, 10.425854682922363, 11.235280990600586, 12.044708251953125, 12.854134559631348, 13.66356086730957, 14.47298812866211, 15.282414436340332, 16.091840744018555, 16.901268005371094, 17.710693359375, 18.520118713378906, 19.329545974731445, 20.13897132873535, 20.94839859008789, 21.757823944091797, 22.567251205444336, 23.376678466796875, 24.18610382080078, 24.99553108215332, 25.80495834350586, 26.614383697509766, 27.423810958862305, 28.23323631286621, 29.04266357421875, 29.852088928222656, 30.661516189575195, 31.470943450927734]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 8.0, 7.0, 6.0, 11.0, 20.0, 24.0, 50.0, 186.0, 28551.0, 4164094.0, 1038.0, 165.0, 52.0, 27.0, 19.0, 11.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.4375, -34.865234375, -33.29296875, -31.720703125, -30.1484375, -28.576171875, -27.00390625, -25.431640625, -23.859375, -22.287109375, -20.71484375, -19.142578125, -17.5703125, -15.998046875, -14.42578125, -12.853515625, -11.28125, -9.708984375, -8.13671875, -6.564453125, -4.9921875, -3.419921875, -1.84765625, -0.275390625, 1.296875, 2.869140625, 4.44140625, 6.013671875, 7.5859375, 9.158203125, 10.73046875, 12.302734375, 13.875, 15.447265625, 17.01953125, 18.591796875, 20.1640625, 21.736328125, 23.30859375, 24.880859375, 26.453125, 28.025390625, 29.59765625, 31.169921875, 32.7421875, 34.314453125, 35.88671875, 37.458984375, 39.03125, 40.603515625, 42.17578125, 43.748046875, 45.3203125, 46.892578125, 48.46484375, 50.037109375, 51.609375, 53.181640625, 54.75390625, 56.326171875, 57.8984375, 59.470703125, 61.04296875, 62.615234375, 64.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 11.0, 5.0, 7.0, 18.0, 27.0, 69.0, 84.0, 130.0, 160.0, 157.0, 112.0, 64.0, 44.0, 32.0, 16.0, 6.0, 8.0, 5.0, 9.0, 4.0, 1.0, 6.0, 3.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14990234375, -0.14412879943847656, -0.13835525512695312, -0.1325817108154297, -0.12680816650390625, -0.12103462219238281, -0.11526107788085938, -0.10948753356933594, -0.1037139892578125, -0.09794044494628906, -0.09216690063476562, -0.08639335632324219, -0.08061981201171875, -0.07484626770019531, -0.06907272338867188, -0.06329917907714844, -0.057525634765625, -0.05175209045410156, -0.045978546142578125, -0.04020500183105469, -0.03443145751953125, -0.028657913208007812, -0.022884368896484375, -0.017110824584960938, -0.0113372802734375, -0.0055637359619140625, 0.000209808349609375, 0.0059833526611328125, 0.01175689697265625, 0.017530441284179688, 0.023303985595703125, 0.029077529907226562, 0.03485107421875, 0.04062461853027344, 0.046398162841796875, 0.05217170715332031, 0.05794525146484375, 0.06371879577636719, 0.06949234008789062, 0.07526588439941406, 0.0810394287109375, 0.08681297302246094, 0.09258651733398438, 0.09836006164550781, 0.10413360595703125, 0.10990715026855469, 0.11568069458007812, 0.12145423889160156, 0.127227783203125, 0.13300132751464844, 0.13877487182617188, 0.1445484161376953, 0.15032196044921875, 0.1560955047607422, 0.16186904907226562, 0.16764259338378906, 0.1734161376953125, 0.17918968200683594, 0.18496322631835938, 0.1907367706298828, 0.19651031494140625, 0.2022838592529297, 0.20805740356445312, 0.21383094787597656, 0.2196044921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 3.0, 6.0, 13.0, 21.0, 41.0, 44.0, 71.0, 93.0, 134.0, 204.0, 423.0, 1695.0, 344979.0, 3843791.0, 2301.0, 311.0, 97.0, 31.0, 11.0, 7.0, 3.0, 4.0, 2.0], "bins": [-19.671875, -19.308074951171875, -18.94427490234375, -18.580474853515625, -18.2166748046875, -17.852874755859375, -17.48907470703125, -17.125274658203125, -16.761474609375, -16.397674560546875, -16.03387451171875, -15.670074462890625, -15.3062744140625, -14.942474365234375, -14.57867431640625, -14.214874267578125, -13.85107421875, -13.487274169921875, -13.12347412109375, -12.759674072265625, -12.3958740234375, -12.032073974609375, -11.66827392578125, -11.304473876953125, -10.940673828125, -10.576873779296875, -10.21307373046875, -9.849273681640625, -9.4854736328125, -9.121673583984375, -8.75787353515625, -8.394073486328125, -8.0302734375, -7.666473388671875, -7.30267333984375, -6.938873291015625, -6.5750732421875, -6.211273193359375, -5.84747314453125, -5.483673095703125, -5.119873046875, -4.756072998046875, -4.39227294921875, -4.028472900390625, -3.6646728515625, -3.300872802734375, -2.93707275390625, -2.573272705078125, -2.20947265625, -1.845672607421875, -1.48187255859375, -1.118072509765625, -0.7542724609375, -0.390472412109375, -0.02667236328125, 0.337127685546875, 0.700927734375, 1.064727783203125, 1.42852783203125, 1.792327880859375, 2.1561279296875, 2.519927978515625, 2.88372802734375, 3.247528076171875, 3.611328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 10.0, 8.0, 18.0, 30.0, 23.0, 62.0, 113.0, 230.0, 454.0, 981.0, 1178.0, 410.0, 180.0, 107.0, 60.0, 47.0, 32.0, 25.0, 26.0, 9.0, 16.0, 9.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326904296875, -0.3175849914550781, -0.30826568603515625, -0.2989463806152344, -0.2896270751953125, -0.2803077697753906, -0.27098846435546875, -0.2616691589355469, -0.252349853515625, -0.24303054809570312, -0.23371124267578125, -0.22439193725585938, -0.2150726318359375, -0.20575332641601562, -0.19643402099609375, -0.18711471557617188, -0.17779541015625, -0.16847610473632812, -0.15915679931640625, -0.14983749389648438, -0.1405181884765625, -0.13119888305664062, -0.12187957763671875, -0.11256027221679688, -0.103240966796875, -0.09392166137695312, -0.08460235595703125, -0.07528305053710938, -0.0659637451171875, -0.056644439697265625, -0.04732513427734375, -0.038005828857421875, -0.0286865234375, -0.019367218017578125, -0.01004791259765625, -0.000728607177734375, 0.0085906982421875, 0.017910003662109375, 0.02722930908203125, 0.036548614501953125, 0.045867919921875, 0.055187225341796875, 0.06450653076171875, 0.07382583618164062, 0.0831451416015625, 0.09246444702148438, 0.10178375244140625, 0.11110305786132812, 0.12042236328125, 0.12974166870117188, 0.13906097412109375, 0.14838027954101562, 0.1576995849609375, 0.16701889038085938, 0.17633819580078125, 0.18565750122070312, 0.194976806640625, 0.20429611206054688, 0.21361541748046875, 0.22293472290039062, 0.2322540283203125, 0.24157333374023438, 0.25089263916015625, 0.2602119445800781, 0.26953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 77.0, 904.0, 24.0, 2.0, 2.0, 2.0], "bins": [-90.9687728881836, -89.4393539428711, -87.90994262695312, -86.38052368164062, -84.85110473632812, -83.32168579101562, -81.79227447509766, -80.26285552978516, -78.73343658447266, -77.20401763916016, -75.67460632324219, -74.14518737792969, -72.61576843261719, -71.08634948730469, -69.55693817138672, -68.02751922607422, -66.49810791015625, -64.96868896484375, -63.439273834228516, -61.90985870361328, -60.38043975830078, -58.85102462768555, -57.32160949707031, -55.79219055175781, -54.26277160644531, -52.73335647583008, -51.20393753051758, -49.674522399902344, -48.145103454589844, -46.61568832397461, -45.086273193359375, -43.556854248046875, -42.02743911743164, -40.498023986816406, -38.968605041503906, -37.43918991088867, -35.90977096557617, -34.38035583496094, -32.85093688964844, -31.321521759033203, -29.792102813720703, -28.262685775756836, -26.73326873779297, -25.203853607177734, -23.674434661865234, -22.14501953125, -20.615602493286133, -19.086185455322266, -17.55677032470703, -16.027353286743164, -14.497936248779297, -12.968520164489746, -11.439103126525879, -9.909686088562012, -8.380270004272461, -6.850852966308594, -5.32143497467041, -3.792018175125122, -2.262601375579834, -0.733184814453125, 0.7962322235107422, 2.3256492614746094, 3.85506534576416, 5.384482383728027, 6.9138994216918945]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 15.0, 37.0, 63.0, 87.0, 146.0, 158.0, 138.0, 130.0, 92.0, 48.0, 26.0, 21.0, 12.0, 10.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.495293617248535, -6.3571600914001465, -6.219026565551758, -6.080893039703369, -5.9427595138549805, -5.804625988006592, -5.666492462158203, -5.5283589363098145, -5.390225410461426, -5.252091884613037, -5.113958358764648, -4.97582483291626, -4.837691307067871, -4.699557781219482, -4.561424255371094, -4.423290729522705, -4.285157203674316, -4.147023677825928, -4.008890151977539, -3.8707566261291504, -3.7326231002807617, -3.594489574432373, -3.4563560485839844, -3.3182225227355957, -3.1800894737243652, -3.0419559478759766, -2.903822422027588, -2.765688896179199, -2.6275553703308105, -2.489421844482422, -2.351288318634033, -2.2131547927856445, -2.075021266937256, -1.9368877410888672, -1.7987542152404785, -1.6606206893920898, -1.5224871635437012, -1.3843536376953125, -1.2462202310562134, -1.1080867052078247, -0.969953179359436, -0.8318196535110474, -0.6936861276626587, -0.5555526614189148, -0.4174191355705261, -0.27928560972213745, -0.14115214347839355, -0.003018617630004883, 0.1351149082183838, 0.27324843406677246, 0.41138193011283875, 0.549515426158905, 0.6876489520072937, 0.8257824778556824, 0.9639159440994263, 1.102049469947815, 1.2401829957962036, 1.3783165216445923, 1.516450047492981, 1.65458345413208, 1.7927169799804688, 1.9308505058288574, 2.068984031677246, 2.2071175575256348, 2.3452510833740234]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 8.0, 9.0, 13.0, 10.0, 17.0, 19.0, 46.0, 69.0, 119.0, 191.0, 361.0, 617.0, 1194.0, 2630.0, 7836.0, 37440.0, 735960.0, 232241.0, 20652.0, 5110.0, 1890.0, 919.0, 500.0, 282.0, 155.0, 100.0, 58.0, 40.0, 24.0, 11.0, 12.0, 13.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.41058349609375, -2.3172607421875, -2.22393798828125, -2.130615234375, -2.03729248046875, -1.9439697265625, -1.85064697265625, -1.75732421875, -1.66400146484375, -1.5706787109375, -1.47735595703125, -1.384033203125, -1.29071044921875, -1.1973876953125, -1.10406494140625, -1.0107421875, -0.91741943359375, -0.8240966796875, -0.73077392578125, -0.637451171875, -0.54412841796875, -0.4508056640625, -0.35748291015625, -0.26416015625, -0.17083740234375, -0.0775146484375, 0.01580810546875, 0.109130859375, 0.20245361328125, 0.2957763671875, 0.38909912109375, 0.482421875, 0.57574462890625, 0.6690673828125, 0.76239013671875, 0.855712890625, 0.94903564453125, 1.0423583984375, 1.13568115234375, 1.22900390625, 1.32232666015625, 1.4156494140625, 1.50897216796875, 1.602294921875, 1.69561767578125, 1.7889404296875, 1.88226318359375, 1.9755859375, 2.06890869140625, 2.1622314453125, 2.25555419921875, 2.348876953125, 2.44219970703125, 2.5355224609375, 2.62884521484375, 2.72216796875, 2.81549072265625, 2.9088134765625, 3.00213623046875, 3.095458984375, 3.18878173828125, 3.2821044921875, 3.37542724609375, 3.46875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 8.0, 5.0, 8.0, 2.0, 17.0, 29.0, 55.0, 70.0, 104.0, 125.0, 171.0, 135.0, 79.0, 54.0, 39.0, 26.0, 21.0, 8.0, 7.0, 3.0, 9.0, 2.0, 3.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1435546875, -0.13812637329101562, -0.13269805908203125, -0.12726974487304688, -0.1218414306640625, -0.11641311645507812, -0.11098480224609375, -0.10555648803710938, -0.100128173828125, -0.09469985961914062, -0.08927154541015625, -0.08384323120117188, -0.0784149169921875, -0.07298660278320312, -0.06755828857421875, -0.062129974365234375, -0.05670166015625, -0.051273345947265625, -0.04584503173828125, -0.040416717529296875, -0.0349884033203125, -0.029560089111328125, -0.02413177490234375, -0.018703460693359375, -0.013275146484375, -0.007846832275390625, -0.00241851806640625, 0.003009796142578125, 0.0084381103515625, 0.013866424560546875, 0.01929473876953125, 0.024723052978515625, 0.0301513671875, 0.035579681396484375, 0.04100799560546875, 0.046436309814453125, 0.0518646240234375, 0.057292938232421875, 0.06272125244140625, 0.06814956665039062, 0.073577880859375, 0.07900619506835938, 0.08443450927734375, 0.08986282348632812, 0.0952911376953125, 0.10071945190429688, 0.10614776611328125, 0.11157608032226562, 0.11700439453125, 0.12243270874023438, 0.12786102294921875, 0.13328933715820312, 0.1387176513671875, 0.14414596557617188, 0.14957427978515625, 0.15500259399414062, 0.160430908203125, 0.16585922241210938, 0.17128753662109375, 0.17671585083007812, 0.1821441650390625, 0.18757247924804688, 0.19300079345703125, 0.19842910766601562, 0.203857421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 14.0, 24.0, 24.0, 30.0, 63.0, 68.0, 126.0, 280.0, 523.0, 1170.0, 4048.0, 27953.0, 696143.0, 297384.0, 15604.0, 2968.0, 1011.0, 494.0, 226.0, 122.0, 94.0, 62.0, 35.0, 22.0, 15.0, 8.0, 1.0, 5.0, 4.0, 4.0, 1.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.818359375, -2.735137939453125, -2.65191650390625, -2.568695068359375, -2.4854736328125, -2.402252197265625, -2.31903076171875, -2.235809326171875, -2.152587890625, -2.069366455078125, -1.98614501953125, -1.902923583984375, -1.8197021484375, -1.736480712890625, -1.65325927734375, -1.570037841796875, -1.48681640625, -1.403594970703125, -1.32037353515625, -1.237152099609375, -1.1539306640625, -1.070709228515625, -0.98748779296875, -0.904266357421875, -0.821044921875, -0.737823486328125, -0.65460205078125, -0.571380615234375, -0.4881591796875, -0.404937744140625, -0.32171630859375, -0.238494873046875, -0.1552734375, -0.072052001953125, 0.01116943359375, 0.094390869140625, 0.1776123046875, 0.260833740234375, 0.34405517578125, 0.427276611328125, 0.510498046875, 0.593719482421875, 0.67694091796875, 0.760162353515625, 0.8433837890625, 0.926605224609375, 1.00982666015625, 1.093048095703125, 1.17626953125, 1.259490966796875, 1.34271240234375, 1.425933837890625, 1.5091552734375, 1.592376708984375, 1.67559814453125, 1.758819580078125, 1.842041015625, 1.925262451171875, 2.00848388671875, 2.091705322265625, 2.1749267578125, 2.258148193359375, 2.34136962890625, 2.424591064453125, 2.5078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 8.0, 11.0, 8.0, 12.0, 17.0, 21.0, 16.0, 12.0, 20.0, 31.0, 38.0, 31.0, 33.0, 44.0, 29.0, 42.0, 48.0, 53.0, 48.0, 47.0, 37.0, 34.0, 37.0, 51.0, 43.0, 31.0, 28.0, 26.0, 19.0, 18.0, 17.0, 18.0, 15.0, 8.0, 7.0, 9.0, 3.0, 6.0, 5.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5439453125, -0.5257949829101562, -0.5076446533203125, -0.48949432373046875, -0.471343994140625, -0.45319366455078125, -0.4350433349609375, -0.41689300537109375, -0.39874267578125, -0.38059234619140625, -0.3624420166015625, -0.34429168701171875, -0.326141357421875, -0.30799102783203125, -0.2898406982421875, -0.27169036865234375, -0.2535400390625, -0.23538970947265625, -0.2172393798828125, -0.19908905029296875, -0.180938720703125, -0.16278839111328125, -0.1446380615234375, -0.12648773193359375, -0.10833740234375, -0.09018707275390625, -0.0720367431640625, -0.05388641357421875, -0.035736083984375, -0.01758575439453125, 0.0005645751953125, 0.01871490478515625, 0.036865234375, 0.05501556396484375, 0.0731658935546875, 0.09131622314453125, 0.109466552734375, 0.12761688232421875, 0.1457672119140625, 0.16391754150390625, 0.18206787109375, 0.20021820068359375, 0.2183685302734375, 0.23651885986328125, 0.254669189453125, 0.27281951904296875, 0.2909698486328125, 0.30912017822265625, 0.3272705078125, 0.34542083740234375, 0.3635711669921875, 0.38172149658203125, 0.399871826171875, 0.41802215576171875, 0.4361724853515625, 0.45432281494140625, 0.47247314453125, 0.49062347412109375, 0.5087738037109375, 0.5269241333007812, 0.545074462890625, 0.5632247924804688, 0.5813751220703125, 0.5995254516601562, 0.61767578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 7.0, 6.0, 13.0, 17.0, 21.0, 40.0, 44.0, 67.0, 134.0, 251.0, 532.0, 1226.0, 4391.0, 36072.0, 970455.0, 29235.0, 3875.0, 1122.0, 445.0, 217.0, 121.0, 84.0, 43.0, 24.0, 13.0, 14.0, 16.0, 9.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.76629638671875, -5.5989990234375, -5.43170166015625, -5.264404296875, -5.09710693359375, -4.9298095703125, -4.76251220703125, -4.59521484375, -4.42791748046875, -4.2606201171875, -4.09332275390625, -3.926025390625, -3.75872802734375, -3.5914306640625, -3.42413330078125, -3.2568359375, -3.08953857421875, -2.9222412109375, -2.75494384765625, -2.587646484375, -2.42034912109375, -2.2530517578125, -2.08575439453125, -1.91845703125, -1.75115966796875, -1.5838623046875, -1.41656494140625, -1.249267578125, -1.08197021484375, -0.9146728515625, -0.74737548828125, -0.580078125, -0.41278076171875, -0.2454833984375, -0.07818603515625, 0.089111328125, 0.25640869140625, 0.4237060546875, 0.59100341796875, 0.75830078125, 0.92559814453125, 1.0928955078125, 1.26019287109375, 1.427490234375, 1.59478759765625, 1.7620849609375, 1.92938232421875, 2.0966796875, 2.26397705078125, 2.4312744140625, 2.59857177734375, 2.765869140625, 2.93316650390625, 3.1004638671875, 3.26776123046875, 3.43505859375, 3.60235595703125, 3.7696533203125, 3.93695068359375, 4.104248046875, 4.27154541015625, 4.4388427734375, 4.60614013671875, 4.7734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 9.0, 4.0, 15.0, 22.0, 39.0, 66.0, 125.0, 333.0, 203.0, 58.0, 36.0, 26.0, 12.0, 8.0, 12.0, 8.0, 9.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001201629638671875, -0.001156628131866455, -0.0011116266250610352, -0.0010666251182556152, -0.0010216236114501953, -0.0009766221046447754, -0.0009316205978393555, -0.0008866190910339355, -0.0008416175842285156, -0.0007966160774230957, -0.0007516145706176758, -0.0007066130638122559, -0.0006616115570068359, -0.000616610050201416, -0.0005716085433959961, -0.0005266070365905762, -0.00048160552978515625, -0.00043660402297973633, -0.0003916025161743164, -0.0003466010093688965, -0.00030159950256347656, -0.00025659799575805664, -0.00021159648895263672, -0.0001665949821472168, -0.00012159347534179688, -7.659196853637695e-05, -3.159046173095703e-05, 1.341104507446289e-05, 5.841255187988281e-05, 0.00010341405868530273, 0.00014841556549072266, 0.00019341707229614258, 0.0002384185791015625, 0.0002834200859069824, 0.00032842159271240234, 0.00037342309951782227, 0.0004184246063232422, 0.0004634261131286621, 0.000508427619934082, 0.000553429126739502, 0.0005984306335449219, 0.0006434321403503418, 0.0006884336471557617, 0.0007334351539611816, 0.0007784366607666016, 0.0008234381675720215, 0.0008684396743774414, 0.0009134411811828613, 0.0009584426879882812, 0.0010034441947937012, 0.001048445701599121, 0.001093447208404541, 0.001138448715209961, 0.0011834502220153809, 0.0012284517288208008, 0.0012734532356262207, 0.0013184547424316406, 0.0013634562492370605, 0.0014084577560424805, 0.0014534592628479004, 0.0014984607696533203, 0.0015434622764587402, 0.0015884637832641602, 0.00163346529006958, 0.001678466796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 15.0, 20.0, 33.0, 58.0, 126.0, 411.0, 1554.0, 8365.0, 104816.0, 886108.0, 40767.0, 4648.0, 1045.0, 296.0, 125.0, 56.0, 27.0, 18.0, 14.0, 6.0, 9.0, 4.0, 6.0, 4.0, 1.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.45977783203125, -4.3218994140625, -4.18402099609375, -4.046142578125, -3.90826416015625, -3.7703857421875, -3.63250732421875, -3.49462890625, -3.35675048828125, -3.2188720703125, -3.08099365234375, -2.943115234375, -2.80523681640625, -2.6673583984375, -2.52947998046875, -2.3916015625, -2.25372314453125, -2.1158447265625, -1.97796630859375, -1.840087890625, -1.70220947265625, -1.5643310546875, -1.42645263671875, -1.28857421875, -1.15069580078125, -1.0128173828125, -0.87493896484375, -0.737060546875, -0.59918212890625, -0.4613037109375, -0.32342529296875, -0.185546875, -0.04766845703125, 0.0902099609375, 0.22808837890625, 0.365966796875, 0.50384521484375, 0.6417236328125, 0.77960205078125, 0.91748046875, 1.05535888671875, 1.1932373046875, 1.33111572265625, 1.468994140625, 1.60687255859375, 1.7447509765625, 1.88262939453125, 2.0205078125, 2.15838623046875, 2.2962646484375, 2.43414306640625, 2.572021484375, 2.70989990234375, 2.8477783203125, 2.98565673828125, 3.12353515625, 3.26141357421875, 3.3992919921875, 3.53717041015625, 3.675048828125, 3.81292724609375, 3.9508056640625, 4.08868408203125, 4.2265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 4.0, 9.0, 15.0, 6.0, 12.0, 14.0, 27.0, 35.0, 29.0, 45.0, 62.0, 84.0, 107.0, 102.0, 90.0, 76.0, 47.0, 57.0, 24.0, 38.0, 23.0, 12.0, 14.0, 20.0, 8.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.054534912109375, -1.00946044921875, -0.964385986328125, -0.9193115234375, -0.874237060546875, -0.82916259765625, -0.784088134765625, -0.739013671875, -0.693939208984375, -0.64886474609375, -0.603790283203125, -0.5587158203125, -0.513641357421875, -0.46856689453125, -0.423492431640625, -0.37841796875, -0.333343505859375, -0.28826904296875, -0.243194580078125, -0.1981201171875, -0.153045654296875, -0.10797119140625, -0.062896728515625, -0.017822265625, 0.027252197265625, 0.07232666015625, 0.117401123046875, 0.1624755859375, 0.207550048828125, 0.25262451171875, 0.297698974609375, 0.3427734375, 0.387847900390625, 0.43292236328125, 0.477996826171875, 0.5230712890625, 0.568145751953125, 0.61322021484375, 0.658294677734375, 0.703369140625, 0.748443603515625, 0.79351806640625, 0.838592529296875, 0.8836669921875, 0.928741455078125, 0.97381591796875, 1.018890380859375, 1.06396484375, 1.109039306640625, 1.15411376953125, 1.199188232421875, 1.2442626953125, 1.289337158203125, 1.33441162109375, 1.379486083984375, 1.424560546875, 1.469635009765625, 1.51470947265625, 1.559783935546875, 1.6048583984375, 1.649932861328125, 1.69500732421875, 1.740081787109375, 1.78515625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 17.0, 29.0, 56.0, 110.0, 220.0, 236.0, 165.0, 74.0, 31.0, 18.0, 14.0, 2.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.573041915893555, -8.245044708251953, -7.917048454284668, -7.589051246643066, -7.261054515838623, -6.93305778503418, -6.605061054229736, -6.277064323425293, -5.949067115783691, -5.621070384979248, -5.293073654174805, -4.965076446533203, -4.63707971572876, -4.309082984924316, -3.981086254119873, -3.6530892848968506, -3.3250927925109863, -2.997096061706543, -2.6690990924835205, -2.341102361679077, -2.0131053924560547, -1.6851086616516113, -1.357111930847168, -1.0291149616241455, -0.7011182308197021, -0.3731214106082916, -0.045124590396881104, 0.28287220001220703, 0.6108690500259399, 0.9388659000396729, 1.2668626308441162, 1.5948596000671387, 1.922856330871582, 2.2508530616760254, 2.578850030899048, 2.906846761703491, 3.2348437309265137, 3.562840461730957, 3.8908371925354004, 4.218833923339844, 4.546831130981445, 4.874827861785889, 5.202824592590332, 5.530821800231934, 5.858818531036377, 6.18681526184082, 6.514811992645264, 6.842808723449707, 7.17080545425415, 7.498802185058594, 7.826798915863037, 8.15479564666748, 8.482792854309082, 8.810789108276367, 9.138786315917969, 9.46678352355957, 9.794779777526855, 10.122776985168457, 10.450773239135742, 10.778770446777344, 11.106766700744629, 11.43476390838623, 11.762760162353516, 12.090757369995117, 12.418754577636719]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 7.0, 15.0, 21.0, 26.0, 29.0, 44.0, 61.0, 65.0, 76.0, 81.0, 78.0, 79.0, 72.0, 70.0, 62.0, 58.0, 48.0, 35.0, 24.0, 13.0, 8.0, 3.0, 5.0, 1.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.116640090942383, -5.852290630340576, -5.5879411697387695, -5.323591709136963, -5.059242248535156, -4.79489278793335, -4.530543327331543, -4.266193866729736, -4.00184440612793, -3.737494945526123, -3.4731454849243164, -3.2087960243225098, -2.944446563720703, -2.6800971031188965, -2.41574764251709, -2.151398181915283, -1.8870487213134766, -1.62269926071167, -1.3583498001098633, -1.0940003395080566, -0.82965087890625, -0.5653014183044434, -0.3009519577026367, -0.03660249710083008, 0.22774696350097656, 0.4920964241027832, 0.7564458847045898, 1.0207953453063965, 1.2851448059082031, 1.5494942665100098, 1.8138437271118164, 2.078193187713623, 2.3425416946411133, 2.60689115524292, 2.8712406158447266, 3.135590076446533, 3.39993953704834, 3.6642889976501465, 3.928638458251953, 4.19298791885376, 4.457337379455566, 4.721686840057373, 4.98603630065918, 5.250385761260986, 5.514735221862793, 5.7790846824646, 6.043434143066406, 6.307783603668213, 6.5721330642700195, 6.836482524871826, 7.100831985473633, 7.3651814460754395, 7.629530906677246, 7.893880367279053, 8.15822982788086, 8.422578811645508, 8.686928749084473, 8.951278686523438, 9.215627670288086, 9.479976654052734, 9.7443265914917, 10.008676528930664, 10.273025512695312, 10.537374496459961, 10.801724433898926]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 1.0, 5.0, 4.0, 6.0, 8.0, 10.0, 13.0, 4.0, 14.0, 17.0, 14.0, 37.0, 73.0, 239.0, 1520.0, 852695.0, 3337756.0, 1456.0, 206.0, 44.0, 33.0, 21.0, 14.0, 17.0, 11.0, 15.0, 10.0, 5.0, 5.0, 5.0, 0.0, 10.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-22.59375, -22.0146484375, -21.435546875, -20.8564453125, -20.27734375, -19.6982421875, -19.119140625, -18.5400390625, -17.9609375, -17.3818359375, -16.802734375, -16.2236328125, -15.64453125, -15.0654296875, -14.486328125, -13.9072265625, -13.328125, -12.7490234375, -12.169921875, -11.5908203125, -11.01171875, -10.4326171875, -9.853515625, -9.2744140625, -8.6953125, -8.1162109375, -7.537109375, -6.9580078125, -6.37890625, -5.7998046875, -5.220703125, -4.6416015625, -4.0625, -3.4833984375, -2.904296875, -2.3251953125, -1.74609375, -1.1669921875, -0.587890625, -0.0087890625, 0.5703125, 1.1494140625, 1.728515625, 2.3076171875, 2.88671875, 3.4658203125, 4.044921875, 4.6240234375, 5.203125, 5.7822265625, 6.361328125, 6.9404296875, 7.51953125, 8.0986328125, 8.677734375, 9.2568359375, 9.8359375, 10.4150390625, 10.994140625, 11.5732421875, 12.15234375, 12.7314453125, 13.310546875, 13.8896484375, 14.46875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 4.0, 10.0, 8.0, 10.0, 22.0, 23.0, 29.0, 45.0, 51.0, 53.0, 67.0, 90.0, 91.0, 94.0, 88.0, 85.0, 63.0, 33.0, 26.0, 36.0, 16.0, 13.0, 14.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.166259765625, -0.161956787109375, -0.15765380859375, -0.153350830078125, -0.1490478515625, -0.144744873046875, -0.14044189453125, -0.136138916015625, -0.1318359375, -0.127532958984375, -0.12322998046875, -0.118927001953125, -0.1146240234375, -0.110321044921875, -0.10601806640625, -0.101715087890625, -0.097412109375, -0.093109130859375, -0.08880615234375, -0.084503173828125, -0.0802001953125, -0.075897216796875, -0.07159423828125, -0.067291259765625, -0.06298828125, -0.058685302734375, -0.05438232421875, -0.050079345703125, -0.0457763671875, -0.041473388671875, -0.03717041015625, -0.032867431640625, -0.028564453125, -0.024261474609375, -0.01995849609375, -0.015655517578125, -0.0113525390625, -0.007049560546875, -0.00274658203125, 0.001556396484375, 0.005859375, 0.010162353515625, 0.01446533203125, 0.018768310546875, 0.0230712890625, 0.027374267578125, 0.03167724609375, 0.035980224609375, 0.040283203125, 0.044586181640625, 0.04888916015625, 0.053192138671875, 0.0574951171875, 0.061798095703125, 0.06610107421875, 0.070404052734375, 0.07470703125, 0.079010009765625, 0.08331298828125, 0.087615966796875, 0.0919189453125, 0.096221923828125, 0.10052490234375, 0.104827880859375, 0.109130859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [7.0, 18.0, 106.0, 1297.0, 4191839.0, 915.0, 95.0, 19.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.11328125, -3.95623779296875, -2.7991943359375, -1.64215087890625, -0.485107421875, 0.67193603515625, 1.8289794921875, 2.98602294921875, 4.14306640625, 5.30010986328125, 6.4571533203125, 7.61419677734375, 8.771240234375, 9.92828369140625, 11.0853271484375, 12.24237060546875, 13.3994140625, 14.55645751953125, 15.7135009765625, 16.87054443359375, 18.027587890625, 19.18463134765625, 20.3416748046875, 21.49871826171875, 22.65576171875, 23.81280517578125, 24.9698486328125, 26.12689208984375, 27.283935546875, 28.44097900390625, 29.5980224609375, 30.75506591796875, 31.912109375, 33.06915283203125, 34.2261962890625, 35.38323974609375, 36.540283203125, 37.69732666015625, 38.8543701171875, 40.01141357421875, 41.16845703125, 42.32550048828125, 43.4825439453125, 44.63958740234375, 45.796630859375, 46.95367431640625, 48.1107177734375, 49.26776123046875, 50.4248046875, 51.58184814453125, 52.7388916015625, 53.89593505859375, 55.052978515625, 56.21002197265625, 57.3670654296875, 58.52410888671875, 59.68115234375, 60.83819580078125, 61.9952392578125, 63.15228271484375, 64.309326171875, 65.46636962890625, 66.6234130859375, 67.78045654296875, 68.9375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 13.0, 13.0, 16.0, 22.0, 82.0, 192.0, 1426.0, 1871.0, 295.0, 76.0, 33.0, 18.0, 13.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.3010673522949219, -0.27376556396484375, -0.24646377563476562, -0.2191619873046875, -0.19186019897460938, -0.16455841064453125, -0.13725662231445312, -0.109954833984375, -0.08265304565429688, -0.05535125732421875, -0.028049468994140625, -0.0007476806640625, 0.026554107666015625, 0.05385589599609375, 0.08115768432617188, 0.10845947265625, 0.13576126098632812, 0.16306304931640625, 0.19036483764648438, 0.2176666259765625, 0.24496841430664062, 0.27227020263671875, 0.2995719909667969, 0.326873779296875, 0.3541755676269531, 0.38147735595703125, 0.4087791442871094, 0.4360809326171875, 0.4633827209472656, 0.49068450927734375, 0.5179862976074219, 0.5452880859375, 0.5725898742675781, 0.5998916625976562, 0.6271934509277344, 0.6544952392578125, 0.6817970275878906, 0.7090988159179688, 0.7364006042480469, 0.763702392578125, 0.7910041809082031, 0.8183059692382812, 0.8456077575683594, 0.8729095458984375, 0.9002113342285156, 0.9275131225585938, 0.9548149108886719, 0.98211669921875, 1.0094184875488281, 1.0367202758789062, 1.0640220642089844, 1.0913238525390625, 1.1186256408691406, 1.1459274291992188, 1.1732292175292969, 1.200531005859375, 1.2278327941894531, 1.2551345825195312, 1.2824363708496094, 1.3097381591796875, 1.3370399475097656, 1.3643417358398438, 1.3916435241699219, 1.4189453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 25.0, 987.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.354900360107422, -25.362552642822266, -22.370203018188477, -19.377853393554688, -16.38550567626953, -13.393157005310059, -10.400808334350586, -7.408458709716797, -4.416110992431641, -1.423762321472168, 1.5685863494873047, 4.560935020446777, 7.55328369140625, 10.545632362365723, 13.537981033325195, 16.530330657958984, 19.52267837524414, 22.515026092529297, 25.507375717163086, 28.499725341796875, 31.49207305908203, 34.48442077636719, 37.476768493652344, 40.469120025634766, 43.46146774291992, 46.45381546020508, 49.4461669921875, 52.438514709472656, 55.43086242675781, 58.42321014404297, 61.415557861328125, 64.40791320800781, 67.40025329589844, 70.3926010131836, 73.38494873046875, 76.3772964477539, 79.36964416503906, 82.36199951171875, 85.3543472290039, 88.34669494628906, 91.33904266357422, 94.33139038085938, 97.32373809814453, 100.31608581542969, 103.30844116210938, 106.30078887939453, 109.29313659667969, 112.28548431396484, 115.27783203125, 118.27017974853516, 121.26252746582031, 124.25487518310547, 127.24722290039062, 130.2395782470703, 133.23191833496094, 136.22427368164062, 139.21661376953125, 142.20896911621094, 145.20130920410156, 148.19366455078125, 151.18600463867188, 154.17835998535156, 157.1707000732422, 160.16305541992188, 163.15541076660156]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 13.0, 30.0, 70.0, 133.0, 201.0, 213.0, 162.0, 103.0, 49.0, 21.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.317737102508545, -6.781598091125488, -6.245459079742432, -5.709320068359375, -5.173181056976318, -4.637042045593262, -4.100903034210205, -3.5647640228271484, -3.028625011444092, -2.492486000061035, -1.9563469886779785, -1.4202079772949219, -0.8840689659118652, -0.3479299545288086, 0.18820905685424805, 0.7243480682373047, 1.2604870796203613, 1.796626091003418, 2.3327651023864746, 2.8689041137695312, 3.405043125152588, 3.9411821365356445, 4.477321147918701, 5.013460159301758, 5.5495991706848145, 6.085738182067871, 6.621877193450928, 7.158016204833984, 7.694155216217041, 8.230294227600098, 8.766433715820312, 9.302572250366211, 9.83871078491211, 10.374849319458008, 10.910988807678223, 11.447128295898438, 11.983266830444336, 12.519405364990234, 13.05554485321045, 13.591684341430664, 14.127822875976562, 14.663961410522461, 15.200100898742676, 15.73624038696289, 16.27237892150879, 16.808517456054688, 17.34465789794922, 17.880796432495117, 18.416934967041016, 18.953073501586914, 19.489212036132812, 20.025352478027344, 20.561491012573242, 21.09762954711914, 21.633769989013672, 22.16990852355957, 22.70604705810547, 23.242185592651367, 23.778324127197266, 24.314464569091797, 24.850603103637695, 25.386741638183594, 25.922882080078125, 26.459020614624023, 26.995159149169922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 7.0, 5.0, 12.0, 6.0, 20.0, 25.0, 19.0, 23.0, 34.0, 35.0, 40.0, 49.0, 63.0, 47.0, 232.0, 1033691.0, 13796.0, 62.0, 61.0, 56.0, 41.0, 33.0, 36.0, 28.0, 17.0, 18.0, 21.0, 16.0, 8.0, 10.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.15625, -26.1025390625, -25.048828125, -23.9951171875, -22.94140625, -21.8876953125, -20.833984375, -19.7802734375, -18.7265625, -17.6728515625, -16.619140625, -15.5654296875, -14.51171875, -13.4580078125, -12.404296875, -11.3505859375, -10.296875, -9.2431640625, -8.189453125, -7.1357421875, -6.08203125, -5.0283203125, -3.974609375, -2.9208984375, -1.8671875, -0.8134765625, 0.240234375, 1.2939453125, 2.34765625, 3.4013671875, 4.455078125, 5.5087890625, 6.5625, 7.6162109375, 8.669921875, 9.7236328125, 10.77734375, 11.8310546875, 12.884765625, 13.9384765625, 14.9921875, 16.0458984375, 17.099609375, 18.1533203125, 19.20703125, 20.2607421875, 21.314453125, 22.3681640625, 23.421875, 24.4755859375, 25.529296875, 26.5830078125, 27.63671875, 28.6904296875, 29.744140625, 30.7978515625, 31.8515625, 32.9052734375, 33.958984375, 35.0126953125, 36.06640625, 37.1201171875, 38.173828125, 39.2275390625, 40.28125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 21.0, 199.0, 650.0, 139.0, 10.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.2534675598144531, -0.15073394775390625, -0.048000335693359375, 0.0547332763671875, 0.15746688842773438, 0.26020050048828125, 0.3629341125488281, 0.465667724609375, 0.5684013366699219, 0.6711349487304688, 0.7738685607910156, 0.8766021728515625, 0.9793357849121094, 1.0820693969726562, 1.1848030090332031, 1.28753662109375, 1.3902702331542969, 1.4930038452148438, 1.5957374572753906, 1.6984710693359375, 1.8012046813964844, 1.9039382934570312, 2.006671905517578, 2.109405517578125, 2.212139129638672, 2.3148727416992188, 2.4176063537597656, 2.5203399658203125, 2.6230735778808594, 2.7258071899414062, 2.828540802001953, 2.9312744140625, 3.034008026123047, 3.1367416381835938, 3.2394752502441406, 3.3422088623046875, 3.4449424743652344, 3.5476760864257812, 3.650409698486328, 3.753143310546875, 3.855876922607422, 3.9586105346679688, 4.061344146728516, 4.1640777587890625, 4.266811370849609, 4.369544982910156, 4.472278594970703, 4.57501220703125, 4.677745819091797, 4.780479431152344, 4.883213043212891, 4.9859466552734375, 5.088680267333984, 5.191413879394531, 5.294147491455078, 5.396881103515625, 5.499614715576172, 5.602348327636719, 5.705081939697266, 5.8078155517578125, 5.910549163818359, 6.013282775878906, 6.116016387939453, 6.21875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 7.0, 9.0, 9.0, 14.0, 19.0, 23.0, 28.0, 43.0, 51.0, 81.0, 116.0, 144.0, 234.0, 409.0, 679.0, 1189.0, 2437.0, 5390.0, 14163.0, 43584.0, 205735.0, 608361.0, 117077.0, 29538.0, 10362.0, 4252.0, 1990.0, 978.0, 546.0, 346.0, 193.0, 147.0, 104.0, 72.0, 60.0, 29.0, 26.0, 33.0, 20.0, 19.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.15625, -4.996826171875, -4.83740234375, -4.677978515625, -4.5185546875, -4.359130859375, -4.19970703125, -4.040283203125, -3.880859375, -3.721435546875, -3.56201171875, -3.402587890625, -3.2431640625, -3.083740234375, -2.92431640625, -2.764892578125, -2.60546875, -2.446044921875, -2.28662109375, -2.127197265625, -1.9677734375, -1.808349609375, -1.64892578125, -1.489501953125, -1.330078125, -1.170654296875, -1.01123046875, -0.851806640625, -0.6923828125, -0.532958984375, -0.37353515625, -0.214111328125, -0.0546875, 0.104736328125, 0.26416015625, 0.423583984375, 0.5830078125, 0.742431640625, 0.90185546875, 1.061279296875, 1.220703125, 1.380126953125, 1.53955078125, 1.698974609375, 1.8583984375, 2.017822265625, 2.17724609375, 2.336669921875, 2.49609375, 2.655517578125, 2.81494140625, 2.974365234375, 3.1337890625, 3.293212890625, 3.45263671875, 3.612060546875, 3.771484375, 3.930908203125, 4.09033203125, 4.249755859375, 4.4091796875, 4.568603515625, 4.72802734375, 4.887451171875, 5.046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 4.0, 7.0, 9.0, 7.0, 14.0, 13.0, 20.0, 26.0, 22.0, 42.0, 27.0, 47.0, 64.0, 80.0, 66.0, 79.0, 52.0, 74.0, 58.0, 62.0, 45.0, 36.0, 32.0, 31.0, 9.0, 14.0, 14.0, 12.0, 9.0, 13.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.1221923828125, -4.974853515625, -4.8275146484375, -4.68017578125, -4.5328369140625, -4.385498046875, -4.2381591796875, -4.0908203125, -3.9434814453125, -3.796142578125, -3.6488037109375, -3.50146484375, -3.3541259765625, -3.206787109375, -3.0594482421875, -2.912109375, -2.7647705078125, -2.617431640625, -2.4700927734375, -2.32275390625, -2.1754150390625, -2.028076171875, -1.8807373046875, -1.7333984375, -1.5860595703125, -1.438720703125, -1.2913818359375, -1.14404296875, -0.9967041015625, -0.849365234375, -0.7020263671875, -0.5546875, -0.4073486328125, -0.260009765625, -0.1126708984375, 0.03466796875, 0.1820068359375, 0.329345703125, 0.4766845703125, 0.6240234375, 0.7713623046875, 0.918701171875, 1.0660400390625, 1.21337890625, 1.3607177734375, 1.508056640625, 1.6553955078125, 1.802734375, 1.9500732421875, 2.097412109375, 2.2447509765625, 2.39208984375, 2.5394287109375, 2.686767578125, 2.8341064453125, 2.9814453125, 3.1287841796875, 3.276123046875, 3.4234619140625, 3.57080078125, 3.7181396484375, 3.865478515625, 4.0128173828125, 4.16015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 2.0, 9.0, 4.0, 11.0, 15.0, 17.0, 22.0, 35.0, 64.0, 104.0, 176.0, 398.0, 840.0, 2356.0, 8967.0, 58366.0, 809017.0, 147444.0, 15055.0, 3388.0, 1152.0, 477.0, 248.0, 133.0, 84.0, 39.0, 33.0, 26.0, 22.0, 7.0, 12.0, 5.0, 7.0, 4.0, 3.0, 0.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.98046875, -6.7528076171875, -6.525146484375, -6.2974853515625, -6.06982421875, -5.8421630859375, -5.614501953125, -5.3868408203125, -5.1591796875, -4.9315185546875, -4.703857421875, -4.4761962890625, -4.24853515625, -4.0208740234375, -3.793212890625, -3.5655517578125, -3.337890625, -3.1102294921875, -2.882568359375, -2.6549072265625, -2.42724609375, -2.1995849609375, -1.971923828125, -1.7442626953125, -1.5166015625, -1.2889404296875, -1.061279296875, -0.8336181640625, -0.60595703125, -0.3782958984375, -0.150634765625, 0.0770263671875, 0.3046875, 0.5323486328125, 0.760009765625, 0.9876708984375, 1.21533203125, 1.4429931640625, 1.670654296875, 1.8983154296875, 2.1259765625, 2.3536376953125, 2.581298828125, 2.8089599609375, 3.03662109375, 3.2642822265625, 3.491943359375, 3.7196044921875, 3.947265625, 4.1749267578125, 4.402587890625, 4.6302490234375, 4.85791015625, 5.0855712890625, 5.313232421875, 5.5408935546875, 5.7685546875, 5.9962158203125, 6.223876953125, 6.4515380859375, 6.67919921875, 6.9068603515625, 7.134521484375, 7.3621826171875, 7.58984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 2.0, 6.0, 5.0, 9.0, 12.0, 26.0, 28.0, 47.0, 79.0, 148.0, 172.0, 163.0, 118.0, 67.0, 32.0, 32.0, 16.0, 10.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009374618530273438, -0.0009087696671485901, -0.0008800774812698364, -0.0008513852953910828, -0.0008226931095123291, -0.0007940009236335754, -0.0007653087377548218, -0.0007366165518760681, -0.0007079243659973145, -0.0006792321801185608, -0.0006505399942398071, -0.0006218478083610535, -0.0005931556224822998, -0.0005644634366035461, -0.0005357712507247925, -0.0005070790648460388, -0.00047838687896728516, -0.0004496946930885315, -0.00042100250720977783, -0.00039231032133102417, -0.0003636181354522705, -0.00033492594957351685, -0.0003062337636947632, -0.0002775415778160095, -0.00024884939193725586, -0.0002201572060585022, -0.00019146502017974854, -0.00016277283430099487, -0.0001340806484222412, -0.00010538846254348755, -7.669627666473389e-05, -4.8004090785980225e-05, -1.9311904907226562e-05, 9.3802809715271e-06, 3.807246685028076e-05, 6.676465272903442e-05, 9.545683860778809e-05, 0.00012414902448654175, 0.0001528412103652954, 0.00018153339624404907, 0.00021022558212280273, 0.0002389177680015564, 0.00026760995388031006, 0.0002963021397590637, 0.0003249943256378174, 0.00035368651151657104, 0.0003823786973953247, 0.00041107088327407837, 0.00043976306915283203, 0.0004684552550315857, 0.0004971474409103394, 0.000525839626789093, 0.0005545318126678467, 0.0005832239985466003, 0.000611916184425354, 0.0006406083703041077, 0.0006693005561828613, 0.000697992742061615, 0.0007266849279403687, 0.0007553771138191223, 0.000784069299697876, 0.0008127614855766296, 0.0008414536714553833, 0.000870145857334137, 0.0008988380432128906]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 5.0, 9.0, 22.0, 18.0, 29.0, 47.0, 87.0, 121.0, 261.0, 550.0, 1578.0, 5852.0, 53876.0, 938453.0, 40440.0, 4943.0, 1290.0, 510.0, 179.0, 109.0, 64.0, 33.0, 36.0, 14.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3046875, -12.85302734375, -12.4013671875, -11.94970703125, -11.498046875, -11.04638671875, -10.5947265625, -10.14306640625, -9.69140625, -9.23974609375, -8.7880859375, -8.33642578125, -7.884765625, -7.43310546875, -6.9814453125, -6.52978515625, -6.078125, -5.62646484375, -5.1748046875, -4.72314453125, -4.271484375, -3.81982421875, -3.3681640625, -2.91650390625, -2.46484375, -2.01318359375, -1.5615234375, -1.10986328125, -0.658203125, -0.20654296875, 0.2451171875, 0.69677734375, 1.1484375, 1.60009765625, 2.0517578125, 2.50341796875, 2.955078125, 3.40673828125, 3.8583984375, 4.31005859375, 4.76171875, 5.21337890625, 5.6650390625, 6.11669921875, 6.568359375, 7.02001953125, 7.4716796875, 7.92333984375, 8.375, 8.82666015625, 9.2783203125, 9.72998046875, 10.181640625, 10.63330078125, 11.0849609375, 11.53662109375, 11.98828125, 12.43994140625, 12.8916015625, 13.34326171875, 13.794921875, 14.24658203125, 14.6982421875, 15.14990234375, 15.6015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 6.0, 6.0, 15.0, 25.0, 46.0, 100.0, 219.0, 247.0, 157.0, 82.0, 26.0, 11.0, 14.0, 15.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6484375, -9.4091796875, -9.169921875, -8.9306640625, -8.69140625, -8.4521484375, -8.212890625, -7.9736328125, -7.734375, -7.4951171875, -7.255859375, -7.0166015625, -6.77734375, -6.5380859375, -6.298828125, -6.0595703125, -5.8203125, -5.5810546875, -5.341796875, -5.1025390625, -4.86328125, -4.6240234375, -4.384765625, -4.1455078125, -3.90625, -3.6669921875, -3.427734375, -3.1884765625, -2.94921875, -2.7099609375, -2.470703125, -2.2314453125, -1.9921875, -1.7529296875, -1.513671875, -1.2744140625, -1.03515625, -0.7958984375, -0.556640625, -0.3173828125, -0.078125, 0.1611328125, 0.400390625, 0.6396484375, 0.87890625, 1.1181640625, 1.357421875, 1.5966796875, 1.8359375, 2.0751953125, 2.314453125, 2.5537109375, 2.79296875, 3.0322265625, 3.271484375, 3.5107421875, 3.75, 3.9892578125, 4.228515625, 4.4677734375, 4.70703125, 4.9462890625, 5.185546875, 5.4248046875, 5.6640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 20.0, 435.0, 555.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.96212768554688, -70.01885986328125, -60.075584411621094, -50.1323127746582, -40.18904113769531, -30.245769500732422, -20.30249786376953, -10.359222412109375, -0.41595458984375, 9.52731704711914, 19.47058868408203, 29.413860321044922, 39.35713195800781, 49.3004035949707, 59.243675231933594, 69.18695068359375, 79.13021850585938, 89.073486328125, 99.01676177978516, 108.96003723144531, 118.90330505371094, 128.84657287597656, 138.78985595703125, 148.73312377929688, 158.6763916015625, 168.61965942382812, 178.56292724609375, 188.50621032714844, 198.44947814941406, 208.3927459716797, 218.33602905273438, 228.279296875, 238.2225341796875, 248.16580200195312, 258.10906982421875, 268.0523376464844, 277.99560546875, 287.93890380859375, 297.8821716308594, 307.825439453125, 317.7687072753906, 327.71197509765625, 337.6552429199219, 347.5985107421875, 357.54180908203125, 367.4850769042969, 377.4283447265625, 387.3716125488281, 397.31488037109375, 407.2581481933594, 417.201416015625, 427.1446838378906, 437.08795166015625, 447.03125, 456.9745178222656, 466.91778564453125, 476.8610534667969, 486.8043212890625, 496.7475891113281, 506.69085693359375, 516.6341552734375, 526.577392578125, 536.5206909179688, 546.4639892578125, 556.4072265625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 10.0, 10.0, 28.0, 26.0, 30.0, 45.0, 81.0, 80.0, 91.0, 114.0, 104.0, 92.0, 75.0, 52.0, 55.0, 52.0, 25.0, 13.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.575244903564453, -22.17174530029297, -20.768245697021484, -19.36474609375, -17.961246490478516, -16.55774688720703, -15.15424919128418, -13.750749588012695, -12.347249984741211, -10.943750381469727, -9.540250778198242, -8.136752128601074, -6.73325252532959, -5.3297529220581055, -3.9262542724609375, -2.522754669189453, -1.1192550659179688, 0.2842442989349365, 1.6877436637878418, 3.091242790222168, 4.494742393493652, 5.898241996765137, 7.301740646362305, 8.705240249633789, 10.108739852905273, 11.512239456176758, 12.915739059448242, 14.31923770904541, 15.722737312316895, 17.126235961914062, 18.529735565185547, 19.93323516845703, 21.33673095703125, 22.740230560302734, 24.14373016357422, 25.547229766845703, 26.950729370117188, 28.354228973388672, 29.757726669311523, 31.161226272583008, 32.564727783203125, 33.96822738647461, 35.371726989746094, 36.77522659301758, 38.17872619628906, 39.58222579956055, 40.98572540283203, 42.38922119140625, 43.792720794677734, 45.19622039794922, 46.5997200012207, 48.00321960449219, 49.40671920776367, 50.810218811035156, 52.213714599609375, 53.617218017578125, 55.020713806152344, 56.42421340942383, 57.82771301269531, 59.2312126159668, 60.63471221923828, 62.038211822509766, 63.44171142578125, 64.84520721435547, 66.24871063232422]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 64.0, 1135.0, 4191979.0, 681.0, 205.0, 115.0, 52.0, 25.0, 17.0, 7.0, 9.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -11.6982421875, -6.583984375, -1.4697265625, 3.64453125, 8.7587890625, 13.873046875, 18.9873046875, 24.1015625, 29.2158203125, 34.330078125, 39.4443359375, 44.55859375, 49.6728515625, 54.787109375, 59.9013671875, 65.015625, 70.1298828125, 75.244140625, 80.3583984375, 85.47265625, 90.5869140625, 95.701171875, 100.8154296875, 105.9296875, 111.0439453125, 116.158203125, 121.2724609375, 126.38671875, 131.5009765625, 136.615234375, 141.7294921875, 146.84375, 151.9580078125, 157.072265625, 162.1865234375, 167.30078125, 172.4150390625, 177.529296875, 182.6435546875, 187.7578125, 192.8720703125, 197.986328125, 203.1005859375, 208.21484375, 213.3291015625, 218.443359375, 223.5576171875, 228.671875, 233.7861328125, 238.900390625, 244.0146484375, 249.12890625, 254.2431640625, 259.357421875, 264.4716796875, 269.5859375, 274.7001953125, 279.814453125, 284.9287109375, 290.04296875, 295.1572265625, 300.271484375, 305.3857421875, 310.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 13.0, 98.0, 334.0, 414.0, 134.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.396026611328125, -0.27056884765625, -0.145111083984375, -0.0196533203125, 0.105804443359375, 0.23126220703125, 0.356719970703125, 0.482177734375, 0.607635498046875, 0.73309326171875, 0.858551025390625, 0.9840087890625, 1.109466552734375, 1.23492431640625, 1.360382080078125, 1.48583984375, 1.611297607421875, 1.73675537109375, 1.862213134765625, 1.9876708984375, 2.113128662109375, 2.23858642578125, 2.364044189453125, 2.489501953125, 2.614959716796875, 2.74041748046875, 2.865875244140625, 2.9913330078125, 3.116790771484375, 3.24224853515625, 3.367706298828125, 3.4931640625, 3.618621826171875, 3.74407958984375, 3.869537353515625, 3.9949951171875, 4.120452880859375, 4.24591064453125, 4.371368408203125, 4.496826171875, 4.622283935546875, 4.74774169921875, 4.873199462890625, 4.9986572265625, 5.124114990234375, 5.24957275390625, 5.375030517578125, 5.50048828125, 5.625946044921875, 5.75140380859375, 5.876861572265625, 6.0023193359375, 6.127777099609375, 6.25323486328125, 6.378692626953125, 6.504150390625, 6.629608154296875, 6.75506591796875, 6.880523681640625, 7.0059814453125, 7.131439208984375, 7.25689697265625, 7.382354736328125, 7.5078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 26.0, 53.0, 128.0, 416.0, 4322.0, 4174386.0, 13628.0, 851.0, 291.0, 124.0, 40.0, 11.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -30.48291015625, -27.8720703125, -25.26123046875, -22.650390625, -20.03955078125, -17.4287109375, -14.81787109375, -12.20703125, -9.59619140625, -6.9853515625, -4.37451171875, -1.763671875, 0.84716796875, 3.4580078125, 6.06884765625, 8.6796875, 11.29052734375, 13.9013671875, 16.51220703125, 19.123046875, 21.73388671875, 24.3447265625, 26.95556640625, 29.56640625, 32.17724609375, 34.7880859375, 37.39892578125, 40.009765625, 42.62060546875, 45.2314453125, 47.84228515625, 50.453125, 53.06396484375, 55.6748046875, 58.28564453125, 60.896484375, 63.50732421875, 66.1181640625, 68.72900390625, 71.33984375, 73.95068359375, 76.5615234375, 79.17236328125, 81.783203125, 84.39404296875, 87.0048828125, 89.61572265625, 92.2265625, 94.83740234375, 97.4482421875, 100.05908203125, 102.669921875, 105.28076171875, 107.8916015625, 110.50244140625, 113.11328125, 115.72412109375, 118.3349609375, 120.94580078125, 123.556640625, 126.16748046875, 128.7783203125, 131.38916015625, 134.0]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 10.0, 21.0, 44.0, 99.0, 445.0, 3196.0, 198.0, 33.0, 9.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69140625, -4.44842529296875, -4.2054443359375, -3.96246337890625, -3.719482421875, -3.47650146484375, -3.2335205078125, -2.99053955078125, -2.74755859375, -2.50457763671875, -2.2615966796875, -2.01861572265625, -1.775634765625, -1.53265380859375, -1.2896728515625, -1.04669189453125, -0.8037109375, -0.56072998046875, -0.3177490234375, -0.07476806640625, 0.168212890625, 0.41119384765625, 0.6541748046875, 0.89715576171875, 1.14013671875, 1.38311767578125, 1.6260986328125, 1.86907958984375, 2.112060546875, 2.35504150390625, 2.5980224609375, 2.84100341796875, 3.083984375, 3.32696533203125, 3.5699462890625, 3.81292724609375, 4.055908203125, 4.29888916015625, 4.5418701171875, 4.78485107421875, 5.02783203125, 5.27081298828125, 5.5137939453125, 5.75677490234375, 5.999755859375, 6.24273681640625, 6.4857177734375, 6.72869873046875, 6.9716796875, 7.21466064453125, 7.4576416015625, 7.70062255859375, 7.943603515625, 8.18658447265625, 8.4295654296875, 8.67254638671875, 8.91552734375, 9.15850830078125, 9.4014892578125, 9.64447021484375, 9.887451171875, 10.13043212890625, 10.3734130859375, 10.61639404296875, 10.859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 14.0, 257.0, 710.0, 25.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-126.69851684570312, -122.35978698730469, -118.02105712890625, -113.68233489990234, -109.3436050415039, -105.00487518310547, -100.66615295410156, -96.32742309570312, -91.98869323730469, -87.64996337890625, -83.31123352050781, -78.9725112915039, -74.63378143310547, -70.29505157470703, -65.95632934570312, -61.61759948730469, -57.27886962890625, -52.94013977050781, -48.60141372680664, -44.26268768310547, -39.92395782470703, -35.585227966308594, -31.246501922607422, -26.907773971557617, -22.569046020507812, -18.230318069458008, -13.891590118408203, -9.552862167358398, -5.214134216308594, -0.8754062652587891, 3.4633216857910156, 7.80204963684082, 12.140792846679688, 16.479520797729492, 20.818248748779297, 25.1569766998291, 29.495704650878906, 33.834434509277344, 38.173160552978516, 42.51188659667969, 46.850616455078125, 51.18934631347656, 55.528072357177734, 59.866798400878906, 64.20552825927734, 68.54425811767578, 72.88298034667969, 77.22171020507812, 81.56044006347656, 85.899169921875, 90.23789978027344, 94.57662200927734, 98.91535186767578, 103.25408172607422, 107.59280395507812, 111.93153381347656, 116.270263671875, 120.60899353027344, 124.94772338867188, 129.2864532470703, 133.62518310546875, 137.96389770507812, 142.30262756347656, 146.641357421875, 150.98008728027344]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 13.0, 29.0, 26.0, 62.0, 84.0, 122.0, 124.0, 121.0, 130.0, 93.0, 71.0, 55.0, 35.0, 18.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.66246795654297, -46.25364303588867, -44.84481430053711, -43.43598937988281, -42.02716064453125, -40.61833572387695, -39.209510803222656, -37.800682067871094, -36.3918571472168, -34.9830322265625, -33.57420349121094, -32.16537857055664, -30.75655174255371, -29.34772491455078, -27.938899993896484, -26.530073165893555, -25.121246337890625, -23.712419509887695, -22.303592681884766, -20.89476776123047, -19.48594093322754, -18.07711410522461, -16.668289184570312, -15.259462356567383, -13.850635528564453, -12.441808700561523, -11.03298282623291, -9.624156951904297, -8.215330123901367, -6.806503772735596, -5.397677421569824, -3.988851547241211, -2.5800247192382812, -1.1711983680725098, 0.23762798309326172, 1.6464543342590332, 3.0552806854248047, 4.464107036590576, 5.872933387756348, 7.281759262084961, 8.69058609008789, 10.09941291809082, 11.508238792419434, 12.917064666748047, 14.325891494750977, 15.734718322753906, 17.143543243408203, 18.552370071411133, 19.961196899414062, 21.370023727416992, 22.778850555419922, 24.18767547607422, 25.59650230407715, 27.005329132080078, 28.414154052734375, 29.822980880737305, 31.231807708740234, 32.64063262939453, 34.049461364746094, 35.45828628540039, 36.86711120605469, 38.27593994140625, 39.68476486206055, 41.093589782714844, 42.502418518066406]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 12.0, 14.0, 15.0, 23.0, 36.0, 41.0, 58.0, 103.0, 208.0, 688.0, 5887.0, 732693.0, 303846.0, 3875.0, 531.0, 196.0, 86.0, 51.0, 46.0, 26.0, 33.0, 20.0, 10.0, 6.0, 10.0, 3.0, 3.0, 7.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.234375, -24.297119140625, -23.35986328125, -22.422607421875, -21.4853515625, -20.548095703125, -19.61083984375, -18.673583984375, -17.736328125, -16.799072265625, -15.86181640625, -14.924560546875, -13.9873046875, -13.050048828125, -12.11279296875, -11.175537109375, -10.23828125, -9.301025390625, -8.36376953125, -7.426513671875, -6.4892578125, -5.552001953125, -4.61474609375, -3.677490234375, -2.740234375, -1.802978515625, -0.86572265625, 0.071533203125, 1.0087890625, 1.946044921875, 2.88330078125, 3.820556640625, 4.7578125, 5.695068359375, 6.63232421875, 7.569580078125, 8.5068359375, 9.444091796875, 10.38134765625, 11.318603515625, 12.255859375, 13.193115234375, 14.13037109375, 15.067626953125, 16.0048828125, 16.942138671875, 17.87939453125, 18.816650390625, 19.75390625, 20.691162109375, 21.62841796875, 22.565673828125, 23.5029296875, 24.440185546875, 25.37744140625, 26.314697265625, 27.251953125, 28.189208984375, 29.12646484375, 30.063720703125, 31.0009765625, 31.938232421875, 32.87548828125, 33.812744140625, 34.75]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 33.0, 83.0, 191.0, 282.0, 205.0, 133.0, 51.0, 13.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.348663330078125, -2.19927978515625, -2.049896240234375, -1.9005126953125, -1.751129150390625, -1.60174560546875, -1.452362060546875, -1.302978515625, -1.153594970703125, -1.00421142578125, -0.854827880859375, -0.7054443359375, -0.556060791015625, -0.40667724609375, -0.257293701171875, -0.10791015625, 0.041473388671875, 0.19085693359375, 0.340240478515625, 0.4896240234375, 0.639007568359375, 0.78839111328125, 0.937774658203125, 1.087158203125, 1.236541748046875, 1.38592529296875, 1.535308837890625, 1.6846923828125, 1.834075927734375, 1.98345947265625, 2.132843017578125, 2.2822265625, 2.431610107421875, 2.58099365234375, 2.730377197265625, 2.8797607421875, 3.029144287109375, 3.17852783203125, 3.327911376953125, 3.477294921875, 3.626678466796875, 3.77606201171875, 3.925445556640625, 4.0748291015625, 4.224212646484375, 4.37359619140625, 4.522979736328125, 4.67236328125, 4.821746826171875, 4.97113037109375, 5.120513916015625, 5.2698974609375, 5.419281005859375, 5.56866455078125, 5.718048095703125, 5.867431640625, 6.016815185546875, 6.16619873046875, 6.315582275390625, 6.4649658203125, 6.614349365234375, 6.76373291015625, 6.913116455078125, 7.0625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 12.0, 17.0, 16.0, 41.0, 50.0, 103.0, 215.0, 514.0, 1677.0, 8825.0, 140447.0, 838393.0, 51208.0, 5003.0, 1159.0, 396.0, 176.0, 105.0, 53.0, 25.0, 22.0, 20.0, 14.0, 6.0, 11.0, 4.0, 3.0, 0.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.203125, -11.8138427734375, -11.424560546875, -11.0352783203125, -10.64599609375, -10.2567138671875, -9.867431640625, -9.4781494140625, -9.0888671875, -8.6995849609375, -8.310302734375, -7.9210205078125, -7.53173828125, -7.1424560546875, -6.753173828125, -6.3638916015625, -5.974609375, -5.5853271484375, -5.196044921875, -4.8067626953125, -4.41748046875, -4.0281982421875, -3.638916015625, -3.2496337890625, -2.8603515625, -2.4710693359375, -2.081787109375, -1.6925048828125, -1.30322265625, -0.9139404296875, -0.524658203125, -0.1353759765625, 0.25390625, 0.6431884765625, 1.032470703125, 1.4217529296875, 1.81103515625, 2.2003173828125, 2.589599609375, 2.9788818359375, 3.3681640625, 3.7574462890625, 4.146728515625, 4.5360107421875, 4.92529296875, 5.3145751953125, 5.703857421875, 6.0931396484375, 6.482421875, 6.8717041015625, 7.260986328125, 7.6502685546875, 8.03955078125, 8.4288330078125, 8.818115234375, 9.2073974609375, 9.5966796875, 9.9859619140625, 10.375244140625, 10.7645263671875, 11.15380859375, 11.5430908203125, 11.932373046875, 12.3216552734375, 12.7109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 8.0, 10.0, 10.0, 13.0, 14.0, 18.0, 28.0, 42.0, 36.0, 46.0, 55.0, 65.0, 81.0, 80.0, 63.0, 53.0, 51.0, 47.0, 55.0, 51.0, 40.0, 23.0, 27.0, 20.0, 11.0, 13.0, 11.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3984375, -5.20611572265625, -5.0137939453125, -4.82147216796875, -4.629150390625, -4.43682861328125, -4.2445068359375, -4.05218505859375, -3.85986328125, -3.66754150390625, -3.4752197265625, -3.28289794921875, -3.090576171875, -2.89825439453125, -2.7059326171875, -2.51361083984375, -2.3212890625, -2.12896728515625, -1.9366455078125, -1.74432373046875, -1.552001953125, -1.35968017578125, -1.1673583984375, -0.97503662109375, -0.78271484375, -0.59039306640625, -0.3980712890625, -0.20574951171875, -0.013427734375, 0.17889404296875, 0.3712158203125, 0.56353759765625, 0.755859375, 0.94818115234375, 1.1405029296875, 1.33282470703125, 1.525146484375, 1.71746826171875, 1.9097900390625, 2.10211181640625, 2.29443359375, 2.48675537109375, 2.6790771484375, 2.87139892578125, 3.063720703125, 3.25604248046875, 3.4483642578125, 3.64068603515625, 3.8330078125, 4.02532958984375, 4.2176513671875, 4.40997314453125, 4.602294921875, 4.79461669921875, 4.9869384765625, 5.17926025390625, 5.37158203125, 5.56390380859375, 5.7562255859375, 5.94854736328125, 6.140869140625, 6.33319091796875, 6.5255126953125, 6.71783447265625, 6.91015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 19.0, 16.0, 29.0, 48.0, 128.0, 310.0, 1058.0, 6425.0, 245905.0, 780795.0, 11520.0, 1561.0, 430.0, 164.0, 61.0, 35.0, 18.0, 7.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.3311767578125, -9.842041015625, -9.3529052734375, -8.86376953125, -8.3746337890625, -7.885498046875, -7.3963623046875, -6.9072265625, -6.4180908203125, -5.928955078125, -5.4398193359375, -4.95068359375, -4.4615478515625, -3.972412109375, -3.4832763671875, -2.994140625, -2.5050048828125, -2.015869140625, -1.5267333984375, -1.03759765625, -0.5484619140625, -0.059326171875, 0.4298095703125, 0.9189453125, 1.4080810546875, 1.897216796875, 2.3863525390625, 2.87548828125, 3.3646240234375, 3.853759765625, 4.3428955078125, 4.83203125, 5.3211669921875, 5.810302734375, 6.2994384765625, 6.78857421875, 7.2777099609375, 7.766845703125, 8.2559814453125, 8.7451171875, 9.2342529296875, 9.723388671875, 10.2125244140625, 10.70166015625, 11.1907958984375, 11.679931640625, 12.1690673828125, 12.658203125, 13.1473388671875, 13.636474609375, 14.1256103515625, 14.61474609375, 15.1038818359375, 15.593017578125, 16.0821533203125, 16.5712890625, 17.0604248046875, 17.549560546875, 18.0386962890625, 18.52783203125, 19.0169677734375, 19.506103515625, 19.9952392578125, 20.484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 11.0, 21.0, 29.0, 55.0, 102.0, 177.0, 231.0, 156.0, 100.0, 44.0, 24.0, 15.0, 7.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009379386901855469, -0.0008939877152442932, -0.0008500367403030396, -0.0008060857653617859, -0.0007621347904205322, -0.0007181838154792786, -0.0006742328405380249, -0.0006302818655967712, -0.0005863308906555176, -0.0005423799157142639, -0.0004984289407730103, -0.0004544779658317566, -0.00041052699089050293, -0.00036657601594924927, -0.0003226250410079956, -0.00027867406606674194, -0.00023472309112548828, -0.00019077211618423462, -0.00014682114124298096, -0.0001028701663017273, -5.891919136047363e-05, -1.496821641921997e-05, 2.898275852203369e-05, 7.293373346328735e-05, 0.00011688470840454102, 0.00016083568334579468, 0.00020478665828704834, 0.000248737633228302, 0.00029268860816955566, 0.0003366395831108093, 0.000380590558052063, 0.00042454153299331665, 0.0004684925079345703, 0.000512443482875824, 0.0005563944578170776, 0.0006003454327583313, 0.000644296407699585, 0.0006882473826408386, 0.0007321983575820923, 0.000776149332523346, 0.0008201003074645996, 0.0008640512824058533, 0.0009080022573471069, 0.0009519532322883606, 0.0009959042072296143, 0.001039855182170868, 0.0010838061571121216, 0.0011277571320533752, 0.001171708106994629, 0.0012156590819358826, 0.0012596100568771362, 0.00130356103181839, 0.0013475120067596436, 0.0013914629817008972, 0.0014354139566421509, 0.0014793649315834045, 0.0015233159065246582, 0.0015672668814659119, 0.0016112178564071655, 0.0016551688313484192, 0.0016991198062896729, 0.0017430707812309265, 0.0017870217561721802, 0.0018309727311134338, 0.0018749237060546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 9.0, 12.0, 25.0, 43.0, 77.0, 136.0, 288.0, 648.0, 2290.0, 12767.0, 222210.0, 764952.0, 38547.0, 4728.0, 1096.0, 348.0, 168.0, 83.0, 49.0, 27.0, 14.0, 12.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.1796875, -12.84375, -12.5078125, -12.171875, -11.8359375, -11.5, -11.1640625, -10.828125, -10.4921875, -10.15625, -9.8203125, -9.484375, -9.1484375, -8.8125, -8.4765625, -8.140625, -7.8046875, -7.46875, -7.1328125, -6.796875, -6.4609375, -6.125, -5.7890625, -5.453125, -5.1171875, -4.78125, -4.4453125, -4.109375, -3.7734375, -3.4375, -3.1015625, -2.765625, -2.4296875, -2.09375, -1.7578125, -1.421875, -1.0859375, -0.75, -0.4140625, -0.078125, 0.2578125, 0.59375, 0.9296875, 1.265625, 1.6015625, 1.9375, 2.2734375, 2.609375, 2.9453125, 3.28125, 3.6171875, 3.953125, 4.2890625, 4.625, 4.9609375, 5.296875, 5.6328125, 5.96875, 6.3046875, 6.640625, 6.9765625, 7.3125, 7.6484375, 7.984375, 8.3203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 9.0, 6.0, 7.0, 14.0, 19.0, 28.0, 42.0, 57.0, 85.0, 113.0, 125.0, 149.0, 119.0, 59.0, 55.0, 41.0, 24.0, 10.0, 7.0, 12.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.296875, -5.1453857421875, -4.993896484375, -4.8424072265625, -4.69091796875, -4.5394287109375, -4.387939453125, -4.2364501953125, -4.0849609375, -3.9334716796875, -3.781982421875, -3.6304931640625, -3.47900390625, -3.3275146484375, -3.176025390625, -3.0245361328125, -2.873046875, -2.7215576171875, -2.570068359375, -2.4185791015625, -2.26708984375, -2.1156005859375, -1.964111328125, -1.8126220703125, -1.6611328125, -1.5096435546875, -1.358154296875, -1.2066650390625, -1.05517578125, -0.9036865234375, -0.752197265625, -0.6007080078125, -0.44921875, -0.2977294921875, -0.146240234375, 0.0052490234375, 0.15673828125, 0.3082275390625, 0.459716796875, 0.6112060546875, 0.7626953125, 0.9141845703125, 1.065673828125, 1.2171630859375, 1.36865234375, 1.5201416015625, 1.671630859375, 1.8231201171875, 1.974609375, 2.1260986328125, 2.277587890625, 2.4290771484375, 2.58056640625, 2.7320556640625, 2.883544921875, 3.0350341796875, 3.1865234375, 3.3380126953125, 3.489501953125, 3.6409912109375, 3.79248046875, 3.9439697265625, 4.095458984375, 4.2469482421875, 4.3984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 11.0, 15.0, 29.0, 129.0, 494.0, 268.0, 59.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.02476501464844, -106.33174133300781, -102.63872528076172, -98.94570922851562, -95.252685546875, -91.55966186523438, -87.86664581298828, -84.17362976074219, -80.48060607910156, -76.78758239746094, -73.09456634521484, -69.40155029296875, -65.70852661132812, -62.015506744384766, -58.322486877441406, -54.62946701049805, -50.93644714355469, -47.24342727661133, -43.55040740966797, -39.85738754272461, -36.16436767578125, -32.47134780883789, -28.77832794189453, -25.085308074951172, -21.392288208007812, -17.699268341064453, -14.006248474121094, -10.313228607177734, -6.620208740234375, -2.9271888732910156, 0.7658309936523438, 4.458850860595703, 8.151878356933594, 11.844898223876953, 15.537918090820312, 19.230937957763672, 22.92395782470703, 26.61697769165039, 30.30999755859375, 34.00301742553711, 37.69603729248047, 41.38905715942383, 45.08207702636719, 48.77509689331055, 52.468116760253906, 56.161136627197266, 59.854156494140625, 63.547176361083984, 67.24019622802734, 70.93321228027344, 74.62623596191406, 78.31925964355469, 82.01227569580078, 85.70529174804688, 89.3983154296875, 93.09133911132812, 96.78435516357422, 100.47737121582031, 104.17039489746094, 107.86341857910156, 111.55643463134766, 115.24945068359375, 118.94247436523438, 122.635498046875, 126.3285140991211]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 11.0, 9.0, 21.0, 30.0, 25.0, 31.0, 43.0, 52.0, 45.0, 61.0, 58.0, 67.0, 56.0, 49.0, 60.0, 62.0, 67.0, 53.0, 33.0, 21.0, 33.0, 15.0, 25.0, 19.0, 9.0, 13.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.06242370605469, -35.8731575012207, -34.68389129638672, -33.494625091552734, -32.30535888671875, -31.1160945892334, -29.926830291748047, -28.737564086914062, -27.548297882080078, -26.359031677246094, -25.16976547241211, -23.980501174926758, -22.791234970092773, -21.60196876525879, -20.412704467773438, -19.223438262939453, -18.03417205810547, -16.844905853271484, -15.655640602111816, -14.466375350952148, -13.277109146118164, -12.08784294128418, -10.898577690124512, -9.709312438964844, -8.52004623413086, -7.330780506134033, -6.141514778137207, -4.952249050140381, -3.7629833221435547, -2.5737175941467285, -1.3844518661499023, -0.19518661499023438, 0.9940757751464844, 2.1833415031433105, 3.3726072311401367, 4.561872959136963, 5.751138687133789, 6.940404415130615, 8.129670143127441, 9.31893539428711, 10.508201599121094, 11.697467803955078, 12.886733055114746, 14.075998306274414, 15.265264511108398, 16.454530715942383, 17.643795013427734, 18.83306121826172, 20.022327423095703, 21.211593627929688, 22.400859832763672, 23.590124130249023, 24.779390335083008, 25.968656539916992, 27.157920837402344, 28.347187042236328, 29.536453247070312, 30.725719451904297, 31.91498565673828, 33.104251861572266, 34.29351806640625, 35.48278045654297, 36.67204666137695, 37.86131286621094, 39.05057907104492]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 8.0, 25.0, 57.0, 207.0, 805.0, 6051.0, 333684.0, 3840772.0, 10285.0, 1270.0, 383.0, 181.0, 121.0, 93.0, 71.0, 45.0, 38.0, 33.0, 32.0, 20.0, 15.0, 17.0, 11.0, 10.0, 10.0, 3.0, 6.0, 6.0, 7.0, 2.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -9.65966796875, -8.6005859375, -7.54150390625, -6.482421875, -5.42333984375, -4.3642578125, -3.30517578125, -2.24609375, -1.18701171875, -0.1279296875, 0.93115234375, 1.990234375, 3.04931640625, 4.1083984375, 5.16748046875, 6.2265625, 7.28564453125, 8.3447265625, 9.40380859375, 10.462890625, 11.52197265625, 12.5810546875, 13.64013671875, 14.69921875, 15.75830078125, 16.8173828125, 17.87646484375, 18.935546875, 19.99462890625, 21.0537109375, 22.11279296875, 23.171875, 24.23095703125, 25.2900390625, 26.34912109375, 27.408203125, 28.46728515625, 29.5263671875, 30.58544921875, 31.64453125, 32.70361328125, 33.7626953125, 34.82177734375, 35.880859375, 36.93994140625, 37.9990234375, 39.05810546875, 40.1171875, 41.17626953125, 42.2353515625, 43.29443359375, 44.353515625, 45.41259765625, 46.4716796875, 47.53076171875, 48.58984375, 49.64892578125, 50.7080078125, 51.76708984375, 52.826171875, 53.88525390625, 54.9443359375, 56.00341796875, 57.0625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 16.0, 49.0, 83.0, 209.0, 240.0, 215.0, 127.0, 47.0, 14.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.611328125, -1.460174560546875, -1.30902099609375, -1.157867431640625, -1.0067138671875, -0.855560302734375, -0.70440673828125, -0.553253173828125, -0.402099609375, -0.250946044921875, -0.09979248046875, 0.051361083984375, 0.2025146484375, 0.353668212890625, 0.50482177734375, 0.655975341796875, 0.80712890625, 0.958282470703125, 1.10943603515625, 1.260589599609375, 1.4117431640625, 1.562896728515625, 1.71405029296875, 1.865203857421875, 2.016357421875, 2.167510986328125, 2.31866455078125, 2.469818115234375, 2.6209716796875, 2.772125244140625, 2.92327880859375, 3.074432373046875, 3.2255859375, 3.376739501953125, 3.52789306640625, 3.679046630859375, 3.8302001953125, 3.981353759765625, 4.13250732421875, 4.283660888671875, 4.434814453125, 4.585968017578125, 4.73712158203125, 4.888275146484375, 5.0394287109375, 5.190582275390625, 5.34173583984375, 5.492889404296875, 5.64404296875, 5.795196533203125, 5.94635009765625, 6.097503662109375, 6.2486572265625, 6.399810791015625, 6.55096435546875, 6.702117919921875, 6.853271484375, 7.004425048828125, 7.15557861328125, 7.306732177734375, 7.4578857421875, 7.609039306640625, 7.76019287109375, 7.911346435546875, 8.0625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 15.0, 49.0, 99.0, 192.0, 778.0, 3892503.0, 298908.0, 1078.0, 332.0, 157.0, 96.0, 41.0, 17.0, 11.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.46875, -32.50244140625, -29.5361328125, -26.56982421875, -23.603515625, -20.63720703125, -17.6708984375, -14.70458984375, -11.73828125, -8.77197265625, -5.8056640625, -2.83935546875, 0.126953125, 3.09326171875, 6.0595703125, 9.02587890625, 11.9921875, 14.95849609375, 17.9248046875, 20.89111328125, 23.857421875, 26.82373046875, 29.7900390625, 32.75634765625, 35.72265625, 38.68896484375, 41.6552734375, 44.62158203125, 47.587890625, 50.55419921875, 53.5205078125, 56.48681640625, 59.453125, 62.41943359375, 65.3857421875, 68.35205078125, 71.318359375, 74.28466796875, 77.2509765625, 80.21728515625, 83.18359375, 86.14990234375, 89.1162109375, 92.08251953125, 95.048828125, 98.01513671875, 100.9814453125, 103.94775390625, 106.9140625, 109.88037109375, 112.8466796875, 115.81298828125, 118.779296875, 121.74560546875, 124.7119140625, 127.67822265625, 130.64453125, 133.61083984375, 136.5771484375, 139.54345703125, 142.509765625, 145.47607421875, 148.4423828125, 151.40869140625, 154.375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 14.0, 34.0, 77.0, 546.0, 3122.0, 229.0, 28.0, 11.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.16754150390625, -1.8702392578125, -1.57293701171875, -1.275634765625, -0.97833251953125, -0.6810302734375, -0.38372802734375, -0.08642578125, 0.21087646484375, 0.5081787109375, 0.80548095703125, 1.102783203125, 1.40008544921875, 1.6973876953125, 1.99468994140625, 2.2919921875, 2.58929443359375, 2.8865966796875, 3.18389892578125, 3.481201171875, 3.77850341796875, 4.0758056640625, 4.37310791015625, 4.67041015625, 4.96771240234375, 5.2650146484375, 5.56231689453125, 5.859619140625, 6.15692138671875, 6.4542236328125, 6.75152587890625, 7.048828125, 7.34613037109375, 7.6434326171875, 7.94073486328125, 8.238037109375, 8.53533935546875, 8.8326416015625, 9.12994384765625, 9.42724609375, 9.72454833984375, 10.0218505859375, 10.31915283203125, 10.616455078125, 10.91375732421875, 11.2110595703125, 11.50836181640625, 11.8056640625, 12.10296630859375, 12.4002685546875, 12.69757080078125, 12.994873046875, 13.29217529296875, 13.5894775390625, 13.88677978515625, 14.18408203125, 14.48138427734375, 14.7786865234375, 15.07598876953125, 15.373291015625, 15.67059326171875, 15.9678955078125, 16.26519775390625, 16.5625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 26.0, 337.0, 529.0, 74.0, 25.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.65919494628906, -71.03740692138672, -68.41561889648438, -65.79383087158203, -63.17204284667969, -60.550254821777344, -57.928462982177734, -55.30667495727539, -52.68488693237305, -50.0630989074707, -47.44131088256836, -44.819522857666016, -42.197731018066406, -39.57594299316406, -36.95415496826172, -34.332366943359375, -31.71057891845703, -29.088790893554688, -26.467002868652344, -23.845212936401367, -21.223424911499023, -18.60163688659668, -15.97984790802002, -13.35805892944336, -10.736270904541016, -8.114482879638672, -5.492693901062012, -2.8709053993225098, -0.2491168975830078, 2.372671127319336, 4.994460105895996, 7.616249084472656, 10.238037109375, 12.859825134277344, 15.481614112854004, 18.103403091430664, 20.725191116333008, 23.34697914123535, 25.968769073486328, 28.590557098388672, 31.212345123291016, 33.83413314819336, 36.4559211730957, 39.07770919799805, 41.699501037597656, 44.3212890625, 46.943077087402344, 49.56486511230469, 52.18665313720703, 54.808441162109375, 57.43022918701172, 60.05201721191406, 62.673805236816406, 65.29559326171875, 67.9173812866211, 70.53916931152344, 73.16096496582031, 75.78275299072266, 78.404541015625, 81.02632904052734, 83.64811706542969, 86.26990509033203, 88.89169311523438, 91.51348876953125, 94.13526916503906]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 11.0, 20.0, 38.0, 61.0, 70.0, 87.0, 86.0, 116.0, 120.0, 100.0, 82.0, 73.0, 38.0, 38.0, 19.0, 11.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.18561553955078, -31.13006591796875, -30.07451629638672, -29.018966674804688, -27.963417053222656, -26.907867431640625, -25.852319717407227, -24.796770095825195, -23.741220474243164, -22.685670852661133, -21.6301212310791, -20.57457160949707, -19.519023895263672, -18.46347427368164, -17.40792465209961, -16.352375030517578, -15.296825408935547, -14.241275787353516, -13.185726165771484, -12.13017749786377, -11.074627876281738, -10.019078254699707, -8.963529586791992, -7.907979965209961, -6.85243034362793, -5.796880722045898, -4.741331577301025, -3.6857821941375732, -2.630232810974121, -1.5746831893920898, -0.5191340446472168, 0.5364151000976562, 1.5919685363769531, 2.6475179195404053, 3.7030673027038574, 4.7586164474487305, 5.814166069030762, 6.869715690612793, 7.925264835357666, 8.980813980102539, 10.03636360168457, 11.091913223266602, 12.147462844848633, 13.203011512756348, 14.258561134338379, 15.31411075592041, 16.369659423828125, 17.425209045410156, 18.480758666992188, 19.53630828857422, 20.59185791015625, 21.64740753173828, 22.702957153320312, 23.758506774902344, 24.814054489135742, 25.869604110717773, 26.925153732299805, 27.980703353881836, 29.036252975463867, 30.0918025970459, 31.147350311279297, 32.20289993286133, 33.25844955444336, 34.31399917602539, 35.36954879760742]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 2.0, 6.0, 4.0, 10.0, 11.0, 15.0, 16.0, 29.0, 30.0, 33.0, 67.0, 73.0, 136.0, 273.0, 584.0, 1982.0, 13112.0, 281222.0, 715585.0, 30281.0, 3322.0, 875.0, 334.0, 178.0, 105.0, 69.0, 42.0, 30.0, 26.0, 20.0, 14.0, 13.0, 13.0, 8.0, 5.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2109375, -14.7066650390625, -14.202392578125, -13.6981201171875, -13.19384765625, -12.6895751953125, -12.185302734375, -11.6810302734375, -11.1767578125, -10.6724853515625, -10.168212890625, -9.6639404296875, -9.15966796875, -8.6553955078125, -8.151123046875, -7.6468505859375, -7.142578125, -6.6383056640625, -6.134033203125, -5.6297607421875, -5.12548828125, -4.6212158203125, -4.116943359375, -3.6126708984375, -3.1083984375, -2.6041259765625, -2.099853515625, -1.5955810546875, -1.09130859375, -0.5870361328125, -0.082763671875, 0.4215087890625, 0.92578125, 1.4300537109375, 1.934326171875, 2.4385986328125, 2.94287109375, 3.4471435546875, 3.951416015625, 4.4556884765625, 4.9599609375, 5.4642333984375, 5.968505859375, 6.4727783203125, 6.97705078125, 7.4813232421875, 7.985595703125, 8.4898681640625, 8.994140625, 9.4984130859375, 10.002685546875, 10.5069580078125, 11.01123046875, 11.5155029296875, 12.019775390625, 12.5240478515625, 13.0283203125, 13.5325927734375, 14.036865234375, 14.5411376953125, 15.04541015625, 15.5496826171875, 16.053955078125, 16.5582275390625, 17.0625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 13.0, 18.0, 37.0, 91.0, 131.0, 165.0, 184.0, 139.0, 110.0, 60.0, 32.0, 17.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.791015625, -2.638092041015625, -2.48516845703125, -2.332244873046875, -2.1793212890625, -2.026397705078125, -1.87347412109375, -1.720550537109375, -1.567626953125, -1.414703369140625, -1.26177978515625, -1.108856201171875, -0.9559326171875, -0.803009033203125, -0.65008544921875, -0.497161865234375, -0.34423828125, -0.191314697265625, -0.03839111328125, 0.114532470703125, 0.2674560546875, 0.420379638671875, 0.57330322265625, 0.726226806640625, 0.879150390625, 1.032073974609375, 1.18499755859375, 1.337921142578125, 1.4908447265625, 1.643768310546875, 1.79669189453125, 1.949615478515625, 2.1025390625, 2.255462646484375, 2.40838623046875, 2.561309814453125, 2.7142333984375, 2.867156982421875, 3.02008056640625, 3.173004150390625, 3.325927734375, 3.478851318359375, 3.63177490234375, 3.784698486328125, 3.9376220703125, 4.090545654296875, 4.24346923828125, 4.396392822265625, 4.54931640625, 4.702239990234375, 4.85516357421875, 5.008087158203125, 5.1610107421875, 5.313934326171875, 5.46685791015625, 5.619781494140625, 5.772705078125, 5.925628662109375, 6.07855224609375, 6.231475830078125, 6.3843994140625, 6.537322998046875, 6.69024658203125, 6.843170166015625, 6.99609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 15.0, 8.0, 15.0, 20.0, 45.0, 60.0, 99.0, 166.0, 297.0, 523.0, 1339.0, 4019.0, 18336.0, 153019.0, 718053.0, 130199.0, 16108.0, 3777.0, 1255.0, 540.0, 237.0, 133.0, 81.0, 48.0, 47.0, 32.0, 19.0, 17.0, 6.0, 12.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.2890625, -10.9794921875, -10.669921875, -10.3603515625, -10.05078125, -9.7412109375, -9.431640625, -9.1220703125, -8.8125, -8.5029296875, -8.193359375, -7.8837890625, -7.57421875, -7.2646484375, -6.955078125, -6.6455078125, -6.3359375, -6.0263671875, -5.716796875, -5.4072265625, -5.09765625, -4.7880859375, -4.478515625, -4.1689453125, -3.859375, -3.5498046875, -3.240234375, -2.9306640625, -2.62109375, -2.3115234375, -2.001953125, -1.6923828125, -1.3828125, -1.0732421875, -0.763671875, -0.4541015625, -0.14453125, 0.1650390625, 0.474609375, 0.7841796875, 1.09375, 1.4033203125, 1.712890625, 2.0224609375, 2.33203125, 2.6416015625, 2.951171875, 3.2607421875, 3.5703125, 3.8798828125, 4.189453125, 4.4990234375, 4.80859375, 5.1181640625, 5.427734375, 5.7373046875, 6.046875, 6.3564453125, 6.666015625, 6.9755859375, 7.28515625, 7.5947265625, 7.904296875, 8.2138671875, 8.5234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 2.0, 15.0, 13.0, 17.0, 18.0, 20.0, 22.0, 36.0, 38.0, 35.0, 47.0, 53.0, 52.0, 52.0, 56.0, 52.0, 55.0, 57.0, 52.0, 44.0, 48.0, 32.0, 22.0, 22.0, 28.0, 21.0, 16.0, 13.0, 11.0, 10.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.4453125, -8.20550537109375, -7.9656982421875, -7.72589111328125, -7.486083984375, -7.24627685546875, -7.0064697265625, -6.76666259765625, -6.52685546875, -6.28704833984375, -6.0472412109375, -5.80743408203125, -5.567626953125, -5.32781982421875, -5.0880126953125, -4.84820556640625, -4.6083984375, -4.36859130859375, -4.1287841796875, -3.88897705078125, -3.649169921875, -3.40936279296875, -3.1695556640625, -2.92974853515625, -2.68994140625, -2.45013427734375, -2.2103271484375, -1.97052001953125, -1.730712890625, -1.49090576171875, -1.2510986328125, -1.01129150390625, -0.771484375, -0.53167724609375, -0.2918701171875, -0.05206298828125, 0.187744140625, 0.42755126953125, 0.6673583984375, 0.90716552734375, 1.14697265625, 1.38677978515625, 1.6265869140625, 1.86639404296875, 2.106201171875, 2.34600830078125, 2.5858154296875, 2.82562255859375, 3.0654296875, 3.30523681640625, 3.5450439453125, 3.78485107421875, 4.024658203125, 4.26446533203125, 4.5042724609375, 4.74407958984375, 4.98388671875, 5.22369384765625, 5.4635009765625, 5.70330810546875, 5.943115234375, 6.18292236328125, 6.4227294921875, 6.66253662109375, 6.90234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 4.0, 6.0, 19.0, 11.0, 16.0, 19.0, 34.0, 54.0, 75.0, 101.0, 137.0, 255.0, 390.0, 646.0, 1218.0, 2415.0, 5270.0, 13062.0, 37882.0, 138114.0, 449137.0, 286606.0, 74020.0, 22794.0, 8468.0, 3691.0, 1788.0, 923.0, 493.0, 312.0, 193.0, 131.0, 82.0, 53.0, 36.0, 23.0, 25.0, 13.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.431640625, -2.3551025390625, -2.278564453125, -2.2020263671875, -2.12548828125, -2.0489501953125, -1.972412109375, -1.8958740234375, -1.8193359375, -1.7427978515625, -1.666259765625, -1.5897216796875, -1.51318359375, -1.4366455078125, -1.360107421875, -1.2835693359375, -1.20703125, -1.1304931640625, -1.053955078125, -0.9774169921875, -0.90087890625, -0.8243408203125, -0.747802734375, -0.6712646484375, -0.5947265625, -0.5181884765625, -0.441650390625, -0.3651123046875, -0.28857421875, -0.2120361328125, -0.135498046875, -0.0589599609375, 0.017578125, 0.0941162109375, 0.170654296875, 0.2471923828125, 0.32373046875, 0.4002685546875, 0.476806640625, 0.5533447265625, 0.6298828125, 0.7064208984375, 0.782958984375, 0.8594970703125, 0.93603515625, 1.0125732421875, 1.089111328125, 1.1656494140625, 1.2421875, 1.3187255859375, 1.395263671875, 1.4718017578125, 1.54833984375, 1.6248779296875, 1.701416015625, 1.7779541015625, 1.8544921875, 1.9310302734375, 2.007568359375, 2.0841064453125, 2.16064453125, 2.2371826171875, 2.313720703125, 2.3902587890625, 2.466796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 18.0, 13.0, 21.0, 21.0, 28.0, 35.0, 51.0, 74.0, 96.0, 119.0, 102.0, 76.0, 84.0, 58.0, 38.0, 31.0, 20.0, 19.0, 12.0, 6.0, 10.0, 8.0, 11.0, 2.0, 6.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0006403923034667969, -0.0006243288516998291, -0.0006082653999328613, -0.0005922019481658936, -0.0005761384963989258, -0.000560075044631958, -0.0005440115928649902, -0.0005279481410980225, -0.0005118846893310547, -0.0004958212375640869, -0.00047975778579711914, -0.00046369433403015137, -0.0004476308822631836, -0.0004315674304962158, -0.00041550397872924805, -0.0003994405269622803, -0.0003833770751953125, -0.0003673136234283447, -0.00035125017166137695, -0.0003351867198944092, -0.0003191232681274414, -0.00030305981636047363, -0.00028699636459350586, -0.0002709329128265381, -0.0002548694610595703, -0.00023880600929260254, -0.00022274255752563477, -0.000206679105758667, -0.00019061565399169922, -0.00017455220222473145, -0.00015848875045776367, -0.0001424252986907959, -0.00012636184692382812, -0.00011029839515686035, -9.423494338989258e-05, -7.81714916229248e-05, -6.210803985595703e-05, -4.604458808898926e-05, -2.9981136322021484e-05, -1.3917684555053711e-05, 2.1457672119140625e-06, 1.8209218978881836e-05, 3.427267074584961e-05, 5.033612251281738e-05, 6.639957427978516e-05, 8.246302604675293e-05, 9.85264778137207e-05, 0.00011458992958068848, 0.00013065338134765625, 0.00014671683311462402, 0.0001627802848815918, 0.00017884373664855957, 0.00019490718841552734, 0.00021097064018249512, 0.0002270340919494629, 0.00024309754371643066, 0.00025916099548339844, 0.0002752244472503662, 0.000291287899017334, 0.00030735135078430176, 0.00032341480255126953, 0.0003394782543182373, 0.0003555417060852051, 0.00037160515785217285, 0.0003876686096191406]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 14.0, 16.0, 15.0, 26.0, 22.0, 41.0, 62.0, 60.0, 108.0, 151.0, 251.0, 381.0, 599.0, 1079.0, 1858.0, 3705.0, 8146.0, 19544.0, 57647.0, 203841.0, 462054.0, 197657.0, 55782.0, 19127.0, 7964.0, 3738.0, 1902.0, 1033.0, 617.0, 360.0, 252.0, 160.0, 101.0, 69.0, 51.0, 36.0, 25.0, 17.0, 9.0, 7.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.21624755859375, -2.1356201171875, -2.05499267578125, -1.974365234375, -1.89373779296875, -1.8131103515625, -1.73248291015625, -1.65185546875, -1.57122802734375, -1.4906005859375, -1.40997314453125, -1.329345703125, -1.24871826171875, -1.1680908203125, -1.08746337890625, -1.0068359375, -0.92620849609375, -0.8455810546875, -0.76495361328125, -0.684326171875, -0.60369873046875, -0.5230712890625, -0.44244384765625, -0.36181640625, -0.28118896484375, -0.2005615234375, -0.11993408203125, -0.039306640625, 0.04132080078125, 0.1219482421875, 0.20257568359375, 0.283203125, 0.36383056640625, 0.4444580078125, 0.52508544921875, 0.605712890625, 0.68634033203125, 0.7669677734375, 0.84759521484375, 0.92822265625, 1.00885009765625, 1.0894775390625, 1.17010498046875, 1.250732421875, 1.33135986328125, 1.4119873046875, 1.49261474609375, 1.5732421875, 1.65386962890625, 1.7344970703125, 1.81512451171875, 1.895751953125, 1.97637939453125, 2.0570068359375, 2.13763427734375, 2.21826171875, 2.29888916015625, 2.3795166015625, 2.46014404296875, 2.540771484375, 2.62139892578125, 2.7020263671875, 2.78265380859375, 2.86328125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 5.0, 11.0, 18.0, 17.0, 23.0, 30.0, 51.0, 56.0, 83.0, 99.0, 111.0, 109.0, 86.0, 53.0, 57.0, 46.0, 34.0, 21.0, 17.0, 16.0, 9.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.08984375, -3.005584716796875, -2.92132568359375, -2.837066650390625, -2.7528076171875, -2.668548583984375, -2.58428955078125, -2.500030517578125, -2.415771484375, -2.331512451171875, -2.24725341796875, -2.162994384765625, -2.0787353515625, -1.994476318359375, -1.91021728515625, -1.825958251953125, -1.74169921875, -1.657440185546875, -1.57318115234375, -1.488922119140625, -1.4046630859375, -1.320404052734375, -1.23614501953125, -1.151885986328125, -1.067626953125, -0.983367919921875, -0.89910888671875, -0.814849853515625, -0.7305908203125, -0.646331787109375, -0.56207275390625, -0.477813720703125, -0.3935546875, -0.309295654296875, -0.22503662109375, -0.140777587890625, -0.0565185546875, 0.027740478515625, 0.11199951171875, 0.196258544921875, 0.280517578125, 0.364776611328125, 0.44903564453125, 0.533294677734375, 0.6175537109375, 0.701812744140625, 0.78607177734375, 0.870330810546875, 0.95458984375, 1.038848876953125, 1.12310791015625, 1.207366943359375, 1.2916259765625, 1.375885009765625, 1.46014404296875, 1.544403076171875, 1.628662109375, 1.712921142578125, 1.79718017578125, 1.881439208984375, 1.9656982421875, 2.049957275390625, 2.13421630859375, 2.218475341796875, 2.302734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 17.0, 38.0, 90.0, 219.0, 343.0, 198.0, 66.0, 18.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.83872985839844, -52.29728317260742, -49.755836486816406, -47.214385986328125, -44.67293930053711, -42.131492614746094, -39.59004211425781, -37.0485954284668, -34.50714874267578, -31.965702056884766, -29.424253463745117, -26.88280487060547, -24.341358184814453, -21.799911499023438, -19.25846290588379, -16.71701431274414, -14.175567626953125, -11.634119987487793, -9.092672348022461, -6.551224708557129, -4.009777069091797, -1.4683294296264648, 1.0731182098388672, 3.6145668029785156, 6.156013488769531, 8.697461128234863, 11.238908767700195, 13.780356407165527, 16.32180404663086, 18.863250732421875, 21.404699325561523, 23.946147918701172, 26.487586975097656, 29.029033660888672, 31.57048225402832, 34.11193084716797, 36.653377532958984, 39.19482421875, 41.73627471923828, 44.2777214050293, 46.81916809082031, 49.36061477661133, 51.902061462402344, 54.443511962890625, 56.98495864868164, 59.526405334472656, 62.06785583496094, 64.60929870605469, 67.15074920654297, 69.69219970703125, 72.233642578125, 74.77509307861328, 77.31654357910156, 79.85798645019531, 82.3994369506836, 84.94088745117188, 87.48233032226562, 90.0237808227539, 92.56522369384766, 95.10667419433594, 97.64811706542969, 100.18956756591797, 102.73101806640625, 105.2724609375, 107.81391143798828]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 11.0, 15.0, 18.0, 17.0, 29.0, 22.0, 22.0, 31.0, 29.0, 43.0, 42.0, 32.0, 40.0, 56.0, 42.0, 49.0, 60.0, 45.0, 47.0, 38.0, 52.0, 38.0, 28.0, 37.0, 19.0, 22.0, 14.0, 15.0, 15.0, 12.0, 6.0, 11.0, 6.0, 6.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.94635772705078, -34.75006866455078, -33.55377960205078, -32.35749053955078, -31.161203384399414, -29.964914321899414, -28.768627166748047, -27.572338104248047, -26.376049041748047, -25.179759979248047, -23.983470916748047, -22.78718376159668, -21.59089469909668, -20.39460563659668, -19.198318481445312, -18.002029418945312, -16.805740356445312, -15.609451293945312, -14.413163185119629, -13.216875076293945, -12.020586013793945, -10.824296951293945, -9.628008842468262, -8.431720733642578, -7.235431671142578, -6.039143085479736, -4.8428544998168945, -3.6465659141540527, -2.450277328491211, -1.2539887428283691, -0.057700157165527344, 1.1385879516601562, 2.3348731994628906, 3.5311617851257324, 4.727450370788574, 5.923738956451416, 7.120027542114258, 8.316316604614258, 9.512604713439941, 10.708892822265625, 11.905181884765625, 13.101470947265625, 14.297759056091309, 15.494047164916992, 16.690336227416992, 17.886625289916992, 19.08291244506836, 20.27920150756836, 21.47549057006836, 22.67177963256836, 23.86806869506836, 25.064355850219727, 26.260644912719727, 27.456933975219727, 28.653221130371094, 29.849510192871094, 31.045799255371094, 32.242088317871094, 33.438377380371094, 34.634666442871094, 35.830955505371094, 37.02724075317383, 38.22352981567383, 39.41981887817383, 40.61610794067383]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 10.0, 12.0, 37.0, 71.0, 139.0, 334.0, 1088.0, 4989.0, 73808.0, 4073417.0, 34890.0, 3718.0, 943.0, 358.0, 162.0, 82.0, 58.0, 38.0, 30.0, 23.0, 16.0, 14.0, 9.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.503173828125, -11.74072265625, -10.978271484375, -10.2158203125, -9.453369140625, -8.69091796875, -7.928466796875, -7.166015625, -6.403564453125, -5.64111328125, -4.878662109375, -4.1162109375, -3.353759765625, -2.59130859375, -1.828857421875, -1.06640625, -0.303955078125, 0.45849609375, 1.220947265625, 1.9833984375, 2.745849609375, 3.50830078125, 4.270751953125, 5.033203125, 5.795654296875, 6.55810546875, 7.320556640625, 8.0830078125, 8.845458984375, 9.60791015625, 10.370361328125, 11.1328125, 11.895263671875, 12.65771484375, 13.420166015625, 14.1826171875, 14.945068359375, 15.70751953125, 16.469970703125, 17.232421875, 17.994873046875, 18.75732421875, 19.519775390625, 20.2822265625, 21.044677734375, 21.80712890625, 22.569580078125, 23.33203125, 24.094482421875, 24.85693359375, 25.619384765625, 26.3818359375, 27.144287109375, 27.90673828125, 28.669189453125, 29.431640625, 30.194091796875, 30.95654296875, 31.718994140625, 32.4814453125, 33.243896484375, 34.00634765625, 34.768798828125, 35.53125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 10.0, 9.0, 29.0, 59.0, 90.0, 122.0, 133.0, 156.0, 144.0, 110.0, 60.0, 41.0, 20.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.131866455078125, -1.99224853515625, -1.852630615234375, -1.7130126953125, -1.573394775390625, -1.43377685546875, -1.294158935546875, -1.154541015625, -1.014923095703125, -0.87530517578125, -0.735687255859375, -0.5960693359375, -0.456451416015625, -0.31683349609375, -0.177215576171875, -0.03759765625, 0.102020263671875, 0.24163818359375, 0.381256103515625, 0.5208740234375, 0.660491943359375, 0.80010986328125, 0.939727783203125, 1.079345703125, 1.218963623046875, 1.35858154296875, 1.498199462890625, 1.6378173828125, 1.777435302734375, 1.91705322265625, 2.056671142578125, 2.1962890625, 2.335906982421875, 2.47552490234375, 2.615142822265625, 2.7547607421875, 2.894378662109375, 3.03399658203125, 3.173614501953125, 3.313232421875, 3.452850341796875, 3.59246826171875, 3.732086181640625, 3.8717041015625, 4.011322021484375, 4.15093994140625, 4.290557861328125, 4.43017578125, 4.569793701171875, 4.70941162109375, 4.849029541015625, 4.9886474609375, 5.128265380859375, 5.26788330078125, 5.407501220703125, 5.547119140625, 5.686737060546875, 5.82635498046875, 5.965972900390625, 6.1055908203125, 6.245208740234375, 6.38482666015625, 6.524444580078125, 6.6640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 20.0, 43.0, 59.0, 90.0, 194.0, 902.0, 3775329.0, 416668.0, 690.0, 149.0, 63.0, 40.0, 16.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.5, -93.32763671875, -91.1552734375, -88.98291015625, -86.810546875, -84.63818359375, -82.4658203125, -80.29345703125, -78.12109375, -75.94873046875, -73.7763671875, -71.60400390625, -69.431640625, -67.25927734375, -65.0869140625, -62.91455078125, -60.7421875, -58.56982421875, -56.3974609375, -54.22509765625, -52.052734375, -49.88037109375, -47.7080078125, -45.53564453125, -43.36328125, -41.19091796875, -39.0185546875, -36.84619140625, -34.673828125, -32.50146484375, -30.3291015625, -28.15673828125, -25.984375, -23.81201171875, -21.6396484375, -19.46728515625, -17.294921875, -15.12255859375, -12.9501953125, -10.77783203125, -8.60546875, -6.43310546875, -4.2607421875, -2.08837890625, 0.083984375, 2.25634765625, 4.4287109375, 6.60107421875, 8.7734375, 10.94580078125, 13.1181640625, 15.29052734375, 17.462890625, 19.63525390625, 21.8076171875, 23.97998046875, 26.15234375, 28.32470703125, 30.4970703125, 32.66943359375, 34.841796875, 37.01416015625, 39.1865234375, 41.35888671875, 43.53125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 11.0, 40.0, 305.0, 3435.0, 246.0, 32.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.5625, -17.16748046875, -16.7724609375, -16.37744140625, -15.982421875, -15.58740234375, -15.1923828125, -14.79736328125, -14.40234375, -14.00732421875, -13.6123046875, -13.21728515625, -12.822265625, -12.42724609375, -12.0322265625, -11.63720703125, -11.2421875, -10.84716796875, -10.4521484375, -10.05712890625, -9.662109375, -9.26708984375, -8.8720703125, -8.47705078125, -8.08203125, -7.68701171875, -7.2919921875, -6.89697265625, -6.501953125, -6.10693359375, -5.7119140625, -5.31689453125, -4.921875, -4.52685546875, -4.1318359375, -3.73681640625, -3.341796875, -2.94677734375, -2.5517578125, -2.15673828125, -1.76171875, -1.36669921875, -0.9716796875, -0.57666015625, -0.181640625, 0.21337890625, 0.6083984375, 1.00341796875, 1.3984375, 1.79345703125, 2.1884765625, 2.58349609375, 2.978515625, 3.37353515625, 3.7685546875, 4.16357421875, 4.55859375, 4.95361328125, 5.3486328125, 5.74365234375, 6.138671875, 6.53369140625, 6.9287109375, 7.32373046875, 7.71875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 45.0, 664.0, 274.0, 18.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-90.30525207519531, -87.55488586425781, -84.80451202392578, -82.05414581298828, -79.30377197265625, -76.55340576171875, -73.80303192138672, -71.05266571044922, -68.30229187011719, -65.55192565917969, -62.801551818847656, -60.05118179321289, -57.300811767578125, -54.55044174194336, -51.800071716308594, -49.049705505371094, -46.29933547973633, -43.54896545410156, -40.7985954284668, -38.04822540283203, -35.297855377197266, -32.5474853515625, -29.797117233276367, -27.0467472076416, -24.296377182006836, -21.54600715637207, -18.795637130737305, -16.045269012451172, -13.29489803314209, -10.544528007507324, -7.794158935546875, -5.043788909912109, -2.2934188842773438, 0.4569509029388428, 3.2073206901550293, 5.957690238952637, 8.708060264587402, 11.458430290222168, 14.208799362182617, 16.959169387817383, 19.70953941345215, 22.459909439086914, 25.21027946472168, 27.960647583007812, 30.711017608642578, 33.461387634277344, 36.21175765991211, 38.962127685546875, 41.71249771118164, 44.462867736816406, 47.21323776245117, 49.96360778808594, 52.7139778137207, 55.46434783935547, 58.21471405029297, 60.965087890625, 63.7154541015625, 66.4658203125, 69.21619415283203, 71.96656036376953, 74.71693420410156, 77.46730041503906, 80.2176742553711, 82.9680404663086, 85.71841430664062]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 13.0, 26.0, 29.0, 43.0, 51.0, 76.0, 75.0, 84.0, 80.0, 82.0, 100.0, 69.0, 63.0, 66.0, 35.0, 32.0, 24.0, 14.0, 14.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.09068775177002, -13.561224937438965, -13.03176212310791, -12.502299308776855, -11.9728364944458, -11.443373680114746, -10.913909912109375, -10.38444709777832, -9.854984283447266, -9.325521469116211, -8.796058654785156, -8.266595840454102, -7.737133026123047, -7.207670211791992, -6.678206920623779, -6.148744106292725, -5.619281768798828, -5.089818954467773, -4.560356140136719, -4.030893325805664, -3.5014302730560303, -2.9719674587249756, -2.442504405975342, -1.913041591644287, -1.3835787773132324, -0.854115903377533, -0.3246530294418335, 0.20480990409851074, 0.7342727184295654, 1.2637355327606201, 1.793198585510254, 2.3226613998413086, 2.852123260498047, 3.3815860748291016, 3.9110488891601562, 4.440511703491211, 4.969974517822266, 5.49943733215332, 6.028900623321533, 6.558363437652588, 7.087826251983643, 7.617289066314697, 8.14675235748291, 8.676215171813965, 9.20567798614502, 9.735140800476074, 10.264603614807129, 10.794066429138184, 11.323529243469238, 11.852992057800293, 12.382454872131348, 12.911917686462402, 13.441380500793457, 13.970843315124512, 14.500307083129883, 15.029769897460938, 15.559232711791992, 16.088695526123047, 16.6181583404541, 17.147621154785156, 17.67708396911621, 18.206546783447266, 18.73600959777832, 19.265472412109375, 19.79493522644043]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 13.0, 10.0, 14.0, 16.0, 21.0, 33.0, 39.0, 40.0, 63.0, 139.0, 243.0, 749.0, 3339.0, 37980.0, 816001.0, 179778.0, 7897.0, 1342.0, 370.0, 146.0, 91.0, 60.0, 28.0, 39.0, 18.0, 19.0, 15.0, 11.0, 9.0, 15.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.09375, -16.5712890625, -16.048828125, -15.5263671875, -15.00390625, -14.4814453125, -13.958984375, -13.4365234375, -12.9140625, -12.3916015625, -11.869140625, -11.3466796875, -10.82421875, -10.3017578125, -9.779296875, -9.2568359375, -8.734375, -8.2119140625, -7.689453125, -7.1669921875, -6.64453125, -6.1220703125, -5.599609375, -5.0771484375, -4.5546875, -4.0322265625, -3.509765625, -2.9873046875, -2.46484375, -1.9423828125, -1.419921875, -0.8974609375, -0.375, 0.1474609375, 0.669921875, 1.1923828125, 1.71484375, 2.2373046875, 2.759765625, 3.2822265625, 3.8046875, 4.3271484375, 4.849609375, 5.3720703125, 5.89453125, 6.4169921875, 6.939453125, 7.4619140625, 7.984375, 8.5068359375, 9.029296875, 9.5517578125, 10.07421875, 10.5966796875, 11.119140625, 11.6416015625, 12.1640625, 12.6865234375, 13.208984375, 13.7314453125, 14.25390625, 14.7763671875, 15.298828125, 15.8212890625, 16.34375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 13.0, 30.0, 60.0, 83.0, 115.0, 171.0, 171.0, 138.0, 104.0, 66.0, 28.0, 16.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.893218994140625, -1.73760986328125, -1.582000732421875, -1.4263916015625, -1.270782470703125, -1.11517333984375, -0.959564208984375, -0.803955078125, -0.648345947265625, -0.49273681640625, -0.337127685546875, -0.1815185546875, -0.025909423828125, 0.12969970703125, 0.285308837890625, 0.44091796875, 0.596527099609375, 0.75213623046875, 0.907745361328125, 1.0633544921875, 1.218963623046875, 1.37457275390625, 1.530181884765625, 1.685791015625, 1.841400146484375, 1.99700927734375, 2.152618408203125, 2.3082275390625, 2.463836669921875, 2.61944580078125, 2.775054931640625, 2.9306640625, 3.086273193359375, 3.24188232421875, 3.397491455078125, 3.5531005859375, 3.708709716796875, 3.86431884765625, 4.019927978515625, 4.175537109375, 4.331146240234375, 4.48675537109375, 4.642364501953125, 4.7979736328125, 4.953582763671875, 5.10919189453125, 5.264801025390625, 5.42041015625, 5.576019287109375, 5.73162841796875, 5.887237548828125, 6.0428466796875, 6.198455810546875, 6.35406494140625, 6.509674072265625, 6.665283203125, 6.820892333984375, 6.97650146484375, 7.132110595703125, 7.2877197265625, 7.443328857421875, 7.59893798828125, 7.754547119140625, 7.91015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 5.0, 13.0, 13.0, 18.0, 39.0, 42.0, 86.0, 129.0, 252.0, 484.0, 1001.0, 2598.0, 9258.0, 58784.0, 610711.0, 325477.0, 30255.0, 5793.0, 1930.0, 768.0, 376.0, 185.0, 111.0, 61.0, 56.0, 28.0, 25.0, 9.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.5, -8.1578369140625, -7.815673828125, -7.4735107421875, -7.13134765625, -6.7891845703125, -6.447021484375, -6.1048583984375, -5.7626953125, -5.4205322265625, -5.078369140625, -4.7362060546875, -4.39404296875, -4.0518798828125, -3.709716796875, -3.3675537109375, -3.025390625, -2.6832275390625, -2.341064453125, -1.9989013671875, -1.65673828125, -1.3145751953125, -0.972412109375, -0.6302490234375, -0.2880859375, 0.0540771484375, 0.396240234375, 0.7384033203125, 1.08056640625, 1.4227294921875, 1.764892578125, 2.1070556640625, 2.44921875, 2.7913818359375, 3.133544921875, 3.4757080078125, 3.81787109375, 4.1600341796875, 4.502197265625, 4.8443603515625, 5.1865234375, 5.5286865234375, 5.870849609375, 6.2130126953125, 6.55517578125, 6.8973388671875, 7.239501953125, 7.5816650390625, 7.923828125, 8.2659912109375, 8.608154296875, 8.9503173828125, 9.29248046875, 9.6346435546875, 9.976806640625, 10.3189697265625, 10.6611328125, 11.0032958984375, 11.345458984375, 11.6876220703125, 12.02978515625, 12.3719482421875, 12.714111328125, 13.0562744140625, 13.3984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 11.0, 14.0, 16.0, 20.0, 27.0, 34.0, 42.0, 63.0, 53.0, 74.0, 67.0, 78.0, 77.0, 56.0, 91.0, 53.0, 45.0, 38.0, 33.0, 32.0, 20.0, 11.0, 11.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.6925048828125, -8.330322265625, -7.9681396484375, -7.60595703125, -7.2437744140625, -6.881591796875, -6.5194091796875, -6.1572265625, -5.7950439453125, -5.432861328125, -5.0706787109375, -4.70849609375, -4.3463134765625, -3.984130859375, -3.6219482421875, -3.259765625, -2.8975830078125, -2.535400390625, -2.1732177734375, -1.81103515625, -1.4488525390625, -1.086669921875, -0.7244873046875, -0.3623046875, -0.0001220703125, 0.362060546875, 0.7242431640625, 1.08642578125, 1.4486083984375, 1.810791015625, 2.1729736328125, 2.53515625, 2.8973388671875, 3.259521484375, 3.6217041015625, 3.98388671875, 4.3460693359375, 4.708251953125, 5.0704345703125, 5.4326171875, 5.7947998046875, 6.156982421875, 6.5191650390625, 6.88134765625, 7.2435302734375, 7.605712890625, 7.9678955078125, 8.330078125, 8.6922607421875, 9.054443359375, 9.4166259765625, 9.77880859375, 10.1409912109375, 10.503173828125, 10.8653564453125, 11.2275390625, 11.5897216796875, 11.951904296875, 12.3140869140625, 12.67626953125, 13.0384521484375, 13.400634765625, 13.7628173828125, 14.125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 8.0, 7.0, 11.0, 18.0, 25.0, 22.0, 46.0, 68.0, 88.0, 142.0, 250.0, 431.0, 814.0, 1550.0, 3511.0, 8641.0, 28148.0, 136954.0, 551360.0, 248070.0, 46475.0, 12729.0, 4773.0, 2061.0, 1027.0, 529.0, 291.0, 167.0, 110.0, 73.0, 40.0, 27.0, 22.0, 13.0, 10.0, 8.0, 8.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.541015625, -2.452392578125, -2.36376953125, -2.275146484375, -2.1865234375, -2.097900390625, -2.00927734375, -1.920654296875, -1.83203125, -1.743408203125, -1.65478515625, -1.566162109375, -1.4775390625, -1.388916015625, -1.30029296875, -1.211669921875, -1.123046875, -1.034423828125, -0.94580078125, -0.857177734375, -0.7685546875, -0.679931640625, -0.59130859375, -0.502685546875, -0.4140625, -0.325439453125, -0.23681640625, -0.148193359375, -0.0595703125, 0.029052734375, 0.11767578125, 0.206298828125, 0.294921875, 0.383544921875, 0.47216796875, 0.560791015625, 0.6494140625, 0.738037109375, 0.82666015625, 0.915283203125, 1.00390625, 1.092529296875, 1.18115234375, 1.269775390625, 1.3583984375, 1.447021484375, 1.53564453125, 1.624267578125, 1.712890625, 1.801513671875, 1.89013671875, 1.978759765625, 2.0673828125, 2.156005859375, 2.24462890625, 2.333251953125, 2.421875, 2.510498046875, 2.59912109375, 2.687744140625, 2.7763671875, 2.864990234375, 2.95361328125, 3.042236328125, 3.130859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 3.0, 14.0, 6.0, 19.0, 37.0, 55.0, 79.0, 96.0, 138.0, 149.0, 137.0, 74.0, 53.0, 48.0, 21.0, 19.0, 15.0, 6.0, 4.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005502700805664062, -0.0005293413996696472, -0.0005084127187728882, -0.00048748403787612915, -0.0004665553569793701, -0.0004456266760826111, -0.00042469799518585205, -0.000403769314289093, -0.000382840633392334, -0.00036191195249557495, -0.0003409832715988159, -0.0003200545907020569, -0.00029912590980529785, -0.0002781972289085388, -0.0002572685480117798, -0.00023633986711502075, -0.00021541118621826172, -0.00019448250532150269, -0.00017355382442474365, -0.00015262514352798462, -0.00013169646263122559, -0.00011076778173446655, -8.983910083770752e-05, -6.891041994094849e-05, -4.798173904418945e-05, -2.705305814743042e-05, -6.124377250671387e-06, 1.4804303646087646e-05, 3.573298454284668e-05, 5.666166543960571e-05, 7.759034633636475e-05, 9.851902723312378e-05, 0.00011944770812988281, 0.00014037638902664185, 0.00016130506992340088, 0.0001822337508201599, 0.00020316243171691895, 0.00022409111261367798, 0.000245019793510437, 0.00026594847440719604, 0.0002868771553039551, 0.0003078058362007141, 0.00032873451709747314, 0.0003496631979942322, 0.0003705918788909912, 0.00039152055978775024, 0.0004124492406845093, 0.0004333779215812683, 0.00045430660247802734, 0.0004752352833747864, 0.0004961639642715454, 0.0005170926451683044, 0.0005380213260650635, 0.0005589500069618225, 0.0005798786878585815, 0.0006008073687553406, 0.0006217360496520996, 0.0006426647305488586, 0.0006635934114456177, 0.0006845220923423767, 0.0007054507732391357, 0.0007263794541358948, 0.0007473081350326538, 0.0007682368159294128, 0.0007891654968261719]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 16.0, 9.0, 14.0, 38.0, 37.0, 59.0, 89.0, 151.0, 227.0, 394.0, 790.0, 1793.0, 4025.0, 10756.0, 37573.0, 193637.0, 583466.0, 165171.0, 33415.0, 9697.0, 3733.0, 1649.0, 792.0, 405.0, 212.0, 137.0, 80.0, 53.0, 44.0, 22.0, 13.0, 12.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.94921875, -3.843780517578125, -3.73834228515625, -3.632904052734375, -3.5274658203125, -3.422027587890625, -3.31658935546875, -3.211151123046875, -3.105712890625, -3.000274658203125, -2.89483642578125, -2.789398193359375, -2.6839599609375, -2.578521728515625, -2.47308349609375, -2.367645263671875, -2.26220703125, -2.156768798828125, -2.05133056640625, -1.945892333984375, -1.8404541015625, -1.735015869140625, -1.62957763671875, -1.524139404296875, -1.418701171875, -1.313262939453125, -1.20782470703125, -1.102386474609375, -0.9969482421875, -0.891510009765625, -0.78607177734375, -0.680633544921875, -0.5751953125, -0.469757080078125, -0.36431884765625, -0.258880615234375, -0.1534423828125, -0.048004150390625, 0.05743408203125, 0.162872314453125, 0.268310546875, 0.373748779296875, 0.47918701171875, 0.584625244140625, 0.6900634765625, 0.795501708984375, 0.90093994140625, 1.006378173828125, 1.11181640625, 1.217254638671875, 1.32269287109375, 1.428131103515625, 1.5335693359375, 1.639007568359375, 1.74444580078125, 1.849884033203125, 1.955322265625, 2.060760498046875, 2.16619873046875, 2.271636962890625, 2.3770751953125, 2.482513427734375, 2.58795166015625, 2.693389892578125, 2.798828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 7.0, 7.0, 9.0, 9.0, 9.0, 14.0, 27.0, 29.0, 49.0, 57.0, 61.0, 94.0, 102.0, 90.0, 100.0, 66.0, 58.0, 48.0, 45.0, 33.0, 23.0, 12.0, 14.0, 6.0, 5.0, 10.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.505859375, -3.409088134765625, -3.31231689453125, -3.215545654296875, -3.1187744140625, -3.022003173828125, -2.92523193359375, -2.828460693359375, -2.731689453125, -2.634918212890625, -2.53814697265625, -2.441375732421875, -2.3446044921875, -2.247833251953125, -2.15106201171875, -2.054290771484375, -1.95751953125, -1.860748291015625, -1.76397705078125, -1.667205810546875, -1.5704345703125, -1.473663330078125, -1.37689208984375, -1.280120849609375, -1.183349609375, -1.086578369140625, -0.98980712890625, -0.893035888671875, -0.7962646484375, -0.699493408203125, -0.60272216796875, -0.505950927734375, -0.4091796875, -0.312408447265625, -0.21563720703125, -0.118865966796875, -0.0220947265625, 0.074676513671875, 0.17144775390625, 0.268218994140625, 0.364990234375, 0.461761474609375, 0.55853271484375, 0.655303955078125, 0.7520751953125, 0.848846435546875, 0.94561767578125, 1.042388916015625, 1.13916015625, 1.235931396484375, 1.33270263671875, 1.429473876953125, 1.5262451171875, 1.623016357421875, 1.71978759765625, 1.816558837890625, 1.913330078125, 2.010101318359375, 2.10687255859375, 2.203643798828125, 2.3004150390625, 2.397186279296875, 2.49395751953125, 2.590728759765625, 2.6875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 10.0, 24.0, 64.0, 170.0, 320.0, 258.0, 95.0, 33.0, 15.0, 6.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.86557006835938, -127.0228271484375, -124.18009185791016, -121.33734893798828, -118.49461364746094, -115.65187072753906, -112.80912780761719, -109.96639251708984, -107.12364959716797, -104.2809066772461, -101.43817138671875, -98.59542846679688, -95.75269317626953, -92.90995025634766, -90.06721496582031, -87.22447204589844, -84.38172912597656, -81.53898620605469, -78.69625091552734, -75.85350799560547, -73.01077270507812, -70.16802978515625, -67.32528686523438, -64.48255157470703, -61.63981628417969, -58.79707717895508, -55.95433807373047, -53.111595153808594, -50.268856048583984, -47.426116943359375, -44.583377838134766, -41.740638732910156, -38.89789581298828, -36.05515670776367, -33.21241760253906, -30.36967658996582, -27.526935577392578, -24.68419647216797, -21.84145736694336, -18.998716354370117, -16.155977249145508, -13.313237190246582, -10.470497131347656, -7.627758026123047, -4.785017967224121, -1.9422779083251953, 0.9004611968994141, 3.7432022094726562, 6.585941314697266, 9.428681373596191, 12.271421432495117, 15.114160537719727, 17.95690155029297, 20.799640655517578, 23.642379760742188, 26.48512077331543, 29.32785987854004, 32.17060089111328, 35.01333999633789, 37.8560791015625, 40.69881820678711, 43.54155731201172, 46.384300231933594, 49.2270393371582, 52.06977844238281]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 9.0, 11.0, 8.0, 8.0, 24.0, 18.0, 16.0, 20.0, 28.0, 32.0, 32.0, 44.0, 30.0, 52.0, 47.0, 50.0, 43.0, 58.0, 43.0, 53.0, 44.0, 42.0, 33.0, 31.0, 35.0, 25.0, 24.0, 22.0, 17.0, 25.0, 13.0, 10.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.41595458984375, -37.097164154052734, -35.778377532958984, -34.45958709716797, -33.14080047607422, -31.822010040283203, -30.50322151184082, -29.184432983398438, -27.865644454956055, -26.546855926513672, -25.22806739807129, -23.909278869628906, -22.59048843383789, -21.27170181274414, -19.952911376953125, -18.634122848510742, -17.31533432006836, -15.996545791625977, -14.677757263183594, -13.358967781066895, -12.040179252624512, -10.721390724182129, -9.40260124206543, -8.083812713623047, -6.765024185180664, -5.446235656738281, -4.12744665145874, -2.8086578845977783, -1.4898691177368164, -0.1710805892944336, 1.1477084159851074, 2.4664974212646484, 3.7852859497070312, 5.104074478149414, 6.422863483428955, 7.741652488708496, 9.060441017150879, 10.379229545593262, 11.698019027709961, 13.016807556152344, 14.335596084594727, 15.65438461303711, 16.973173141479492, 18.291961669921875, 19.61075210571289, 20.92953872680664, 22.248329162597656, 23.56711769104004, 24.885906219482422, 26.204694747924805, 27.523483276367188, 28.84227180480957, 30.161060333251953, 31.47985076904297, 32.79863739013672, 34.117427825927734, 35.43621826171875, 36.755008697509766, 38.073795318603516, 39.39258575439453, 40.71137237548828, 42.0301628112793, 43.34894943237305, 44.66773986816406, 45.98652648925781]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 14.0, 24.0, 56.0, 117.0, 331.0, 972.0, 3887.0, 30998.0, 3951819.0, 192401.0, 10114.0, 2068.0, 730.0, 281.0, 157.0, 90.0, 59.0, 50.0, 29.0, 21.0, 8.0, 15.0, 7.0, 7.0, 6.0, 6.0, 6.0, 6.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.356201171875, -9.60302734375, -8.849853515625, -8.0966796875, -7.343505859375, -6.59033203125, -5.837158203125, -5.083984375, -4.330810546875, -3.57763671875, -2.824462890625, -2.0712890625, -1.318115234375, -0.56494140625, 0.188232421875, 0.94140625, 1.694580078125, 2.44775390625, 3.200927734375, 3.9541015625, 4.707275390625, 5.46044921875, 6.213623046875, 6.966796875, 7.719970703125, 8.47314453125, 9.226318359375, 9.9794921875, 10.732666015625, 11.48583984375, 12.239013671875, 12.9921875, 13.745361328125, 14.49853515625, 15.251708984375, 16.0048828125, 16.758056640625, 17.51123046875, 18.264404296875, 19.017578125, 19.770751953125, 20.52392578125, 21.277099609375, 22.0302734375, 22.783447265625, 23.53662109375, 24.289794921875, 25.04296875, 25.796142578125, 26.54931640625, 27.302490234375, 28.0556640625, 28.808837890625, 29.56201171875, 30.315185546875, 31.068359375, 31.821533203125, 32.57470703125, 33.327880859375, 34.0810546875, 34.834228515625, 35.58740234375, 36.340576171875, 37.09375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 12.0, 37.0, 55.0, 79.0, 96.0, 112.0, 131.0, 136.0, 89.0, 80.0, 67.0, 45.0, 29.0, 9.0, 9.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8024444580078125, -1.680084228515625, -1.5577239990234375, -1.43536376953125, -1.3130035400390625, -1.190643310546875, -1.0682830810546875, -0.9459228515625, -0.8235626220703125, -0.701202392578125, -0.5788421630859375, -0.45648193359375, -0.3341217041015625, -0.211761474609375, -0.0894012451171875, 0.032958984375, 0.1553192138671875, 0.277679443359375, 0.4000396728515625, 0.52239990234375, 0.6447601318359375, 0.767120361328125, 0.8894805908203125, 1.0118408203125, 1.1342010498046875, 1.256561279296875, 1.3789215087890625, 1.50128173828125, 1.6236419677734375, 1.746002197265625, 1.8683624267578125, 1.99072265625, 2.1130828857421875, 2.235443115234375, 2.3578033447265625, 2.48016357421875, 2.6025238037109375, 2.724884033203125, 2.8472442626953125, 2.9696044921875, 3.0919647216796875, 3.214324951171875, 3.3366851806640625, 3.45904541015625, 3.5814056396484375, 3.703765869140625, 3.8261260986328125, 3.948486328125, 4.0708465576171875, 4.193206787109375, 4.3155670166015625, 4.43792724609375, 4.5602874755859375, 4.682647705078125, 4.8050079345703125, 4.9273681640625, 5.0497283935546875, 5.172088623046875, 5.2944488525390625, 5.41680908203125, 5.5391693115234375, 5.661529541015625, 5.7838897705078125, 5.90625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 8.0, 4.0, 15.0, 21.0, 36.0, 53.0, 114.0, 178.0, 369.0, 807.0, 2795.0, 14211.0, 4014427.0, 150443.0, 7219.0, 2030.0, 730.0, 377.0, 182.0, 104.0, 53.0, 36.0, 26.0, 12.0, 15.0, 12.0, 3.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.46875, -27.4443359375, -26.419921875, -25.3955078125, -24.37109375, -23.3466796875, -22.322265625, -21.2978515625, -20.2734375, -19.2490234375, -18.224609375, -17.2001953125, -16.17578125, -15.1513671875, -14.126953125, -13.1025390625, -12.078125, -11.0537109375, -10.029296875, -9.0048828125, -7.98046875, -6.9560546875, -5.931640625, -4.9072265625, -3.8828125, -2.8583984375, -1.833984375, -0.8095703125, 0.21484375, 1.2392578125, 2.263671875, 3.2880859375, 4.3125, 5.3369140625, 6.361328125, 7.3857421875, 8.41015625, 9.4345703125, 10.458984375, 11.4833984375, 12.5078125, 13.5322265625, 14.556640625, 15.5810546875, 16.60546875, 17.6298828125, 18.654296875, 19.6787109375, 20.703125, 21.7275390625, 22.751953125, 23.7763671875, 24.80078125, 25.8251953125, 26.849609375, 27.8740234375, 28.8984375, 29.9228515625, 30.947265625, 31.9716796875, 32.99609375, 34.0205078125, 35.044921875, 36.0693359375, 37.09375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 5.0, 15.0, 71.0, 344.0, 3083.0, 425.0, 65.0, 25.0, 13.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76171875, -7.31964111328125, -6.8775634765625, -6.43548583984375, -5.993408203125, -5.55133056640625, -5.1092529296875, -4.66717529296875, -4.22509765625, -3.78302001953125, -3.3409423828125, -2.89886474609375, -2.456787109375, -2.01470947265625, -1.5726318359375, -1.13055419921875, -0.6884765625, -0.24639892578125, 0.1956787109375, 0.63775634765625, 1.079833984375, 1.52191162109375, 1.9639892578125, 2.40606689453125, 2.84814453125, 3.29022216796875, 3.7322998046875, 4.17437744140625, 4.616455078125, 5.05853271484375, 5.5006103515625, 5.94268798828125, 6.384765625, 6.82684326171875, 7.2689208984375, 7.71099853515625, 8.153076171875, 8.59515380859375, 9.0372314453125, 9.47930908203125, 9.92138671875, 10.36346435546875, 10.8055419921875, 11.24761962890625, 11.689697265625, 12.13177490234375, 12.5738525390625, 13.01593017578125, 13.4580078125, 13.90008544921875, 14.3421630859375, 14.78424072265625, 15.226318359375, 15.66839599609375, 16.1104736328125, 16.55255126953125, 16.99462890625, 17.43670654296875, 17.8787841796875, 18.32086181640625, 18.762939453125, 19.20501708984375, 19.6470947265625, 20.08917236328125, 20.53125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 30.0, 245.0, 559.0, 140.0, 18.0, 9.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.19833374023438, -172.62811279296875, -169.05789184570312, -165.48765563964844, -161.9174346923828, -158.3472137451172, -154.77699279785156, -151.20677185058594, -147.63653564453125, -144.06631469726562, -140.49609375, -136.9258575439453, -133.3556365966797, -129.78541564941406, -126.21519470214844, -122.64497375488281, -119.07475280761719, -115.50453186035156, -111.9343032836914, -108.36408233642578, -104.79385375976562, -101.2236328125, -97.65341186523438, -94.08319091796875, -90.5129623413086, -86.94274139404297, -83.37251281738281, -79.80229187011719, -76.23207092285156, -72.6618423461914, -69.09162139892578, -65.52139282226562, -61.95117950439453, -58.38095474243164, -54.81072998046875, -51.240509033203125, -47.670284271240234, -44.100059509277344, -40.52983856201172, -36.95961380004883, -33.38938903808594, -29.819164276123047, -26.24894142150879, -22.67871856689453, -19.10849380493164, -15.53826904296875, -11.968046188354492, -8.397823333740234, -4.827598571777344, -1.2573747634887695, 2.3128490447998047, 5.883072853088379, 9.453296661376953, 13.023521423339844, 16.5937442779541, 20.16396713256836, 23.73419189453125, 27.30441665649414, 30.8746395111084, 34.444862365722656, 38.01508712768555, 41.58531188964844, 45.15553283691406, 48.72575759887695, 52.295982360839844]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 24.0, 41.0, 82.0, 108.0, 154.0, 139.0, 141.0, 115.0, 84.0, 62.0, 24.0, 20.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.93634796142578, -56.12519073486328, -54.31403732299805, -52.50288009643555, -50.69172668457031, -48.88056945800781, -47.06941223144531, -45.25825500488281, -43.44710159301758, -41.63594436645508, -39.824790954589844, -38.013633728027344, -36.202476501464844, -34.39132308959961, -32.58016586303711, -30.769010543823242, -28.957855224609375, -27.146699905395508, -25.33554458618164, -23.52438735961914, -21.713232040405273, -19.902076721191406, -18.090919494628906, -16.27976417541504, -14.468608856201172, -12.657453536987305, -10.846297264099121, -9.035140991210938, -7.22398567199707, -5.412830352783203, -3.6016740798950195, -1.790517807006836, 0.020641326904296875, 1.8317971229553223, 3.6429529190063477, 5.454108715057373, 7.265264511108398, 9.076419830322266, 10.88757610321045, 12.698732376098633, 14.5098876953125, 16.321043014526367, 18.132198333740234, 19.943355560302734, 21.7545108795166, 23.56566619873047, 25.37682342529297, 27.187978744506836, 28.999134063720703, 30.81028938293457, 32.62144470214844, 34.43260192871094, 36.24375915527344, 38.05491256713867, 39.86606979370117, 41.677223205566406, 43.488380432128906, 45.299537658691406, 47.11069107055664, 48.92184829711914, 50.733001708984375, 52.544158935546875, 54.355316162109375, 56.166473388671875, 57.97762680053711]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 19.0, 22.0, 40.0, 83.0, 113.0, 192.0, 381.0, 871.0, 2569.0, 17615.0, 439551.0, 560303.0, 22035.0, 2875.0, 897.0, 429.0, 215.0, 115.0, 78.0, 47.0, 29.0, 20.0, 12.0, 8.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.33349609375, -15.7294921875, -15.12548828125, -14.521484375, -13.91748046875, -13.3134765625, -12.70947265625, -12.10546875, -11.50146484375, -10.8974609375, -10.29345703125, -9.689453125, -9.08544921875, -8.4814453125, -7.87744140625, -7.2734375, -6.66943359375, -6.0654296875, -5.46142578125, -4.857421875, -4.25341796875, -3.6494140625, -3.04541015625, -2.44140625, -1.83740234375, -1.2333984375, -0.62939453125, -0.025390625, 0.57861328125, 1.1826171875, 1.78662109375, 2.390625, 2.99462890625, 3.5986328125, 4.20263671875, 4.806640625, 5.41064453125, 6.0146484375, 6.61865234375, 7.22265625, 7.82666015625, 8.4306640625, 9.03466796875, 9.638671875, 10.24267578125, 10.8466796875, 11.45068359375, 12.0546875, 12.65869140625, 13.2626953125, 13.86669921875, 14.470703125, 15.07470703125, 15.6787109375, 16.28271484375, 16.88671875, 17.49072265625, 18.0947265625, 18.69873046875, 19.302734375, 19.90673828125, 20.5107421875, 21.11474609375, 21.71875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 14.0, 18.0, 44.0, 77.0, 101.0, 134.0, 142.0, 139.0, 99.0, 96.0, 60.0, 37.0, 18.0, 12.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.26171875, -3.1187744140625, -2.975830078125, -2.8328857421875, -2.68994140625, -2.5469970703125, -2.404052734375, -2.2611083984375, -2.1181640625, -1.9752197265625, -1.832275390625, -1.6893310546875, -1.54638671875, -1.4034423828125, -1.260498046875, -1.1175537109375, -0.974609375, -0.8316650390625, -0.688720703125, -0.5457763671875, -0.40283203125, -0.2598876953125, -0.116943359375, 0.0260009765625, 0.1689453125, 0.3118896484375, 0.454833984375, 0.5977783203125, 0.74072265625, 0.8836669921875, 1.026611328125, 1.1695556640625, 1.3125, 1.4554443359375, 1.598388671875, 1.7413330078125, 1.88427734375, 2.0272216796875, 2.170166015625, 2.3131103515625, 2.4560546875, 2.5989990234375, 2.741943359375, 2.8848876953125, 3.02783203125, 3.1707763671875, 3.313720703125, 3.4566650390625, 3.599609375, 3.7425537109375, 3.885498046875, 4.0284423828125, 4.17138671875, 4.3143310546875, 4.457275390625, 4.6002197265625, 4.7431640625, 4.8861083984375, 5.029052734375, 5.1719970703125, 5.31494140625, 5.4578857421875, 5.600830078125, 5.7437744140625, 5.88671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 5.0, 11.0, 15.0, 16.0, 17.0, 23.0, 37.0, 44.0, 65.0, 97.0, 148.0, 231.0, 330.0, 618.0, 1020.0, 1912.0, 3683.0, 7432.0, 15860.0, 38191.0, 101044.0, 265718.0, 351778.0, 158269.0, 57713.0, 23192.0, 10188.0, 4936.0, 2475.0, 1403.0, 762.0, 485.0, 268.0, 203.0, 99.0, 77.0, 56.0, 41.0, 20.0, 20.0, 12.0, 14.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-4.765625, -4.63031005859375, -4.4949951171875, -4.35968017578125, -4.224365234375, -4.08905029296875, -3.9537353515625, -3.81842041015625, -3.68310546875, -3.54779052734375, -3.4124755859375, -3.27716064453125, -3.141845703125, -3.00653076171875, -2.8712158203125, -2.73590087890625, -2.6005859375, -2.46527099609375, -2.3299560546875, -2.19464111328125, -2.059326171875, -1.92401123046875, -1.7886962890625, -1.65338134765625, -1.51806640625, -1.38275146484375, -1.2474365234375, -1.11212158203125, -0.976806640625, -0.84149169921875, -0.7061767578125, -0.57086181640625, -0.435546875, -0.30023193359375, -0.1649169921875, -0.02960205078125, 0.105712890625, 0.24102783203125, 0.3763427734375, 0.51165771484375, 0.64697265625, 0.78228759765625, 0.9176025390625, 1.05291748046875, 1.188232421875, 1.32354736328125, 1.4588623046875, 1.59417724609375, 1.7294921875, 1.86480712890625, 2.0001220703125, 2.13543701171875, 2.270751953125, 2.40606689453125, 2.5413818359375, 2.67669677734375, 2.81201171875, 2.94732666015625, 3.0826416015625, 3.21795654296875, 3.353271484375, 3.48858642578125, 3.6239013671875, 3.75921630859375, 3.89453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 4.0, 6.0, 8.0, 8.0, 13.0, 10.0, 17.0, 14.0, 14.0, 21.0, 33.0, 19.0, 25.0, 48.0, 30.0, 40.0, 37.0, 51.0, 51.0, 48.0, 34.0, 47.0, 38.0, 45.0, 35.0, 18.0, 30.0, 36.0, 29.0, 27.0, 18.0, 20.0, 26.0, 18.0, 14.0, 13.0, 11.0, 7.0, 3.0, 9.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.60150146484375, -5.4100341796875, -5.21856689453125, -5.027099609375, -4.83563232421875, -4.6441650390625, -4.45269775390625, -4.26123046875, -4.06976318359375, -3.8782958984375, -3.68682861328125, -3.495361328125, -3.30389404296875, -3.1124267578125, -2.92095947265625, -2.7294921875, -2.53802490234375, -2.3465576171875, -2.15509033203125, -1.963623046875, -1.77215576171875, -1.5806884765625, -1.38922119140625, -1.19775390625, -1.00628662109375, -0.8148193359375, -0.62335205078125, -0.431884765625, -0.24041748046875, -0.0489501953125, 0.14251708984375, 0.333984375, 0.52545166015625, 0.7169189453125, 0.90838623046875, 1.099853515625, 1.29132080078125, 1.4827880859375, 1.67425537109375, 1.86572265625, 2.05718994140625, 2.2486572265625, 2.44012451171875, 2.631591796875, 2.82305908203125, 3.0145263671875, 3.20599365234375, 3.3974609375, 3.58892822265625, 3.7803955078125, 3.97186279296875, 4.163330078125, 4.35479736328125, 4.5462646484375, 4.73773193359375, 4.92919921875, 5.12066650390625, 5.3121337890625, 5.50360107421875, 5.695068359375, 5.88653564453125, 6.0780029296875, 6.26947021484375, 6.4609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 5.0, 12.0, 17.0, 26.0, 31.0, 45.0, 75.0, 139.0, 233.0, 431.0, 822.0, 1794.0, 3917.0, 11253.0, 45677.0, 290369.0, 562922.0, 99355.0, 20272.0, 6249.0, 2400.0, 1104.0, 580.0, 362.0, 189.0, 88.0, 61.0, 39.0, 24.0, 20.0, 8.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.31640625, -3.222259521484375, -3.12811279296875, -3.033966064453125, -2.9398193359375, -2.845672607421875, -2.75152587890625, -2.657379150390625, -2.563232421875, -2.469085693359375, -2.37493896484375, -2.280792236328125, -2.1866455078125, -2.092498779296875, -1.99835205078125, -1.904205322265625, -1.81005859375, -1.715911865234375, -1.62176513671875, -1.527618408203125, -1.4334716796875, -1.339324951171875, -1.24517822265625, -1.151031494140625, -1.056884765625, -0.962738037109375, -0.86859130859375, -0.774444580078125, -0.6802978515625, -0.586151123046875, -0.49200439453125, -0.397857666015625, -0.3037109375, -0.209564208984375, -0.11541748046875, -0.021270751953125, 0.0728759765625, 0.167022705078125, 0.26116943359375, 0.355316162109375, 0.449462890625, 0.543609619140625, 0.63775634765625, 0.731903076171875, 0.8260498046875, 0.920196533203125, 1.01434326171875, 1.108489990234375, 1.20263671875, 1.296783447265625, 1.39093017578125, 1.485076904296875, 1.5792236328125, 1.673370361328125, 1.76751708984375, 1.861663818359375, 1.955810546875, 2.049957275390625, 2.14410400390625, 2.238250732421875, 2.3323974609375, 2.426544189453125, 2.52069091796875, 2.614837646484375, 2.708984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 2.0, 6.0, 9.0, 13.0, 16.0, 19.0, 31.0, 41.0, 62.0, 81.0, 123.0, 121.0, 121.0, 98.0, 79.0, 46.0, 25.0, 23.0, 20.0, 12.0, 11.0, 8.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005178451538085938, -0.0005037076771259308, -0.0004895702004432678, -0.00047543272376060486, -0.0004612952470779419, -0.00044715777039527893, -0.00043302029371261597, -0.000418882817029953, -0.00040474534034729004, -0.0003906078636646271, -0.0003764703869819641, -0.00036233291029930115, -0.0003481954336166382, -0.0003340579569339752, -0.00031992048025131226, -0.0003057830035686493, -0.00029164552688598633, -0.00027750805020332336, -0.0002633705735206604, -0.00024923309683799744, -0.00023509562015533447, -0.0002209581434726715, -0.00020682066679000854, -0.00019268319010734558, -0.00017854571342468262, -0.00016440823674201965, -0.0001502707600593567, -0.00013613328337669373, -0.00012199580669403076, -0.0001078583300113678, -9.372085332870483e-05, -7.958337664604187e-05, -6.54458999633789e-05, -5.130842328071594e-05, -3.717094659805298e-05, -2.3033469915390015e-05, -8.89599323272705e-06, 5.241483449935913e-06, 1.9378960132598877e-05, 3.351643681526184e-05, 4.7653913497924805e-05, 6.179139018058777e-05, 7.592886686325073e-05, 9.00663435459137e-05, 0.00010420382022857666, 0.00011834129691123962, 0.0001324787735939026, 0.00014661625027656555, 0.00016075372695922852, 0.00017489120364189148, 0.00018902868032455444, 0.0002031661570072174, 0.00021730363368988037, 0.00023144111037254333, 0.0002455785870552063, 0.00025971606373786926, 0.0002738535404205322, 0.0002879910171031952, 0.00030212849378585815, 0.0003162659704685211, 0.0003304034471511841, 0.00034454092383384705, 0.00035867840051651, 0.000372815877199173, 0.00038695335388183594]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 22.0, 14.0, 30.0, 41.0, 75.0, 111.0, 200.0, 381.0, 690.0, 1603.0, 3939.0, 11508.0, 42534.0, 279798.0, 590687.0, 86966.0, 19421.0, 6048.0, 2278.0, 1017.0, 500.0, 272.0, 150.0, 100.0, 57.0, 42.0, 19.0, 11.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.837890625, -3.71875, -3.599609375, -3.48046875, -3.361328125, -3.2421875, -3.123046875, -3.00390625, -2.884765625, -2.765625, -2.646484375, -2.52734375, -2.408203125, -2.2890625, -2.169921875, -2.05078125, -1.931640625, -1.8125, -1.693359375, -1.57421875, -1.455078125, -1.3359375, -1.216796875, -1.09765625, -0.978515625, -0.859375, -0.740234375, -0.62109375, -0.501953125, -0.3828125, -0.263671875, -0.14453125, -0.025390625, 0.09375, 0.212890625, 0.33203125, 0.451171875, 0.5703125, 0.689453125, 0.80859375, 0.927734375, 1.046875, 1.166015625, 1.28515625, 1.404296875, 1.5234375, 1.642578125, 1.76171875, 1.880859375, 2.0, 2.119140625, 2.23828125, 2.357421875, 2.4765625, 2.595703125, 2.71484375, 2.833984375, 2.953125, 3.072265625, 3.19140625, 3.310546875, 3.4296875, 3.548828125, 3.66796875, 3.787109375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 11.0, 10.0, 15.0, 8.0, 21.0, 21.0, 60.0, 57.0, 125.0, 118.0, 110.0, 112.0, 88.0, 66.0, 39.0, 34.0, 23.0, 13.0, 10.0, 10.0, 10.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.42578125, -3.3292236328125, -3.232666015625, -3.1361083984375, -3.03955078125, -2.9429931640625, -2.846435546875, -2.7498779296875, -2.6533203125, -2.5567626953125, -2.460205078125, -2.3636474609375, -2.26708984375, -2.1705322265625, -2.073974609375, -1.9774169921875, -1.880859375, -1.7843017578125, -1.687744140625, -1.5911865234375, -1.49462890625, -1.3980712890625, -1.301513671875, -1.2049560546875, -1.1083984375, -1.0118408203125, -0.915283203125, -0.8187255859375, -0.72216796875, -0.6256103515625, -0.529052734375, -0.4324951171875, -0.3359375, -0.2393798828125, -0.142822265625, -0.0462646484375, 0.05029296875, 0.1468505859375, 0.243408203125, 0.3399658203125, 0.4365234375, 0.5330810546875, 0.629638671875, 0.7261962890625, 0.82275390625, 0.9193115234375, 1.015869140625, 1.1124267578125, 1.208984375, 1.3055419921875, 1.402099609375, 1.4986572265625, 1.59521484375, 1.6917724609375, 1.788330078125, 1.8848876953125, 1.9814453125, 2.0780029296875, 2.174560546875, 2.2711181640625, 2.36767578125, 2.4642333984375, 2.560791015625, 2.6573486328125, 2.75390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 3.0, 3.0, 7.0, 11.0, 15.0, 23.0, 35.0, 66.0, 103.0, 137.0, 147.0, 154.0, 107.0, 69.0, 51.0, 23.0, 20.0, 10.0, 7.0, 7.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.71232604980469, -37.42655944824219, -36.14078903198242, -34.85502243041992, -33.569252014160156, -32.283485412597656, -30.997718811035156, -29.711950302124023, -28.42618179321289, -27.140413284301758, -25.854644775390625, -24.568878173828125, -23.283109664916992, -21.99734115600586, -20.71157455444336, -19.425806045532227, -18.140037536621094, -16.85426902770996, -15.568501472473145, -14.282733917236328, -12.996965408325195, -11.711196899414062, -10.425429344177246, -9.13966178894043, -7.853893280029297, -6.568125247955322, -5.282357215881348, -3.996589183807373, -2.7108211517333984, -1.4250531196594238, -0.13928508758544922, 1.1464824676513672, 2.4322509765625, 3.7180190086364746, 5.003787040710449, 6.289555072784424, 7.575323104858398, 8.861091613769531, 10.146859169006348, 11.432626724243164, 12.718395233154297, 14.00416374206543, 15.289931297302246, 16.575698852539062, 17.861467361450195, 19.147235870361328, 20.433002471923828, 21.71877098083496, 23.004539489746094, 24.290307998657227, 25.57607650756836, 26.86184310913086, 28.147611618041992, 29.433380126953125, 30.719146728515625, 32.004913330078125, 33.29068374633789, 34.57645034790039, 35.862220764160156, 37.147987365722656, 38.433753967285156, 39.71952438354492, 41.00529098510742, 42.29106140136719, 43.57682800292969]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 10.0, 22.0, 20.0, 20.0, 22.0, 32.0, 36.0, 34.0, 49.0, 44.0, 35.0, 39.0, 43.0, 53.0, 59.0, 57.0, 39.0, 54.0, 48.0, 45.0, 28.0, 37.0, 29.0, 17.0, 31.0, 16.0, 18.0, 10.0, 10.0, 11.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.0434684753418, -41.76372528076172, -40.48398208618164, -39.20423889160156, -37.924495697021484, -36.644752502441406, -35.36500930786133, -34.08526611328125, -32.80552673339844, -31.52578353881836, -30.24604034423828, -28.966297149658203, -27.686553955078125, -26.406810760498047, -25.1270694732666, -23.847326278686523, -22.567581176757812, -21.287837982177734, -20.008094787597656, -18.728351593017578, -17.4486083984375, -16.168865203857422, -14.889123916625977, -13.609380722045898, -12.32963752746582, -11.049894332885742, -9.770151138305664, -8.490408897399902, -7.210665702819824, -5.930922508239746, -4.651179790496826, -3.3714370727539062, -2.0916976928710938, -0.8119547367095947, 0.4677882194519043, 1.7475311756134033, 3.0272741317749023, 4.3070173263549805, 5.5867600440979, 6.86650276184082, 8.146245956420898, 9.425989151000977, 10.705732345581055, 11.985474586486816, 13.265217781066895, 14.544960975646973, 15.824703216552734, 17.104446411132812, 18.38418960571289, 19.66393280029297, 20.943675994873047, 22.223419189453125, 23.503162384033203, 24.78290557861328, 26.062646865844727, 27.342390060424805, 28.622133255004883, 29.90187644958496, 31.18161964416504, 32.461360931396484, 33.74110412597656, 35.02084732055664, 36.30059051513672, 37.5803337097168, 38.860076904296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 11.0, 29.0, 51.0, 109.0, 180.0, 488.0, 1609.0, 13578.0, 4074731.0, 97839.0, 4040.0, 882.0, 350.0, 165.0, 87.0, 54.0, 22.0, 20.0, 9.0, 11.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.455078125, -17.73828125, -17.021484375, -16.3046875, -15.587890625, -14.87109375, -14.154296875, -13.4375, -12.720703125, -12.00390625, -11.287109375, -10.5703125, -9.853515625, -9.13671875, -8.419921875, -7.703125, -6.986328125, -6.26953125, -5.552734375, -4.8359375, -4.119140625, -3.40234375, -2.685546875, -1.96875, -1.251953125, -0.53515625, 0.181640625, 0.8984375, 1.615234375, 2.33203125, 3.048828125, 3.765625, 4.482421875, 5.19921875, 5.916015625, 6.6328125, 7.349609375, 8.06640625, 8.783203125, 9.5, 10.216796875, 10.93359375, 11.650390625, 12.3671875, 13.083984375, 13.80078125, 14.517578125, 15.234375, 15.951171875, 16.66796875, 17.384765625, 18.1015625, 18.818359375, 19.53515625, 20.251953125, 20.96875, 21.685546875, 22.40234375, 23.119140625, 23.8359375, 24.552734375, 25.26953125, 25.986328125, 26.703125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 9.0, 20.0, 45.0, 77.0, 78.0, 120.0, 135.0, 128.0, 124.0, 82.0, 70.0, 51.0, 26.0, 16.0, 11.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.365234375, -3.219940185546875, -3.07464599609375, -2.929351806640625, -2.7840576171875, -2.638763427734375, -2.49346923828125, -2.348175048828125, -2.202880859375, -2.057586669921875, -1.91229248046875, -1.766998291015625, -1.6217041015625, -1.476409912109375, -1.33111572265625, -1.185821533203125, -1.04052734375, -0.895233154296875, -0.74993896484375, -0.604644775390625, -0.4593505859375, -0.314056396484375, -0.16876220703125, -0.023468017578125, 0.121826171875, 0.267120361328125, 0.41241455078125, 0.557708740234375, 0.7030029296875, 0.848297119140625, 0.99359130859375, 1.138885498046875, 1.2841796875, 1.429473876953125, 1.57476806640625, 1.720062255859375, 1.8653564453125, 2.010650634765625, 2.15594482421875, 2.301239013671875, 2.446533203125, 2.591827392578125, 2.73712158203125, 2.882415771484375, 3.0277099609375, 3.173004150390625, 3.31829833984375, 3.463592529296875, 3.60888671875, 3.754180908203125, 3.89947509765625, 4.044769287109375, 4.1900634765625, 4.335357666015625, 4.48065185546875, 4.625946044921875, 4.771240234375, 4.916534423828125, 5.06182861328125, 5.207122802734375, 5.3524169921875, 5.497711181640625, 5.64300537109375, 5.788299560546875, 5.93359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 5.0, 10.0, 11.0, 18.0, 15.0, 44.0, 40.0, 42.0, 80.0, 95.0, 133.0, 231.0, 389.0, 857.0, 2441.0, 10169.0, 85270.0, 3954745.0, 122852.0, 12324.0, 2644.0, 881.0, 392.0, 195.0, 115.0, 71.0, 49.0, 38.0, 34.0, 18.0, 11.0, 15.0, 16.0, 3.0, 5.0, 9.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.24072265625, -10.8955078125, -10.55029296875, -10.205078125, -9.85986328125, -9.5146484375, -9.16943359375, -8.82421875, -8.47900390625, -8.1337890625, -7.78857421875, -7.443359375, -7.09814453125, -6.7529296875, -6.40771484375, -6.0625, -5.71728515625, -5.3720703125, -5.02685546875, -4.681640625, -4.33642578125, -3.9912109375, -3.64599609375, -3.30078125, -2.95556640625, -2.6103515625, -2.26513671875, -1.919921875, -1.57470703125, -1.2294921875, -0.88427734375, -0.5390625, -0.19384765625, 0.1513671875, 0.49658203125, 0.841796875, 1.18701171875, 1.5322265625, 1.87744140625, 2.22265625, 2.56787109375, 2.9130859375, 3.25830078125, 3.603515625, 3.94873046875, 4.2939453125, 4.63916015625, 4.984375, 5.32958984375, 5.6748046875, 6.02001953125, 6.365234375, 6.71044921875, 7.0556640625, 7.40087890625, 7.74609375, 8.09130859375, 8.4365234375, 8.78173828125, 9.126953125, 9.47216796875, 9.8173828125, 10.16259765625, 10.5078125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 10.0, 2.0, 5.0, 11.0, 17.0, 19.0, 32.0, 54.0, 93.0, 257.0, 1048.0, 1963.0, 329.0, 118.0, 45.0, 26.0, 15.0, 11.0, 13.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.06640625, -4.9589691162109375, -4.851531982421875, -4.7440948486328125, -4.63665771484375, -4.5292205810546875, -4.421783447265625, -4.3143463134765625, -4.2069091796875, -4.0994720458984375, -3.992034912109375, -3.8845977783203125, -3.77716064453125, -3.6697235107421875, -3.562286376953125, -3.4548492431640625, -3.347412109375, -3.2399749755859375, -3.132537841796875, -3.0251007080078125, -2.91766357421875, -2.8102264404296875, -2.702789306640625, -2.5953521728515625, -2.4879150390625, -2.3804779052734375, -2.273040771484375, -2.1656036376953125, -2.05816650390625, -1.9507293701171875, -1.843292236328125, -1.7358551025390625, -1.62841796875, -1.5209808349609375, -1.413543701171875, -1.3061065673828125, -1.19866943359375, -1.0912322998046875, -0.983795166015625, -0.8763580322265625, -0.7689208984375, -0.6614837646484375, -0.554046630859375, -0.4466094970703125, -0.33917236328125, -0.2317352294921875, -0.124298095703125, -0.0168609619140625, 0.090576171875, 0.1980133056640625, 0.305450439453125, 0.4128875732421875, 0.52032470703125, 0.6277618408203125, 0.735198974609375, 0.8426361083984375, 0.9500732421875, 1.0575103759765625, 1.164947509765625, 1.2723846435546875, 1.37982177734375, 1.4872589111328125, 1.594696044921875, 1.7021331787109375, 1.8095703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 7.0, 13.0, 23.0, 42.0, 86.0, 157.0, 222.0, 182.0, 136.0, 77.0, 31.0, 13.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.342247009277344, -31.711666107177734, -31.081087112426758, -30.45050621032715, -29.81992530822754, -29.189346313476562, -28.558765411376953, -27.928184509277344, -27.297603607177734, -26.667022705078125, -26.03644371032715, -25.40586280822754, -24.77528190612793, -24.144702911376953, -23.514122009277344, -22.883541107177734, -22.252962112426758, -21.62238121032715, -20.991802215576172, -20.361221313476562, -19.730640411376953, -19.100059509277344, -18.469480514526367, -17.838899612426758, -17.20832061767578, -16.577739715576172, -15.947159767150879, -15.316579818725586, -14.685998916625977, -14.055418968200684, -13.42483901977539, -12.794258117675781, -12.163675308227539, -11.533095359802246, -10.902514457702637, -10.271934509277344, -9.641353607177734, -9.010773658752441, -8.380193710327148, -7.749613285064697, -7.119032859802246, -6.488452434539795, -5.857872009277344, -5.227292060852051, -4.5967116355896, -3.9661312103271484, -3.3355510234832764, -2.7049708366394043, -2.074390411376953, -1.4438101053237915, -0.8132297992706299, -0.18264949321746826, 0.44793081283569336, 1.0785112380981445, 1.7090914249420166, 2.3396716117858887, 2.97025203704834, 3.600832462310791, 4.231412887573242, 4.861992835998535, 5.492573261260986, 6.1231536865234375, 6.7537336349487305, 7.384314060211182, 8.014894485473633]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 12.0, 11.0, 25.0, 27.0, 41.0, 42.0, 54.0, 59.0, 84.0, 61.0, 63.0, 80.0, 68.0, 76.0, 60.0, 50.0, 48.0, 33.0, 22.0, 25.0, 21.0, 11.0, 9.0, 7.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.256521224975586, -16.842187881469727, -16.427854537963867, -16.013521194458008, -15.599188804626465, -15.184855461120605, -14.770522117614746, -14.356189727783203, -13.941856384277344, -13.527523040771484, -13.113189697265625, -12.698857307434082, -12.284523963928223, -11.870190620422363, -11.455857276916504, -11.041524887084961, -10.627191543579102, -10.212858200073242, -9.798524856567383, -9.38419246673584, -8.96985912322998, -8.555525779724121, -8.141192436218262, -7.7268595695495605, -7.312525749206543, -6.898192405700684, -6.483859539031982, -6.069526195526123, -5.655193328857422, -5.2408599853515625, -4.826526641845703, -4.412193775177002, -3.997860908508301, -3.5835278034210205, -3.1691946983337402, -2.754861354827881, -2.3405284881591797, -1.9261951446533203, -1.51186203956604, -1.0975289344787598, -0.6831958293914795, -0.26886269450187683, 0.14547044038772583, 0.5598036050796509, 0.9741367101669312, 1.388469934463501, 1.8028030395507812, 2.2171361446380615, 2.631469249725342, 3.045802354812622, 3.4601354598999023, 3.8744688034057617, 4.288801670074463, 4.703135013580322, 5.117467880249023, 5.531801223754883, 5.946134567260742, 6.360467910766602, 6.774800777435303, 7.189134120941162, 7.603466987609863, 8.017800331115723, 8.432133674621582, 8.846466064453125, 9.260799407958984]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 6.0, 4.0, 20.0, 13.0, 19.0, 27.0, 22.0, 42.0, 51.0, 62.0, 103.0, 174.0, 232.0, 369.0, 655.0, 1457.0, 4292.0, 18348.0, 115597.0, 634862.0, 229895.0, 31545.0, 6590.0, 2005.0, 866.0, 416.0, 278.0, 179.0, 114.0, 85.0, 49.0, 47.0, 29.0, 24.0, 14.0, 19.0, 9.0, 5.0, 6.0, 9.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.3203125, -10.9627685546875, -10.605224609375, -10.2476806640625, -9.89013671875, -9.5325927734375, -9.175048828125, -8.8175048828125, -8.4599609375, -8.1024169921875, -7.744873046875, -7.3873291015625, -7.02978515625, -6.6722412109375, -6.314697265625, -5.9571533203125, -5.599609375, -5.2420654296875, -4.884521484375, -4.5269775390625, -4.16943359375, -3.8118896484375, -3.454345703125, -3.0968017578125, -2.7392578125, -2.3817138671875, -2.024169921875, -1.6666259765625, -1.30908203125, -0.9515380859375, -0.593994140625, -0.2364501953125, 0.12109375, 0.4786376953125, 0.836181640625, 1.1937255859375, 1.55126953125, 1.9088134765625, 2.266357421875, 2.6239013671875, 2.9814453125, 3.3389892578125, 3.696533203125, 4.0540771484375, 4.41162109375, 4.7691650390625, 5.126708984375, 5.4842529296875, 5.841796875, 6.1993408203125, 6.556884765625, 6.9144287109375, 7.27197265625, 7.6295166015625, 7.987060546875, 8.3446044921875, 8.7021484375, 9.0596923828125, 9.417236328125, 9.7747802734375, 10.13232421875, 10.4898681640625, 10.847412109375, 11.2049560546875, 11.5625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 17.0, 40.0, 61.0, 88.0, 130.0, 158.0, 138.0, 121.0, 90.0, 56.0, 47.0, 26.0, 17.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.276336669921875, -3.12103271484375, -2.965728759765625, -2.8104248046875, -2.655120849609375, -2.49981689453125, -2.344512939453125, -2.189208984375, -2.033905029296875, -1.87860107421875, -1.723297119140625, -1.5679931640625, -1.412689208984375, -1.25738525390625, -1.102081298828125, -0.94677734375, -0.791473388671875, -0.63616943359375, -0.480865478515625, -0.3255615234375, -0.170257568359375, -0.01495361328125, 0.140350341796875, 0.295654296875, 0.450958251953125, 0.60626220703125, 0.761566162109375, 0.9168701171875, 1.072174072265625, 1.22747802734375, 1.382781982421875, 1.5380859375, 1.693389892578125, 1.84869384765625, 2.003997802734375, 2.1593017578125, 2.314605712890625, 2.46990966796875, 2.625213623046875, 2.780517578125, 2.935821533203125, 3.09112548828125, 3.246429443359375, 3.4017333984375, 3.557037353515625, 3.71234130859375, 3.867645263671875, 4.02294921875, 4.178253173828125, 4.33355712890625, 4.488861083984375, 4.6441650390625, 4.799468994140625, 4.95477294921875, 5.110076904296875, 5.265380859375, 5.420684814453125, 5.57598876953125, 5.731292724609375, 5.8865966796875, 6.041900634765625, 6.19720458984375, 6.352508544921875, 6.5078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 2.0, 4.0, 6.0, 7.0, 17.0, 17.0, 23.0, 45.0, 46.0, 66.0, 86.0, 143.0, 200.0, 280.0, 442.0, 717.0, 1115.0, 1893.0, 3290.0, 6071.0, 11856.0, 25737.0, 60596.0, 155753.0, 332106.0, 261168.0, 105737.0, 42208.0, 18545.0, 8990.0, 4674.0, 2563.0, 1425.0, 927.0, 556.0, 367.0, 279.0, 168.0, 114.0, 76.0, 70.0, 47.0, 35.0, 24.0, 24.0, 15.0, 10.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.47265625, -4.3441162109375, -4.215576171875, -4.0870361328125, -3.95849609375, -3.8299560546875, -3.701416015625, -3.5728759765625, -3.4443359375, -3.3157958984375, -3.187255859375, -3.0587158203125, -2.93017578125, -2.8016357421875, -2.673095703125, -2.5445556640625, -2.416015625, -2.2874755859375, -2.158935546875, -2.0303955078125, -1.90185546875, -1.7733154296875, -1.644775390625, -1.5162353515625, -1.3876953125, -1.2591552734375, -1.130615234375, -1.0020751953125, -0.87353515625, -0.7449951171875, -0.616455078125, -0.4879150390625, -0.359375, -0.2308349609375, -0.102294921875, 0.0262451171875, 0.15478515625, 0.2833251953125, 0.411865234375, 0.5404052734375, 0.6689453125, 0.7974853515625, 0.926025390625, 1.0545654296875, 1.18310546875, 1.3116455078125, 1.440185546875, 1.5687255859375, 1.697265625, 1.8258056640625, 1.954345703125, 2.0828857421875, 2.21142578125, 2.3399658203125, 2.468505859375, 2.5970458984375, 2.7255859375, 2.8541259765625, 2.982666015625, 3.1112060546875, 3.23974609375, 3.3682861328125, 3.496826171875, 3.6253662109375, 3.75390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 13.0, 13.0, 14.0, 22.0, 23.0, 28.0, 29.0, 34.0, 28.0, 37.0, 36.0, 34.0, 33.0, 43.0, 43.0, 47.0, 46.0, 39.0, 48.0, 46.0, 30.0, 50.0, 32.0, 36.0, 24.0, 23.0, 17.0, 15.0, 14.0, 7.0, 18.0, 19.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-7.19140625, -6.97174072265625, -6.7520751953125, -6.53240966796875, -6.312744140625, -6.09307861328125, -5.8734130859375, -5.65374755859375, -5.43408203125, -5.21441650390625, -4.9947509765625, -4.77508544921875, -4.555419921875, -4.33575439453125, -4.1160888671875, -3.89642333984375, -3.6767578125, -3.45709228515625, -3.2374267578125, -3.01776123046875, -2.798095703125, -2.57843017578125, -2.3587646484375, -2.13909912109375, -1.91943359375, -1.69976806640625, -1.4801025390625, -1.26043701171875, -1.040771484375, -0.82110595703125, -0.6014404296875, -0.38177490234375, -0.162109375, 0.05755615234375, 0.2772216796875, 0.49688720703125, 0.716552734375, 0.93621826171875, 1.1558837890625, 1.37554931640625, 1.59521484375, 1.81488037109375, 2.0345458984375, 2.25421142578125, 2.473876953125, 2.69354248046875, 2.9132080078125, 3.13287353515625, 3.3525390625, 3.57220458984375, 3.7918701171875, 4.01153564453125, 4.231201171875, 4.45086669921875, 4.6705322265625, 4.89019775390625, 5.10986328125, 5.32952880859375, 5.5491943359375, 5.76885986328125, 5.988525390625, 6.20819091796875, 6.4278564453125, 6.64752197265625, 6.8671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 17.0, 24.0, 34.0, 54.0, 131.0, 207.0, 444.0, 962.0, 2418.0, 7353.0, 30529.0, 212532.0, 677494.0, 91678.0, 16917.0, 4689.0, 1663.0, 670.0, 350.0, 150.0, 100.0, 44.0, 23.0, 17.0, 13.0, 9.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.359375, -4.20538330078125, -4.0513916015625, -3.89739990234375, -3.743408203125, -3.58941650390625, -3.4354248046875, -3.28143310546875, -3.12744140625, -2.97344970703125, -2.8194580078125, -2.66546630859375, -2.511474609375, -2.35748291015625, -2.2034912109375, -2.04949951171875, -1.8955078125, -1.74151611328125, -1.5875244140625, -1.43353271484375, -1.279541015625, -1.12554931640625, -0.9715576171875, -0.81756591796875, -0.66357421875, -0.50958251953125, -0.3555908203125, -0.20159912109375, -0.047607421875, 0.10638427734375, 0.2603759765625, 0.41436767578125, 0.568359375, 0.72235107421875, 0.8763427734375, 1.03033447265625, 1.184326171875, 1.33831787109375, 1.4923095703125, 1.64630126953125, 1.80029296875, 1.95428466796875, 2.1082763671875, 2.26226806640625, 2.416259765625, 2.57025146484375, 2.7242431640625, 2.87823486328125, 3.0322265625, 3.18621826171875, 3.3402099609375, 3.49420166015625, 3.648193359375, 3.80218505859375, 3.9561767578125, 4.11016845703125, 4.26416015625, 4.41815185546875, 4.5721435546875, 4.72613525390625, 4.880126953125, 5.03411865234375, 5.1881103515625, 5.34210205078125, 5.49609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 10.0, 15.0, 16.0, 14.0, 33.0, 38.0, 54.0, 67.0, 101.0, 173.0, 133.0, 99.0, 62.0, 52.0, 22.0, 26.0, 19.0, 15.0, 8.0, 6.0, 5.0, 4.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007023811340332031, -0.0006795227527618408, -0.0006566643714904785, -0.0006338059902191162, -0.0006109476089477539, -0.0005880892276763916, -0.0005652308464050293, -0.000542372465133667, -0.0005195140838623047, -0.0004966557025909424, -0.0004737973213195801, -0.0004509389400482178, -0.00042808055877685547, -0.00040522217750549316, -0.00038236379623413086, -0.00035950541496276855, -0.00033664703369140625, -0.00031378865242004395, -0.00029093027114868164, -0.00026807188987731934, -0.00024521350860595703, -0.00022235512733459473, -0.00019949674606323242, -0.00017663836479187012, -0.0001537799835205078, -0.0001309216022491455, -0.0001080632209777832, -8.52048397064209e-05, -6.23464584350586e-05, -3.948807716369629e-05, -1.6629695892333984e-05, 6.22868537902832e-06, 2.9087066650390625e-05, 5.194544792175293e-05, 7.480382919311523e-05, 9.766221046447754e-05, 0.00012052059173583984, 0.00014337897300720215, 0.00016623735427856445, 0.00018909573554992676, 0.00021195411682128906, 0.00023481249809265137, 0.00025767087936401367, 0.000280529260635376, 0.0003033876419067383, 0.0003262460231781006, 0.0003491044044494629, 0.0003719627857208252, 0.0003948211669921875, 0.0004176795482635498, 0.0004405379295349121, 0.0004633963108062744, 0.0004862546920776367, 0.000509113073348999, 0.0005319714546203613, 0.0005548298358917236, 0.0005776882171630859, 0.0006005465984344482, 0.0006234049797058105, 0.0006462633609771729, 0.0006691217422485352, 0.0006919801235198975, 0.0007148385047912598, 0.0007376968860626221, 0.0007605552673339844]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 9.0, 25.0, 35.0, 57.0, 143.0, 330.0, 882.0, 2776.0, 12634.0, 89078.0, 809033.0, 113807.0, 15031.0, 3215.0, 868.0, 334.0, 138.0, 72.0, 47.0, 23.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.898681640625, -8.64111328125, -8.383544921875, -8.1259765625, -7.868408203125, -7.61083984375, -7.353271484375, -7.095703125, -6.838134765625, -6.58056640625, -6.322998046875, -6.0654296875, -5.807861328125, -5.55029296875, -5.292724609375, -5.03515625, -4.777587890625, -4.52001953125, -4.262451171875, -4.0048828125, -3.747314453125, -3.48974609375, -3.232177734375, -2.974609375, -2.717041015625, -2.45947265625, -2.201904296875, -1.9443359375, -1.686767578125, -1.42919921875, -1.171630859375, -0.9140625, -0.656494140625, -0.39892578125, -0.141357421875, 0.1162109375, 0.373779296875, 0.63134765625, 0.888916015625, 1.146484375, 1.404052734375, 1.66162109375, 1.919189453125, 2.1767578125, 2.434326171875, 2.69189453125, 2.949462890625, 3.20703125, 3.464599609375, 3.72216796875, 3.979736328125, 4.2373046875, 4.494873046875, 4.75244140625, 5.010009765625, 5.267578125, 5.525146484375, 5.78271484375, 6.040283203125, 6.2978515625, 6.555419921875, 6.81298828125, 7.070556640625, 7.328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 9.0, 7.0, 11.0, 11.0, 9.0, 11.0, 22.0, 27.0, 27.0, 36.0, 54.0, 75.0, 97.0, 109.0, 97.0, 73.0, 66.0, 42.0, 36.0, 29.0, 28.0, 17.0, 17.0, 8.0, 10.0, 11.0, 6.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.94140625, -3.83074951171875, -3.7200927734375, -3.60943603515625, -3.498779296875, -3.38812255859375, -3.2774658203125, -3.16680908203125, -3.05615234375, -2.94549560546875, -2.8348388671875, -2.72418212890625, -2.613525390625, -2.50286865234375, -2.3922119140625, -2.28155517578125, -2.1708984375, -2.06024169921875, -1.9495849609375, -1.83892822265625, -1.728271484375, -1.61761474609375, -1.5069580078125, -1.39630126953125, -1.28564453125, -1.17498779296875, -1.0643310546875, -0.95367431640625, -0.843017578125, -0.73236083984375, -0.6217041015625, -0.51104736328125, -0.400390625, -0.28973388671875, -0.1790771484375, -0.06842041015625, 0.042236328125, 0.15289306640625, 0.2635498046875, 0.37420654296875, 0.48486328125, 0.59552001953125, 0.7061767578125, 0.81683349609375, 0.927490234375, 1.03814697265625, 1.1488037109375, 1.25946044921875, 1.3701171875, 1.48077392578125, 1.5914306640625, 1.70208740234375, 1.812744140625, 1.92340087890625, 2.0340576171875, 2.14471435546875, 2.25537109375, 2.36602783203125, 2.4766845703125, 2.58734130859375, 2.697998046875, 2.80865478515625, 2.9193115234375, 3.02996826171875, 3.140625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 11.0, 7.0, 34.0, 65.0, 152.0, 305.0, 238.0, 124.0, 39.0, 10.0, 11.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.027982711791992, -25.73267936706543, -22.437376022338867, -19.142072677612305, -15.846769332885742, -12.55146598815918, -9.256162643432617, -5.960859298706055, -2.665555953979492, 0.6297473907470703, 3.925050735473633, 7.220354080200195, 10.515657424926758, 13.81096076965332, 17.106264114379883, 20.401567459106445, 23.696870803833008, 26.99217414855957, 30.287477493286133, 33.58277893066406, 36.878082275390625, 40.17338562011719, 43.46868896484375, 46.76399230957031, 50.059295654296875, 53.35459899902344, 56.64990234375, 59.94520568847656, 63.240509033203125, 66.53581237792969, 69.83111572265625, 73.12641906738281, 76.42172241210938, 79.71702575683594, 83.0123291015625, 86.30763244628906, 89.60293579101562, 92.89823913574219, 96.19354248046875, 99.48884582519531, 102.78414916992188, 106.07945251464844, 109.374755859375, 112.67005920410156, 115.96536254882812, 119.26066589355469, 122.55596923828125, 125.85127258300781, 129.14657592773438, 132.44187927246094, 135.7371826171875, 139.03248596191406, 142.32778930664062, 145.6230926513672, 148.91839599609375, 152.2136993408203, 155.50900268554688, 158.80430603027344, 162.099609375, 165.39491271972656, 168.69021606445312, 171.9855194091797, 175.28082275390625, 178.5761260986328, 181.87142944335938]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 8.0, 2.0, 5.0, 5.0, 11.0, 11.0, 15.0, 16.0, 26.0, 29.0, 28.0, 26.0, 24.0, 36.0, 49.0, 33.0, 29.0, 45.0, 23.0, 43.0, 45.0, 45.0, 44.0, 40.0, 46.0, 40.0, 44.0, 35.0, 29.0, 25.0, 20.0, 26.0, 22.0, 11.0, 8.0, 15.0, 12.0, 7.0, 5.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.568180084228516, -46.148834228515625, -44.7294921875, -43.31014633178711, -41.89080047607422, -40.471458435058594, -39.0521125793457, -37.63276672363281, -36.21342468261719, -34.7940788269043, -33.37473678588867, -31.95539093017578, -30.53604507446289, -29.116701126098633, -27.697357177734375, -26.278011322021484, -24.858665466308594, -23.439321517944336, -22.019975662231445, -20.600631713867188, -19.181285858154297, -17.76194190979004, -16.34259796142578, -14.923253059387207, -13.503908157348633, -12.084563255310059, -10.665218353271484, -9.245874404907227, -7.826529502868652, -6.407184600830078, -4.98784065246582, -3.568495750427246, -2.1491546630859375, -0.7298099994659424, 0.6895346641540527, 2.1088790893554688, 3.528223991394043, 4.947568893432617, 6.366912841796875, 7.786257743835449, 9.205602645874023, 10.624947547912598, 12.044292449951172, 13.46363639831543, 14.882981300354004, 16.302326202392578, 17.721670150756836, 19.141014099121094, 20.560359954833984, 21.979703903198242, 23.399049758911133, 24.81839370727539, 26.23773956298828, 27.65708351135254, 29.076427459716797, 30.495773315429688, 31.915117263793945, 33.3344612121582, 34.753807067871094, 36.17314910888672, 37.59249496459961, 39.0118408203125, 40.431182861328125, 41.850528717041016, 43.269874572753906]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 18.0, 24.0, 37.0, 73.0, 140.0, 259.0, 637.0, 1571.0, 6282.0, 63350.0, 4059626.0, 53741.0, 5777.0, 1499.0, 599.0, 277.0, 137.0, 70.0, 53.0, 31.0, 19.0, 7.0, 6.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.171875, -14.552001953125, -13.93212890625, -13.312255859375, -12.6923828125, -12.072509765625, -11.45263671875, -10.832763671875, -10.212890625, -9.593017578125, -8.97314453125, -8.353271484375, -7.7333984375, -7.113525390625, -6.49365234375, -5.873779296875, -5.25390625, -4.634033203125, -4.01416015625, -3.394287109375, -2.7744140625, -2.154541015625, -1.53466796875, -0.914794921875, -0.294921875, 0.324951171875, 0.94482421875, 1.564697265625, 2.1845703125, 2.804443359375, 3.42431640625, 4.044189453125, 4.6640625, 5.283935546875, 5.90380859375, 6.523681640625, 7.1435546875, 7.763427734375, 8.38330078125, 9.003173828125, 9.623046875, 10.242919921875, 10.86279296875, 11.482666015625, 12.1025390625, 12.722412109375, 13.34228515625, 13.962158203125, 14.58203125, 15.201904296875, 15.82177734375, 16.441650390625, 17.0615234375, 17.681396484375, 18.30126953125, 18.921142578125, 19.541015625, 20.160888671875, 20.78076171875, 21.400634765625, 22.0205078125, 22.640380859375, 23.26025390625, 23.880126953125, 24.5]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 16.0, 26.0, 43.0, 61.0, 78.0, 95.0, 87.0, 136.0, 106.0, 99.0, 71.0, 63.0, 46.0, 35.0, 15.0, 14.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.42938232421875, -3.2845458984375, -3.13970947265625, -2.994873046875, -2.85003662109375, -2.7052001953125, -2.56036376953125, -2.41552734375, -2.27069091796875, -2.1258544921875, -1.98101806640625, -1.836181640625, -1.69134521484375, -1.5465087890625, -1.40167236328125, -1.2568359375, -1.11199951171875, -0.9671630859375, -0.82232666015625, -0.677490234375, -0.53265380859375, -0.3878173828125, -0.24298095703125, -0.09814453125, 0.04669189453125, 0.1915283203125, 0.33636474609375, 0.481201171875, 0.62603759765625, 0.7708740234375, 0.91571044921875, 1.060546875, 1.20538330078125, 1.3502197265625, 1.49505615234375, 1.639892578125, 1.78472900390625, 1.9295654296875, 2.07440185546875, 2.21923828125, 2.36407470703125, 2.5089111328125, 2.65374755859375, 2.798583984375, 2.94342041015625, 3.0882568359375, 3.23309326171875, 3.3779296875, 3.52276611328125, 3.6676025390625, 3.81243896484375, 3.957275390625, 4.10211181640625, 4.2469482421875, 4.39178466796875, 4.53662109375, 4.68145751953125, 4.8262939453125, 4.97113037109375, 5.115966796875, 5.26080322265625, 5.4056396484375, 5.55047607421875, 5.6953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 4.0, 10.0, 18.0, 14.0, 23.0, 35.0, 32.0, 60.0, 68.0, 117.0, 191.0, 264.0, 393.0, 673.0, 993.0, 1782.0, 3513.0, 7524.0, 18235.0, 59194.0, 555267.0, 3361143.0, 133503.0, 29582.0, 10987.0, 4828.0, 2404.0, 1296.0, 726.0, 464.0, 297.0, 192.0, 120.0, 86.0, 51.0, 43.0, 46.0, 23.0, 28.0, 15.0, 10.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.30078125, -7.08111572265625, -6.8614501953125, -6.64178466796875, -6.422119140625, -6.20245361328125, -5.9827880859375, -5.76312255859375, -5.54345703125, -5.32379150390625, -5.1041259765625, -4.88446044921875, -4.664794921875, -4.44512939453125, -4.2254638671875, -4.00579833984375, -3.7861328125, -3.56646728515625, -3.3468017578125, -3.12713623046875, -2.907470703125, -2.68780517578125, -2.4681396484375, -2.24847412109375, -2.02880859375, -1.80914306640625, -1.5894775390625, -1.36981201171875, -1.150146484375, -0.93048095703125, -0.7108154296875, -0.49114990234375, -0.271484375, -0.05181884765625, 0.1678466796875, 0.38751220703125, 0.607177734375, 0.82684326171875, 1.0465087890625, 1.26617431640625, 1.48583984375, 1.70550537109375, 1.9251708984375, 2.14483642578125, 2.364501953125, 2.58416748046875, 2.8038330078125, 3.02349853515625, 3.2431640625, 3.46282958984375, 3.6824951171875, 3.90216064453125, 4.121826171875, 4.34149169921875, 4.5611572265625, 4.78082275390625, 5.00048828125, 5.22015380859375, 5.4398193359375, 5.65948486328125, 5.879150390625, 6.09881591796875, 6.3184814453125, 6.53814697265625, 6.7578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 8.0, 14.0, 18.0, 12.0, 29.0, 42.0, 80.0, 160.0, 356.0, 1779.0, 982.0, 263.0, 118.0, 64.0, 41.0, 22.0, 10.0, 15.0, 9.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5, -4.3670654296875, -4.234130859375, -4.1011962890625, -3.96826171875, -3.8353271484375, -3.702392578125, -3.5694580078125, -3.4365234375, -3.3035888671875, -3.170654296875, -3.0377197265625, -2.90478515625, -2.7718505859375, -2.638916015625, -2.5059814453125, -2.373046875, -2.2401123046875, -2.107177734375, -1.9742431640625, -1.84130859375, -1.7083740234375, -1.575439453125, -1.4425048828125, -1.3095703125, -1.1766357421875, -1.043701171875, -0.9107666015625, -0.77783203125, -0.6448974609375, -0.511962890625, -0.3790283203125, -0.24609375, -0.1131591796875, 0.019775390625, 0.1527099609375, 0.28564453125, 0.4185791015625, 0.551513671875, 0.6844482421875, 0.8173828125, 0.9503173828125, 1.083251953125, 1.2161865234375, 1.34912109375, 1.4820556640625, 1.614990234375, 1.7479248046875, 1.880859375, 2.0137939453125, 2.146728515625, 2.2796630859375, 2.41259765625, 2.5455322265625, 2.678466796875, 2.8114013671875, 2.9443359375, 3.0772705078125, 3.210205078125, 3.3431396484375, 3.47607421875, 3.6090087890625, 3.741943359375, 3.8748779296875, 4.0078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 10.0, 15.0, 25.0, 53.0, 136.0, 205.0, 201.0, 156.0, 100.0, 39.0, 28.0, 15.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-50.06025695800781, -49.08889389038086, -48.117530822753906, -47.14617156982422, -46.174808502197266, -45.20344543457031, -44.23208236694336, -43.260719299316406, -42.28935623168945, -41.3179931640625, -40.34663009643555, -39.375267028808594, -38.403907775878906, -37.43254470825195, -36.461181640625, -35.48981857299805, -34.518455505371094, -33.54709243774414, -32.57572937011719, -31.604368209838867, -30.633005142211914, -29.661643981933594, -28.69028091430664, -27.718917846679688, -26.74755859375, -25.776195526123047, -24.804834365844727, -23.833471298217773, -22.86210823059082, -21.8907470703125, -20.919384002685547, -19.948020935058594, -18.976659774780273, -18.00529670715332, -17.033935546875, -16.062572479248047, -15.091209411621094, -14.119847297668457, -13.14848518371582, -12.177122116088867, -11.20576000213623, -10.234397888183594, -9.26303482055664, -8.291672706604004, -7.320310115814209, -6.348947525024414, -5.377585411071777, -4.406222820281982, -3.4348602294921875, -2.4634976387023926, -1.4921352863311768, -0.5207729339599609, 0.450589656829834, 1.421952247619629, 2.3933143615722656, 3.3646769523620605, 4.3360395431518555, 5.30740213394165, 6.278764724731445, 7.250126838684082, 8.221488952636719, 9.192852020263672, 10.164214134216309, 11.135576248168945, 12.106939315795898]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 8.0, 12.0, 12.0, 23.0, 25.0, 32.0, 28.0, 27.0, 47.0, 46.0, 55.0, 58.0, 61.0, 53.0, 49.0, 55.0, 52.0, 61.0, 58.0, 37.0, 36.0, 27.0, 31.0, 28.0, 15.0, 4.0, 15.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.609703063964844, -16.133255004882812, -15.656805992126465, -15.180356979370117, -14.70390796661377, -14.227458953857422, -13.75101089477539, -13.274561882019043, -12.798112869262695, -12.321663856506348, -11.845215797424316, -11.368766784667969, -10.892317771911621, -10.415868759155273, -9.939420700073242, -9.462971687316895, -8.986523628234863, -8.510074615478516, -8.033626556396484, -7.557177543640137, -7.080728530883789, -6.6042799949646, -6.12783145904541, -5.6513824462890625, -5.174933910369873, -4.698485374450684, -4.222036361694336, -3.7455878257751465, -3.269139051437378, -2.7926902770996094, -2.31624174118042, -1.8397929668426514, -1.3633451461791992, -0.8868964314460754, -0.41044771671295166, 0.06600093841552734, 0.5424497127532959, 1.0188984870910645, 1.495347023010254, 1.9717957973480225, 2.448244571685791, 2.9246933460235596, 3.401142120361328, 3.8775906562805176, 4.354039192199707, 4.830488204956055, 5.306936740875244, 5.783385276794434, 6.259834289550781, 6.736282825469971, 7.212731838226318, 7.689180374145508, 8.165629386901855, 8.642078399658203, 9.118526458740234, 9.594975471496582, 10.07142448425293, 10.547873497009277, 11.024321556091309, 11.500770568847656, 11.977219581604004, 12.453668594360352, 12.930116653442383, 13.40656566619873, 13.883013725280762]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 14.0, 13.0, 12.0, 22.0, 37.0, 45.0, 92.0, 162.0, 272.0, 556.0, 1184.0, 3425.0, 11777.0, 55651.0, 474238.0, 432769.0, 51642.0, 10939.0, 3298.0, 1216.0, 521.0, 252.0, 167.0, 81.0, 47.0, 36.0, 30.0, 22.0, 5.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.859375, -11.488525390625, -11.11767578125, -10.746826171875, -10.3759765625, -10.005126953125, -9.63427734375, -9.263427734375, -8.892578125, -8.521728515625, -8.15087890625, -7.780029296875, -7.4091796875, -7.038330078125, -6.66748046875, -6.296630859375, -5.92578125, -5.554931640625, -5.18408203125, -4.813232421875, -4.4423828125, -4.071533203125, -3.70068359375, -3.329833984375, -2.958984375, -2.588134765625, -2.21728515625, -1.846435546875, -1.4755859375, -1.104736328125, -0.73388671875, -0.363037109375, 0.0078125, 0.378662109375, 0.74951171875, 1.120361328125, 1.4912109375, 1.862060546875, 2.23291015625, 2.603759765625, 2.974609375, 3.345458984375, 3.71630859375, 4.087158203125, 4.4580078125, 4.828857421875, 5.19970703125, 5.570556640625, 5.94140625, 6.312255859375, 6.68310546875, 7.053955078125, 7.4248046875, 7.795654296875, 8.16650390625, 8.537353515625, 8.908203125, 9.279052734375, 9.64990234375, 10.020751953125, 10.3916015625, 10.762451171875, 11.13330078125, 11.504150390625, 11.875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 9.0, 15.0, 23.0, 28.0, 56.0, 45.0, 78.0, 77.0, 104.0, 84.0, 103.0, 91.0, 72.0, 57.0, 40.0, 48.0, 26.0, 21.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.552734375, -3.428863525390625, -3.30499267578125, -3.181121826171875, -3.0572509765625, -2.933380126953125, -2.80950927734375, -2.685638427734375, -2.561767578125, -2.437896728515625, -2.31402587890625, -2.190155029296875, -2.0662841796875, -1.942413330078125, -1.81854248046875, -1.694671630859375, -1.57080078125, -1.446929931640625, -1.32305908203125, -1.199188232421875, -1.0753173828125, -0.951446533203125, -0.82757568359375, -0.703704833984375, -0.579833984375, -0.455963134765625, -0.33209228515625, -0.208221435546875, -0.0843505859375, 0.039520263671875, 0.16339111328125, 0.287261962890625, 0.4111328125, 0.535003662109375, 0.65887451171875, 0.782745361328125, 0.9066162109375, 1.030487060546875, 1.15435791015625, 1.278228759765625, 1.402099609375, 1.525970458984375, 1.64984130859375, 1.773712158203125, 1.8975830078125, 2.021453857421875, 2.14532470703125, 2.269195556640625, 2.39306640625, 2.516937255859375, 2.64080810546875, 2.764678955078125, 2.8885498046875, 3.012420654296875, 3.13629150390625, 3.260162353515625, 3.384033203125, 3.507904052734375, 3.63177490234375, 3.755645751953125, 3.8795166015625, 4.003387451171875, 4.12725830078125, 4.251129150390625, 4.375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 8.0, 8.0, 9.0, 10.0, 17.0, 31.0, 38.0, 45.0, 80.0, 93.0, 155.0, 222.0, 336.0, 483.0, 776.0, 1377.0, 2440.0, 4786.0, 10353.0, 27561.0, 91672.0, 408267.0, 371257.0, 83183.0, 25292.0, 9834.0, 4464.0, 2297.0, 1265.0, 743.0, 467.0, 310.0, 202.0, 141.0, 107.0, 73.0, 42.0, 26.0, 25.0, 18.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0], "bins": [-7.6015625, -7.39019775390625, -7.1788330078125, -6.96746826171875, -6.756103515625, -6.54473876953125, -6.3333740234375, -6.12200927734375, -5.91064453125, -5.69927978515625, -5.4879150390625, -5.27655029296875, -5.065185546875, -4.85382080078125, -4.6424560546875, -4.43109130859375, -4.2197265625, -4.00836181640625, -3.7969970703125, -3.58563232421875, -3.374267578125, -3.16290283203125, -2.9515380859375, -2.74017333984375, -2.52880859375, -2.31744384765625, -2.1060791015625, -1.89471435546875, -1.683349609375, -1.47198486328125, -1.2606201171875, -1.04925537109375, -0.837890625, -0.62652587890625, -0.4151611328125, -0.20379638671875, 0.007568359375, 0.21893310546875, 0.4302978515625, 0.64166259765625, 0.85302734375, 1.06439208984375, 1.2757568359375, 1.48712158203125, 1.698486328125, 1.90985107421875, 2.1212158203125, 2.33258056640625, 2.5439453125, 2.75531005859375, 2.9666748046875, 3.17803955078125, 3.389404296875, 3.60076904296875, 3.8121337890625, 4.02349853515625, 4.23486328125, 4.44622802734375, 4.6575927734375, 4.86895751953125, 5.080322265625, 5.29168701171875, 5.5030517578125, 5.71441650390625, 5.92578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 3.0, 5.0, 3.0, 9.0, 6.0, 16.0, 15.0, 18.0, 23.0, 40.0, 38.0, 50.0, 41.0, 52.0, 51.0, 60.0, 75.0, 60.0, 83.0, 54.0, 58.0, 51.0, 39.0, 28.0, 26.0, 23.0, 18.0, 14.0, 10.0, 11.0, 9.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.0, -12.6376953125, -12.275390625, -11.9130859375, -11.55078125, -11.1884765625, -10.826171875, -10.4638671875, -10.1015625, -9.7392578125, -9.376953125, -9.0146484375, -8.65234375, -8.2900390625, -7.927734375, -7.5654296875, -7.203125, -6.8408203125, -6.478515625, -6.1162109375, -5.75390625, -5.3916015625, -5.029296875, -4.6669921875, -4.3046875, -3.9423828125, -3.580078125, -3.2177734375, -2.85546875, -2.4931640625, -2.130859375, -1.7685546875, -1.40625, -1.0439453125, -0.681640625, -0.3193359375, 0.04296875, 0.4052734375, 0.767578125, 1.1298828125, 1.4921875, 1.8544921875, 2.216796875, 2.5791015625, 2.94140625, 3.3037109375, 3.666015625, 4.0283203125, 4.390625, 4.7529296875, 5.115234375, 5.4775390625, 5.83984375, 6.2021484375, 6.564453125, 6.9267578125, 7.2890625, 7.6513671875, 8.013671875, 8.3759765625, 8.73828125, 9.1005859375, 9.462890625, 9.8251953125, 10.1875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 5.0, 13.0, 12.0, 29.0, 47.0, 112.0, 281.0, 744.0, 3983.0, 46233.0, 969078.0, 24216.0, 2812.0, 591.0, 218.0, 76.0, 46.0, 18.0, 17.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.015625, -12.6580810546875, -12.300537109375, -11.9429931640625, -11.58544921875, -11.2279052734375, -10.870361328125, -10.5128173828125, -10.1552734375, -9.7977294921875, -9.440185546875, -9.0826416015625, -8.72509765625, -8.3675537109375, -8.010009765625, -7.6524658203125, -7.294921875, -6.9373779296875, -6.579833984375, -6.2222900390625, -5.86474609375, -5.5072021484375, -5.149658203125, -4.7921142578125, -4.4345703125, -4.0770263671875, -3.719482421875, -3.3619384765625, -3.00439453125, -2.6468505859375, -2.289306640625, -1.9317626953125, -1.57421875, -1.2166748046875, -0.859130859375, -0.5015869140625, -0.14404296875, 0.2135009765625, 0.571044921875, 0.9285888671875, 1.2861328125, 1.6436767578125, 2.001220703125, 2.3587646484375, 2.71630859375, 3.0738525390625, 3.431396484375, 3.7889404296875, 4.146484375, 4.5040283203125, 4.861572265625, 5.2191162109375, 5.57666015625, 5.9342041015625, 6.291748046875, 6.6492919921875, 7.0068359375, 7.3643798828125, 7.721923828125, 8.0794677734375, 8.43701171875, 8.7945556640625, 9.152099609375, 9.5096435546875, 9.8671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 5.0, 9.0, 9.0, 14.0, 17.0, 38.0, 70.0, 204.0, 321.0, 142.0, 59.0, 34.0, 28.0, 10.0, 11.0, 7.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011072158813476562, -0.0010767504572868347, -0.0010462850332260132, -0.0010158196091651917, -0.0009853541851043701, -0.0009548887610435486, -0.000924423336982727, -0.0008939579129219055, -0.000863492488861084, -0.0008330270648002625, -0.0008025616407394409, -0.0007720962166786194, -0.0007416307926177979, -0.0007111653685569763, -0.0006806999444961548, -0.0006502345204353333, -0.0006197690963745117, -0.0005893036723136902, -0.0005588382482528687, -0.0005283728241920471, -0.0004979074001312256, -0.00046744197607040405, -0.0004369765520095825, -0.000406511127948761, -0.00037604570388793945, -0.0003455802798271179, -0.0003151148557662964, -0.00028464943170547485, -0.0002541840076446533, -0.0002237185835838318, -0.00019325315952301025, -0.00016278773546218872, -0.0001323223114013672, -0.00010185688734054565, -7.139146327972412e-05, -4.092603921890259e-05, -1.0460615158081055e-05, 2.000480890274048e-05, 5.047023296356201e-05, 8.093565702438354e-05, 0.00011140108108520508, 0.0001418665051460266, 0.00017233192920684814, 0.00020279735326766968, 0.0002332627773284912, 0.00026372820138931274, 0.0002941936254501343, 0.0003246590495109558, 0.00035512447357177734, 0.0003855898976325989, 0.0004160553216934204, 0.00044652074575424194, 0.0004769861698150635, 0.000507451593875885, 0.0005379170179367065, 0.0005683824419975281, 0.0005988478660583496, 0.0006293132901191711, 0.0006597787141799927, 0.0006902441382408142, 0.0007207095623016357, 0.0007511749863624573, 0.0007816404104232788, 0.0008121058344841003, 0.0008425712585449219]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 14.0, 34.0, 44.0, 107.0, 182.0, 460.0, 1655.0, 8774.0, 168461.0, 847432.0, 17632.0, 2582.0, 664.0, 249.0, 116.0, 72.0, 32.0, 19.0, 8.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.615478515625, -14.19970703125, -13.783935546875, -13.3681640625, -12.952392578125, -12.53662109375, -12.120849609375, -11.705078125, -11.289306640625, -10.87353515625, -10.457763671875, -10.0419921875, -9.626220703125, -9.21044921875, -8.794677734375, -8.37890625, -7.963134765625, -7.54736328125, -7.131591796875, -6.7158203125, -6.300048828125, -5.88427734375, -5.468505859375, -5.052734375, -4.636962890625, -4.22119140625, -3.805419921875, -3.3896484375, -2.973876953125, -2.55810546875, -2.142333984375, -1.7265625, -1.310791015625, -0.89501953125, -0.479248046875, -0.0634765625, 0.352294921875, 0.76806640625, 1.183837890625, 1.599609375, 2.015380859375, 2.43115234375, 2.846923828125, 3.2626953125, 3.678466796875, 4.09423828125, 4.510009765625, 4.92578125, 5.341552734375, 5.75732421875, 6.173095703125, 6.5888671875, 7.004638671875, 7.42041015625, 7.836181640625, 8.251953125, 8.667724609375, 9.08349609375, 9.499267578125, 9.9150390625, 10.330810546875, 10.74658203125, 11.162353515625, 11.578125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 9.0, 20.0, 55.0, 138.0, 474.0, 177.0, 56.0, 39.0, 8.0, 14.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8203125, -13.408935546875, -12.99755859375, -12.586181640625, -12.1748046875, -11.763427734375, -11.35205078125, -10.940673828125, -10.529296875, -10.117919921875, -9.70654296875, -9.295166015625, -8.8837890625, -8.472412109375, -8.06103515625, -7.649658203125, -7.23828125, -6.826904296875, -6.41552734375, -6.004150390625, -5.5927734375, -5.181396484375, -4.77001953125, -4.358642578125, -3.947265625, -3.535888671875, -3.12451171875, -2.713134765625, -2.3017578125, -1.890380859375, -1.47900390625, -1.067626953125, -0.65625, -0.244873046875, 0.16650390625, 0.577880859375, 0.9892578125, 1.400634765625, 1.81201171875, 2.223388671875, 2.634765625, 3.046142578125, 3.45751953125, 3.868896484375, 4.2802734375, 4.691650390625, 5.10302734375, 5.514404296875, 5.92578125, 6.337158203125, 6.74853515625, 7.159912109375, 7.5712890625, 7.982666015625, 8.39404296875, 8.805419921875, 9.216796875, 9.628173828125, 10.03955078125, 10.450927734375, 10.8623046875, 11.273681640625, 11.68505859375, 12.096435546875, 12.5078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 15.0, 29.0, 75.0, 189.0, 325.0, 210.0, 92.0, 33.0, 13.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.35951232910156, -64.50629425048828, -60.653072357177734, -56.79985046386719, -52.946632385253906, -49.09341049194336, -45.24018859863281, -41.38697052001953, -37.53375244140625, -33.6805305480957, -29.827312469482422, -25.974090576171875, -22.120872497558594, -18.267650604248047, -14.414430618286133, -10.561210632324219, -6.707988739013672, -2.8547685146331787, 0.9984517097473145, 4.851672172546387, 8.7048921585083, 12.558113098144531, 16.411333084106445, 20.26455307006836, 24.117773056030273, 27.970993041992188, 31.8242130279541, 35.677433013916016, 39.53065490722656, 43.383872985839844, 47.23709487915039, 51.09031677246094, 54.94353485107422, 58.796756744384766, 62.64997482299805, 66.5031967163086, 70.35641479492188, 74.20964050292969, 78.06285858154297, 81.91607666015625, 85.76929473876953, 89.62251281738281, 93.47573852539062, 97.3289566040039, 101.18217468261719, 105.035400390625, 108.88861846923828, 112.74183654785156, 116.59506225585938, 120.44828033447266, 124.30150604248047, 128.15472412109375, 132.00794982910156, 135.8611602783203, 139.71438598632812, 143.56759643554688, 147.4208221435547, 151.2740478515625, 155.12725830078125, 158.98048400878906, 162.83370971679688, 166.68692016601562, 170.54014587402344, 174.39337158203125, 178.24658203125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 6.0, 4.0, 6.0, 7.0, 10.0, 7.0, 12.0, 16.0, 18.0, 24.0, 22.0, 19.0, 44.0, 19.0, 40.0, 28.0, 35.0, 39.0, 32.0, 52.0, 46.0, 40.0, 43.0, 37.0, 41.0, 47.0, 40.0, 43.0, 34.0, 31.0, 27.0, 18.0, 25.0, 12.0, 22.0, 11.0, 12.0, 10.0, 4.0, 5.0, 3.0, 4.0, 9.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.158470153808594, -36.744163513183594, -35.32985305786133, -33.91554641723633, -32.50123596191406, -31.086929321289062, -29.67262077331543, -28.258312225341797, -26.844005584716797, -25.429697036743164, -24.01538848876953, -22.60108184814453, -21.1867733001709, -19.772464752197266, -18.358156204223633, -16.94384765625, -15.529539108276367, -14.115230560302734, -12.700922966003418, -11.286614418029785, -9.872306823730469, -8.457998275756836, -7.043689727783203, -5.629382133483887, -4.215073585510254, -2.8007655143737793, -1.3864572048187256, 0.027851104736328125, 1.4421591758728027, 2.8564672470092773, 4.27077579498291, 5.685083389282227, 7.099391937255859, 8.513700485229492, 9.928008079528809, 11.342316627502441, 12.756624221801758, 14.17093276977539, 15.585241317749023, 16.999549865722656, 18.413856506347656, 19.82816505432129, 21.242473602294922, 22.656780242919922, 24.071088790893555, 25.485397338867188, 26.89970588684082, 28.314014434814453, 29.728322982788086, 31.14263153076172, 32.55693817138672, 33.971248626708984, 35.385555267333984, 36.79986572265625, 38.21417236328125, 39.62847900390625, 41.042789459228516, 42.457096099853516, 43.87140655517578, 45.28571319580078, 46.70002365112305, 48.11433029174805, 49.52864074707031, 50.94294738769531, 52.35725402832031]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 7.0, 10.0, 21.0, 33.0, 37.0, 86.0, 183.0, 338.0, 854.0, 2798.0, 14828.0, 3051303.0, 1105716.0, 13772.0, 2650.0, 891.0, 338.0, 166.0, 95.0, 58.0, 38.0, 20.0, 9.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0078125, -14.4071044921875, -13.806396484375, -13.2056884765625, -12.60498046875, -12.0042724609375, -11.403564453125, -10.8028564453125, -10.2021484375, -9.6014404296875, -9.000732421875, -8.4000244140625, -7.79931640625, -7.1986083984375, -6.597900390625, -5.9971923828125, -5.396484375, -4.7957763671875, -4.195068359375, -3.5943603515625, -2.99365234375, -2.3929443359375, -1.792236328125, -1.1915283203125, -0.5908203125, 0.0098876953125, 0.610595703125, 1.2113037109375, 1.81201171875, 2.4127197265625, 3.013427734375, 3.6141357421875, 4.21484375, 4.8155517578125, 5.416259765625, 6.0169677734375, 6.61767578125, 7.2183837890625, 7.819091796875, 8.4197998046875, 9.0205078125, 9.6212158203125, 10.221923828125, 10.8226318359375, 11.42333984375, 12.0240478515625, 12.624755859375, 13.2254638671875, 13.826171875, 14.4268798828125, 15.027587890625, 15.6282958984375, 16.22900390625, 16.8297119140625, 17.430419921875, 18.0311279296875, 18.6318359375, 19.2325439453125, 19.833251953125, 20.4339599609375, 21.03466796875, 21.6353759765625, 22.236083984375, 22.8367919921875, 23.4375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 13.0, 10.0, 25.0, 40.0, 44.0, 55.0, 68.0, 86.0, 94.0, 96.0, 90.0, 93.0, 78.0, 54.0, 42.0, 29.0, 34.0, 24.0, 7.0, 10.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.440826416015625, -3.30157470703125, -3.162322998046875, -3.0230712890625, -2.883819580078125, -2.74456787109375, -2.605316162109375, -2.466064453125, -2.326812744140625, -2.18756103515625, -2.048309326171875, -1.9090576171875, -1.769805908203125, -1.63055419921875, -1.491302490234375, -1.35205078125, -1.212799072265625, -1.07354736328125, -0.934295654296875, -0.7950439453125, -0.655792236328125, -0.51654052734375, -0.377288818359375, -0.238037109375, -0.098785400390625, 0.04046630859375, 0.179718017578125, 0.3189697265625, 0.458221435546875, 0.59747314453125, 0.736724853515625, 0.8759765625, 1.015228271484375, 1.15447998046875, 1.293731689453125, 1.4329833984375, 1.572235107421875, 1.71148681640625, 1.850738525390625, 1.989990234375, 2.129241943359375, 2.26849365234375, 2.407745361328125, 2.5469970703125, 2.686248779296875, 2.82550048828125, 2.964752197265625, 3.10400390625, 3.243255615234375, 3.38250732421875, 3.521759033203125, 3.6610107421875, 3.800262451171875, 3.93951416015625, 4.078765869140625, 4.218017578125, 4.357269287109375, 4.49652099609375, 4.635772705078125, 4.7750244140625, 4.914276123046875, 5.05352783203125, 5.192779541015625, 5.33203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 7.0, 12.0, 18.0, 43.0, 60.0, 108.0, 109.0, 217.0, 371.0, 813.0, 1840.0, 5211.0, 21864.0, 321444.0, 3784361.0, 44812.0, 8287.0, 2538.0, 956.0, 518.0, 268.0, 132.0, 105.0, 72.0, 43.0, 15.0, 14.0, 17.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.40625, -10.970703125, -10.53515625, -10.099609375, -9.6640625, -9.228515625, -8.79296875, -8.357421875, -7.921875, -7.486328125, -7.05078125, -6.615234375, -6.1796875, -5.744140625, -5.30859375, -4.873046875, -4.4375, -4.001953125, -3.56640625, -3.130859375, -2.6953125, -2.259765625, -1.82421875, -1.388671875, -0.953125, -0.517578125, -0.08203125, 0.353515625, 0.7890625, 1.224609375, 1.66015625, 2.095703125, 2.53125, 2.966796875, 3.40234375, 3.837890625, 4.2734375, 4.708984375, 5.14453125, 5.580078125, 6.015625, 6.451171875, 6.88671875, 7.322265625, 7.7578125, 8.193359375, 8.62890625, 9.064453125, 9.5, 9.935546875, 10.37109375, 10.806640625, 11.2421875, 11.677734375, 12.11328125, 12.548828125, 12.984375, 13.419921875, 13.85546875, 14.291015625, 14.7265625, 15.162109375, 15.59765625, 16.033203125, 16.46875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 0.0, 0.0, 4.0, 6.0, 5.0, 8.0, 18.0, 31.0, 64.0, 109.0, 536.0, 2831.0, 289.0, 87.0, 40.0, 17.0, 11.0, 8.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.9072265625, -3.705078125, -3.5029296875, -3.30078125, -3.0986328125, -2.896484375, -2.6943359375, -2.4921875, -2.2900390625, -2.087890625, -1.8857421875, -1.68359375, -1.4814453125, -1.279296875, -1.0771484375, -0.875, -0.6728515625, -0.470703125, -0.2685546875, -0.06640625, 0.1357421875, 0.337890625, 0.5400390625, 0.7421875, 0.9443359375, 1.146484375, 1.3486328125, 1.55078125, 1.7529296875, 1.955078125, 2.1572265625, 2.359375, 2.5615234375, 2.763671875, 2.9658203125, 3.16796875, 3.3701171875, 3.572265625, 3.7744140625, 3.9765625, 4.1787109375, 4.380859375, 4.5830078125, 4.78515625, 4.9873046875, 5.189453125, 5.3916015625, 5.59375, 5.7958984375, 5.998046875, 6.2001953125, 6.40234375, 6.6044921875, 6.806640625, 7.0087890625, 7.2109375, 7.4130859375, 7.615234375, 7.8173828125, 8.01953125, 8.2216796875, 8.423828125, 8.6259765625, 8.828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 16.0, 21.0, 20.0, 55.0, 108.0, 192.0, 198.0, 196.0, 91.0, 57.0, 24.0, 7.0, 8.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.190452575683594, -40.322509765625, -39.454566955566406, -38.58662414550781, -37.71868133544922, -36.850738525390625, -35.98279571533203, -35.11484909057617, -34.24690628051758, -33.378963470458984, -32.51102066040039, -31.643077850341797, -30.77513313293457, -29.907190322875977, -29.039247512817383, -28.17130470275879, -27.303361892700195, -26.4354190826416, -25.567476272583008, -24.69953155517578, -23.831588745117188, -22.963645935058594, -22.095703125, -21.227760314941406, -20.359817504882812, -19.49187469482422, -18.623931884765625, -17.75598907470703, -16.888044357299805, -16.02010154724121, -15.152158737182617, -14.284215927124023, -13.416272163391113, -12.54832935333252, -11.68038558959961, -10.812442779541016, -9.944499969482422, -9.076556205749512, -8.208613395690918, -7.340670108795166, -6.472726821899414, -5.604783535003662, -4.73684024810791, -3.8688974380493164, -3.0009541511535645, -2.1330108642578125, -1.2650680541992188, -0.3971247673034668, 0.47081851959228516, 1.3387616872787476, 2.20670485496521, 3.074647903442383, 3.9425911903381348, 4.810534477233887, 5.6784772872924805, 6.546420574188232, 7.414363861083984, 8.282306671142578, 9.150250434875488, 10.018193244934082, 10.886137008666992, 11.754079818725586, 12.62202262878418, 13.489965438842773, 14.357909202575684]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 13.0, 2.0, 9.0, 11.0, 13.0, 21.0, 19.0, 25.0, 25.0, 28.0, 24.0, 30.0, 40.0, 38.0, 28.0, 37.0, 46.0, 53.0, 40.0, 48.0, 44.0, 34.0, 61.0, 30.0, 41.0, 35.0, 28.0, 33.0, 27.0, 18.0, 15.0, 10.0, 17.0, 14.0, 9.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.52735424041748, -10.2219877243042, -9.916621208190918, -9.611254692077637, -9.305888175964355, -9.000521659851074, -8.695155143737793, -8.389788627624512, -8.08442211151123, -7.779055595397949, -7.473689079284668, -7.168322563171387, -6.8629560470581055, -6.557589530944824, -6.252223014831543, -5.946856498718262, -5.6414899826049805, -5.336123466491699, -5.030756950378418, -4.725390434265137, -4.4200239181518555, -4.114657402038574, -3.809290885925293, -3.5039243698120117, -3.1985578536987305, -2.893191337585449, -2.587824821472168, -2.2824583053588867, -1.9770917892456055, -1.6717252731323242, -1.366358757019043, -1.0609922409057617, -0.7556266784667969, -0.4502601623535156, -0.14489364624023438, 0.16047286987304688, 0.4658393859863281, 0.7712059020996094, 1.0765724182128906, 1.3819389343261719, 1.6873054504394531, 1.9926719665527344, 2.2980384826660156, 2.603404998779297, 2.908771514892578, 3.2141380310058594, 3.5195045471191406, 3.824871063232422, 4.130237579345703, 4.435604095458984, 4.740970611572266, 5.046337127685547, 5.351703643798828, 5.657070159912109, 5.962436676025391, 6.267803192138672, 6.573169708251953, 6.878536224365234, 7.183902740478516, 7.489269256591797, 7.794635772705078, 8.10000228881836, 8.40536880493164, 8.710735321044922, 9.016101837158203]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 9.0, 6.0, 10.0, 12.0, 15.0, 23.0, 45.0, 58.0, 87.0, 197.0, 329.0, 662.0, 1987.0, 7388.0, 31288.0, 191055.0, 646358.0, 136267.0, 23936.0, 5871.0, 1642.0, 575.0, 289.0, 146.0, 101.0, 59.0, 34.0, 43.0, 17.0, 13.0, 8.0, 12.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5, -9.076171875, -8.65234375, -8.228515625, -7.8046875, -7.380859375, -6.95703125, -6.533203125, -6.109375, -5.685546875, -5.26171875, -4.837890625, -4.4140625, -3.990234375, -3.56640625, -3.142578125, -2.71875, -2.294921875, -1.87109375, -1.447265625, -1.0234375, -0.599609375, -0.17578125, 0.248046875, 0.671875, 1.095703125, 1.51953125, 1.943359375, 2.3671875, 2.791015625, 3.21484375, 3.638671875, 4.0625, 4.486328125, 4.91015625, 5.333984375, 5.7578125, 6.181640625, 6.60546875, 7.029296875, 7.453125, 7.876953125, 8.30078125, 8.724609375, 9.1484375, 9.572265625, 9.99609375, 10.419921875, 10.84375, 11.267578125, 11.69140625, 12.115234375, 12.5390625, 12.962890625, 13.38671875, 13.810546875, 14.234375, 14.658203125, 15.08203125, 15.505859375, 15.9296875, 16.353515625, 16.77734375, 17.201171875, 17.625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 15.0, 28.0, 37.0, 50.0, 70.0, 92.0, 93.0, 103.0, 97.0, 93.0, 92.0, 64.0, 45.0, 31.0, 38.0, 29.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.806640625, -3.655059814453125, -3.50347900390625, -3.351898193359375, -3.2003173828125, -3.048736572265625, -2.89715576171875, -2.745574951171875, -2.593994140625, -2.442413330078125, -2.29083251953125, -2.139251708984375, -1.9876708984375, -1.836090087890625, -1.68450927734375, -1.532928466796875, -1.38134765625, -1.229766845703125, -1.07818603515625, -0.926605224609375, -0.7750244140625, -0.623443603515625, -0.47186279296875, -0.320281982421875, -0.168701171875, -0.017120361328125, 0.13446044921875, 0.286041259765625, 0.4376220703125, 0.589202880859375, 0.74078369140625, 0.892364501953125, 1.0439453125, 1.195526123046875, 1.34710693359375, 1.498687744140625, 1.6502685546875, 1.801849365234375, 1.95343017578125, 2.105010986328125, 2.256591796875, 2.408172607421875, 2.55975341796875, 2.711334228515625, 2.8629150390625, 3.014495849609375, 3.16607666015625, 3.317657470703125, 3.46923828125, 3.620819091796875, 3.77239990234375, 3.923980712890625, 4.0755615234375, 4.227142333984375, 4.37872314453125, 4.530303955078125, 4.681884765625, 4.833465576171875, 4.98504638671875, 5.136627197265625, 5.2882080078125, 5.439788818359375, 5.59136962890625, 5.742950439453125, 5.89453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 5.0, 8.0, 6.0, 15.0, 20.0, 26.0, 45.0, 58.0, 101.0, 176.0, 290.0, 540.0, 1119.0, 2164.0, 5041.0, 12309.0, 36063.0, 132088.0, 505809.0, 257075.0, 62460.0, 19617.0, 7209.0, 3167.0, 1475.0, 734.0, 394.0, 206.0, 113.0, 76.0, 50.0, 34.0, 21.0, 13.0, 11.0, 8.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0390625, -7.78564453125, -7.5322265625, -7.27880859375, -7.025390625, -6.77197265625, -6.5185546875, -6.26513671875, -6.01171875, -5.75830078125, -5.5048828125, -5.25146484375, -4.998046875, -4.74462890625, -4.4912109375, -4.23779296875, -3.984375, -3.73095703125, -3.4775390625, -3.22412109375, -2.970703125, -2.71728515625, -2.4638671875, -2.21044921875, -1.95703125, -1.70361328125, -1.4501953125, -1.19677734375, -0.943359375, -0.68994140625, -0.4365234375, -0.18310546875, 0.0703125, 0.32373046875, 0.5771484375, 0.83056640625, 1.083984375, 1.33740234375, 1.5908203125, 1.84423828125, 2.09765625, 2.35107421875, 2.6044921875, 2.85791015625, 3.111328125, 3.36474609375, 3.6181640625, 3.87158203125, 4.125, 4.37841796875, 4.6318359375, 4.88525390625, 5.138671875, 5.39208984375, 5.6455078125, 5.89892578125, 6.15234375, 6.40576171875, 6.6591796875, 6.91259765625, 7.166015625, 7.41943359375, 7.6728515625, 7.92626953125, 8.1796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 8.0, 6.0, 3.0, 7.0, 11.0, 8.0, 18.0, 16.0, 18.0, 29.0, 31.0, 23.0, 41.0, 39.0, 45.0, 53.0, 68.0, 50.0, 57.0, 74.0, 53.0, 52.0, 47.0, 37.0, 40.0, 30.0, 24.0, 31.0, 21.0, 13.0, 13.0, 10.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.5078125, -9.1640625, -8.8203125, -8.4765625, -8.1328125, -7.7890625, -7.4453125, -7.1015625, -6.7578125, -6.4140625, -6.0703125, -5.7265625, -5.3828125, -5.0390625, -4.6953125, -4.3515625, -4.0078125, -3.6640625, -3.3203125, -2.9765625, -2.6328125, -2.2890625, -1.9453125, -1.6015625, -1.2578125, -0.9140625, -0.5703125, -0.2265625, 0.1171875, 0.4609375, 0.8046875, 1.1484375, 1.4921875, 1.8359375, 2.1796875, 2.5234375, 2.8671875, 3.2109375, 3.5546875, 3.8984375, 4.2421875, 4.5859375, 4.9296875, 5.2734375, 5.6171875, 5.9609375, 6.3046875, 6.6484375, 6.9921875, 7.3359375, 7.6796875, 8.0234375, 8.3671875, 8.7109375, 9.0546875, 9.3984375, 9.7421875, 10.0859375, 10.4296875, 10.7734375, 11.1171875, 11.4609375, 11.8046875, 12.1484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 8.0, 20.0, 30.0, 40.0, 83.0, 148.0, 324.0, 735.0, 2175.0, 7620.0, 41364.0, 643054.0, 317585.0, 26951.0, 5557.0, 1672.0, 592.0, 296.0, 121.0, 61.0, 39.0, 23.0, 13.0, 11.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.76751708984375, -4.6131591796875, -4.45880126953125, -4.304443359375, -4.15008544921875, -3.9957275390625, -3.84136962890625, -3.68701171875, -3.53265380859375, -3.3782958984375, -3.22393798828125, -3.069580078125, -2.91522216796875, -2.7608642578125, -2.60650634765625, -2.4521484375, -2.29779052734375, -2.1434326171875, -1.98907470703125, -1.834716796875, -1.68035888671875, -1.5260009765625, -1.37164306640625, -1.21728515625, -1.06292724609375, -0.9085693359375, -0.75421142578125, -0.599853515625, -0.44549560546875, -0.2911376953125, -0.13677978515625, 0.017578125, 0.17193603515625, 0.3262939453125, 0.48065185546875, 0.635009765625, 0.78936767578125, 0.9437255859375, 1.09808349609375, 1.25244140625, 1.40679931640625, 1.5611572265625, 1.71551513671875, 1.869873046875, 2.02423095703125, 2.1785888671875, 2.33294677734375, 2.4873046875, 2.64166259765625, 2.7960205078125, 2.95037841796875, 3.104736328125, 3.25909423828125, 3.4134521484375, 3.56781005859375, 3.72216796875, 3.87652587890625, 4.0308837890625, 4.18524169921875, 4.339599609375, 4.49395751953125, 4.6483154296875, 4.80267333984375, 4.95703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 5.0, 11.0, 7.0, 15.0, 23.0, 36.0, 48.0, 114.0, 242.0, 247.0, 80.0, 45.0, 37.0, 18.0, 17.0, 11.0, 12.0, 6.0, 5.0, 5.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009126663208007812, -0.0008872896432876587, -0.0008619129657745361, -0.0008365362882614136, -0.000811159610748291, -0.0007857829332351685, -0.0007604062557220459, -0.0007350295782089233, -0.0007096529006958008, -0.0006842762231826782, -0.0006588995456695557, -0.0006335228681564331, -0.0006081461906433105, -0.000582769513130188, -0.0005573928356170654, -0.0005320161581039429, -0.0005066394805908203, -0.00048126280307769775, -0.0004558861255645752, -0.00043050944805145264, -0.0004051327705383301, -0.0003797560930252075, -0.00035437941551208496, -0.0003290027379989624, -0.00030362606048583984, -0.0002782493829727173, -0.0002528727054595947, -0.00022749602794647217, -0.0002021193504333496, -0.00017674267292022705, -0.0001513659954071045, -0.00012598931789398193, -0.00010061264038085938, -7.523596286773682e-05, -4.985928535461426e-05, -2.44826078414917e-05, 8.940696716308594e-07, 2.6270747184753418e-05, 5.1647424697875977e-05, 7.702410221099854e-05, 0.0001024007797241211, 0.00012777745723724365, 0.0001531541347503662, 0.00017853081226348877, 0.00020390748977661133, 0.0002292841672897339, 0.00025466084480285645, 0.000280037522315979, 0.00030541419982910156, 0.0003307908773422241, 0.0003561675548553467, 0.00038154423236846924, 0.0004069209098815918, 0.00043229758739471436, 0.0004576742649078369, 0.00048305094242095947, 0.000508427619934082, 0.0005338042974472046, 0.0005591809749603271, 0.0005845576524734497, 0.0006099343299865723, 0.0006353110074996948, 0.0006606876850128174, 0.0006860643625259399, 0.0007114410400390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 2.0, 7.0, 8.0, 16.0, 20.0, 29.0, 44.0, 67.0, 97.0, 153.0, 275.0, 404.0, 710.0, 1354.0, 2462.0, 5618.0, 14110.0, 48171.0, 411275.0, 483716.0, 53015.0, 15240.0, 5786.0, 2597.0, 1380.0, 794.0, 459.0, 270.0, 162.0, 105.0, 68.0, 47.0, 25.0, 19.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5703125, -3.44732666015625, -3.3243408203125, -3.20135498046875, -3.078369140625, -2.95538330078125, -2.8323974609375, -2.70941162109375, -2.58642578125, -2.46343994140625, -2.3404541015625, -2.21746826171875, -2.094482421875, -1.97149658203125, -1.8485107421875, -1.72552490234375, -1.6025390625, -1.47955322265625, -1.3565673828125, -1.23358154296875, -1.110595703125, -0.98760986328125, -0.8646240234375, -0.74163818359375, -0.61865234375, -0.49566650390625, -0.3726806640625, -0.24969482421875, -0.126708984375, -0.00372314453125, 0.1192626953125, 0.24224853515625, 0.365234375, 0.48822021484375, 0.6112060546875, 0.73419189453125, 0.857177734375, 0.98016357421875, 1.1031494140625, 1.22613525390625, 1.34912109375, 1.47210693359375, 1.5950927734375, 1.71807861328125, 1.841064453125, 1.96405029296875, 2.0870361328125, 2.21002197265625, 2.3330078125, 2.45599365234375, 2.5789794921875, 2.70196533203125, 2.824951171875, 2.94793701171875, 3.0709228515625, 3.19390869140625, 3.31689453125, 3.43988037109375, 3.5628662109375, 3.68585205078125, 3.808837890625, 3.93182373046875, 4.0548095703125, 4.17779541015625, 4.30078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 6.0, 9.0, 10.0, 15.0, 26.0, 33.0, 44.0, 78.0, 161.0, 221.0, 173.0, 71.0, 46.0, 17.0, 24.0, 17.0, 11.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.075439453125, -5.90869140625, -5.741943359375, -5.5751953125, -5.408447265625, -5.24169921875, -5.074951171875, -4.908203125, -4.741455078125, -4.57470703125, -4.407958984375, -4.2412109375, -4.074462890625, -3.90771484375, -3.740966796875, -3.57421875, -3.407470703125, -3.24072265625, -3.073974609375, -2.9072265625, -2.740478515625, -2.57373046875, -2.406982421875, -2.240234375, -2.073486328125, -1.90673828125, -1.739990234375, -1.5732421875, -1.406494140625, -1.23974609375, -1.072998046875, -0.90625, -0.739501953125, -0.57275390625, -0.406005859375, -0.2392578125, -0.072509765625, 0.09423828125, 0.260986328125, 0.427734375, 0.594482421875, 0.76123046875, 0.927978515625, 1.0947265625, 1.261474609375, 1.42822265625, 1.594970703125, 1.76171875, 1.928466796875, 2.09521484375, 2.261962890625, 2.4287109375, 2.595458984375, 2.76220703125, 2.928955078125, 3.095703125, 3.262451171875, 3.42919921875, 3.595947265625, 3.7626953125, 3.929443359375, 4.09619140625, 4.262939453125, 4.4296875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 16.0, 17.0, 18.0, 51.0, 102.0, 152.0, 201.0, 164.0, 127.0, 65.0, 30.0, 20.0, 13.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.76167297363281, -34.56254959106445, -32.363426208496094, -30.16429901123047, -27.96517562866211, -25.76605224609375, -23.566926956176758, -21.367801666259766, -19.168678283691406, -16.969554901123047, -14.770429611206055, -12.571305274963379, -10.372180938720703, -8.173056602478027, -5.973932266235352, -3.774807929992676, -1.57568359375, 0.6234407424926758, 2.8225650787353516, 5.021689414978027, 7.220813751220703, 9.419938087463379, 11.619062423706055, 13.81818675994873, 16.017311096191406, 18.216434478759766, 20.415559768676758, 22.61468505859375, 24.81380844116211, 27.01293182373047, 29.21205711364746, 31.411182403564453, 33.61029815673828, 35.80942153930664, 38.008544921875, 40.207672119140625, 42.406795501708984, 44.605918884277344, 46.80504608154297, 49.00416946411133, 51.20329284667969, 53.40241622924805, 55.601539611816406, 57.80066680908203, 59.99979019165039, 62.19891357421875, 64.39804077148438, 66.59716033935547, 68.7962875366211, 70.99541473388672, 73.19453430175781, 75.39366149902344, 77.59278869628906, 79.79190826416016, 81.99103546142578, 84.19015502929688, 86.3892822265625, 88.58840942382812, 90.78752899169922, 92.98665618896484, 95.18577575683594, 97.38490295410156, 99.58403015136719, 101.78314971923828, 103.9822769165039]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 2.0, 4.0, 10.0, 14.0, 21.0, 19.0, 14.0, 23.0, 19.0, 24.0, 27.0, 21.0, 30.0, 31.0, 30.0, 40.0, 43.0, 40.0, 44.0, 39.0, 51.0, 39.0, 35.0, 27.0, 30.0, 36.0, 31.0, 31.0, 23.0, 29.0, 22.0, 14.0, 17.0, 20.0, 20.0, 11.0, 13.0, 9.0, 12.0, 5.0, 9.0, 10.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.0693359375, -40.86619186401367, -39.663047790527344, -38.459903717041016, -37.25675964355469, -36.05361557006836, -34.85047149658203, -33.64732360839844, -32.444183349609375, -31.241039276123047, -30.03789520263672, -28.83475112915039, -27.631607055664062, -26.428462982177734, -25.225317001342773, -24.022172927856445, -22.819026947021484, -21.615882873535156, -20.412738800048828, -19.2095947265625, -18.006450653076172, -16.803306579589844, -15.600160598754883, -14.397016525268555, -13.193872451782227, -11.990728378295898, -10.78758430480957, -9.584439277648926, -8.381295204162598, -7.1781511306762695, -5.975006580352783, -4.771862030029297, -3.5687179565429688, -2.3655736446380615, -1.1624293327331543, 0.04071497917175293, 1.2438592910766602, 2.4470033645629883, 3.6501479148864746, 4.853292465209961, 6.056436538696289, 7.259580612182617, 8.462724685668945, 9.66586971282959, 10.869013786315918, 12.072157859802246, 13.27530288696289, 14.478446960449219, 15.681591033935547, 16.884735107421875, 18.087879180908203, 19.29102325439453, 20.49416732788086, 21.697311401367188, 22.90045738220215, 24.103601455688477, 25.306745529174805, 26.509889602661133, 27.71303367614746, 28.91617774963379, 30.11932373046875, 31.322467803955078, 32.525611877441406, 33.728755950927734, 34.93190002441406]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 15.0, 12.0, 35.0, 36.0, 64.0, 126.0, 222.0, 507.0, 1437.0, 5724.0, 65795.0, 4094487.0, 21084.0, 3070.0, 841.0, 362.0, 196.0, 113.0, 57.0, 40.0, 19.0, 14.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.1875, -32.88818359375, -31.5888671875, -30.28955078125, -28.990234375, -27.69091796875, -26.3916015625, -25.09228515625, -23.79296875, -22.49365234375, -21.1943359375, -19.89501953125, -18.595703125, -17.29638671875, -15.9970703125, -14.69775390625, -13.3984375, -12.09912109375, -10.7998046875, -9.50048828125, -8.201171875, -6.90185546875, -5.6025390625, -4.30322265625, -3.00390625, -1.70458984375, -0.4052734375, 0.89404296875, 2.193359375, 3.49267578125, 4.7919921875, 6.09130859375, 7.390625, 8.68994140625, 9.9892578125, 11.28857421875, 12.587890625, 13.88720703125, 15.1865234375, 16.48583984375, 17.78515625, 19.08447265625, 20.3837890625, 21.68310546875, 22.982421875, 24.28173828125, 25.5810546875, 26.88037109375, 28.1796875, 29.47900390625, 30.7783203125, 32.07763671875, 33.376953125, 34.67626953125, 35.9755859375, 37.27490234375, 38.57421875, 39.87353515625, 41.1728515625, 42.47216796875, 43.771484375, 45.07080078125, 46.3701171875, 47.66943359375, 48.96875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 10.0, 13.0, 25.0, 33.0, 42.0, 56.0, 60.0, 85.0, 82.0, 77.0, 84.0, 83.0, 75.0, 69.0, 50.0, 44.0, 34.0, 36.0, 17.0, 14.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.625, -3.486083984375, -3.34716796875, -3.208251953125, -3.0693359375, -2.930419921875, -2.79150390625, -2.652587890625, -2.513671875, -2.374755859375, -2.23583984375, -2.096923828125, -1.9580078125, -1.819091796875, -1.68017578125, -1.541259765625, -1.40234375, -1.263427734375, -1.12451171875, -0.985595703125, -0.8466796875, -0.707763671875, -0.56884765625, -0.429931640625, -0.291015625, -0.152099609375, -0.01318359375, 0.125732421875, 0.2646484375, 0.403564453125, 0.54248046875, 0.681396484375, 0.8203125, 0.959228515625, 1.09814453125, 1.237060546875, 1.3759765625, 1.514892578125, 1.65380859375, 1.792724609375, 1.931640625, 2.070556640625, 2.20947265625, 2.348388671875, 2.4873046875, 2.626220703125, 2.76513671875, 2.904052734375, 3.04296875, 3.181884765625, 3.32080078125, 3.459716796875, 3.5986328125, 3.737548828125, 3.87646484375, 4.015380859375, 4.154296875, 4.293212890625, 4.43212890625, 4.571044921875, 4.7099609375, 4.848876953125, 4.98779296875, 5.126708984375, 5.265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 5.0, 13.0, 18.0, 19.0, 30.0, 30.0, 49.0, 75.0, 115.0, 230.0, 500.0, 1251.0, 3646.0, 13124.0, 84562.0, 3978944.0, 91798.0, 13706.0, 3825.0, 1191.0, 527.0, 232.0, 129.0, 74.0, 56.0, 30.0, 25.0, 17.0, 6.0, 6.0, 7.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.21875, -20.621337890625, -20.02392578125, -19.426513671875, -18.8291015625, -18.231689453125, -17.63427734375, -17.036865234375, -16.439453125, -15.842041015625, -15.24462890625, -14.647216796875, -14.0498046875, -13.452392578125, -12.85498046875, -12.257568359375, -11.66015625, -11.062744140625, -10.46533203125, -9.867919921875, -9.2705078125, -8.673095703125, -8.07568359375, -7.478271484375, -6.880859375, -6.283447265625, -5.68603515625, -5.088623046875, -4.4912109375, -3.893798828125, -3.29638671875, -2.698974609375, -2.1015625, -1.504150390625, -0.90673828125, -0.309326171875, 0.2880859375, 0.885498046875, 1.48291015625, 2.080322265625, 2.677734375, 3.275146484375, 3.87255859375, 4.469970703125, 5.0673828125, 5.664794921875, 6.26220703125, 6.859619140625, 7.45703125, 8.054443359375, 8.65185546875, 9.249267578125, 9.8466796875, 10.444091796875, 11.04150390625, 11.638916015625, 12.236328125, 12.833740234375, 13.43115234375, 14.028564453125, 14.6259765625, 15.223388671875, 15.82080078125, 16.418212890625, 17.015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 9.0, 15.0, 30.0, 55.0, 132.0, 1312.0, 2284.0, 111.0, 51.0, 26.0, 12.0, 10.0, 7.0, 3.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.46875, -12.185546875, -11.90234375, -11.619140625, -11.3359375, -11.052734375, -10.76953125, -10.486328125, -10.203125, -9.919921875, -9.63671875, -9.353515625, -9.0703125, -8.787109375, -8.50390625, -8.220703125, -7.9375, -7.654296875, -7.37109375, -7.087890625, -6.8046875, -6.521484375, -6.23828125, -5.955078125, -5.671875, -5.388671875, -5.10546875, -4.822265625, -4.5390625, -4.255859375, -3.97265625, -3.689453125, -3.40625, -3.123046875, -2.83984375, -2.556640625, -2.2734375, -1.990234375, -1.70703125, -1.423828125, -1.140625, -0.857421875, -0.57421875, -0.291015625, -0.0078125, 0.275390625, 0.55859375, 0.841796875, 1.125, 1.408203125, 1.69140625, 1.974609375, 2.2578125, 2.541015625, 2.82421875, 3.107421875, 3.390625, 3.673828125, 3.95703125, 4.240234375, 4.5234375, 4.806640625, 5.08984375, 5.373046875, 5.65625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 10.0, 14.0, 26.0, 44.0, 90.0, 160.0, 232.0, 230.0, 104.0, 55.0, 21.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.45697784423828, -49.33268737792969, -48.208396911621094, -47.0841064453125, -45.959815979003906, -44.83552551269531, -43.71123504638672, -42.58694839477539, -41.4626579284668, -40.3383674621582, -39.21407699584961, -38.089786529541016, -36.96549606323242, -35.841209411621094, -34.7169189453125, -33.592628479003906, -32.46833801269531, -31.34404754638672, -30.219757080078125, -29.09546661376953, -27.97117805480957, -26.846887588500977, -25.722597122192383, -24.59830665588379, -23.474014282226562, -22.34972381591797, -21.225433349609375, -20.10114288330078, -18.97685432434082, -17.852563858032227, -16.728273391723633, -15.603982925415039, -14.479692459106445, -13.355401992797852, -12.231112480163574, -11.10682201385498, -9.982532501220703, -8.85824203491211, -7.733951568603516, -6.60966157913208, -5.4853715896606445, -4.361081600189209, -3.2367913722991943, -2.1125011444091797, -0.9882111549377441, 0.1360788345336914, 1.2603693008422852, 2.3846592903137207, 3.5089492797851562, 4.633239269256592, 5.757529258728027, 6.881819725036621, 8.006109237670898, 9.130399703979492, 10.254690170288086, 11.37898063659668, 12.503270149230957, 13.62756061553955, 14.751850128173828, 15.876140594482422, 17.000431060791016, 18.12472152709961, 19.249011993408203, 20.373300552368164, 21.497591018676758]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 10.0, 14.0, 20.0, 15.0, 27.0, 32.0, 35.0, 40.0, 36.0, 43.0, 46.0, 71.0, 51.0, 61.0, 53.0, 57.0, 59.0, 50.0, 58.0, 42.0, 42.0, 27.0, 21.0, 22.0, 14.0, 14.0, 9.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.091163635253906, -15.572766304016113, -15.05436897277832, -14.535971641540527, -14.017574310302734, -13.499177932739258, -12.980780601501465, -12.462383270263672, -11.943985939025879, -11.425588607788086, -10.907191276550293, -10.3887939453125, -9.870397567749023, -9.351999282836914, -8.833602905273438, -8.315205574035645, -7.796808242797852, -7.278410911560059, -6.760013580322266, -6.241616725921631, -5.723219394683838, -5.204822063446045, -4.68642520904541, -4.168027877807617, -3.649630546569824, -3.1312332153320312, -2.6128361225128174, -2.0944390296936035, -1.5760416984558105, -1.0576443672180176, -0.5392472743988037, -0.020850181579589844, 0.4975471496582031, 1.0159443616867065, 1.53434157371521, 2.052738666534424, 2.571135997772217, 3.0895333290100098, 3.6079304218292236, 4.1263275146484375, 4.6447248458862305, 5.163122177124023, 5.681519508361816, 6.199916362762451, 6.718313694000244, 7.236711025238037, 7.755107879638672, 8.273505210876465, 8.791902542114258, 9.31029987335205, 9.828697204589844, 10.347094535827637, 10.86549186706543, 11.383888244628906, 11.9022855758667, 12.420682907104492, 12.939080238342285, 13.457477569580078, 13.975874900817871, 14.494272232055664, 15.01266860961914, 15.53106689453125, 16.049463272094727, 16.567859649658203, 17.086257934570312]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 1.0, 6.0, 5.0, 5.0, 9.0, 8.0, 14.0, 17.0, 35.0, 67.0, 129.0, 288.0, 534.0, 1110.0, 2814.0, 8106.0, 34628.0, 277297.0, 624401.0, 77738.0, 13988.0, 4158.0, 1697.0, 711.0, 373.0, 167.0, 94.0, 49.0, 32.0, 20.0, 22.0, 11.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.349609375, -17.76171875, -17.173828125, -16.5859375, -15.998046875, -15.41015625, -14.822265625, -14.234375, -13.646484375, -13.05859375, -12.470703125, -11.8828125, -11.294921875, -10.70703125, -10.119140625, -9.53125, -8.943359375, -8.35546875, -7.767578125, -7.1796875, -6.591796875, -6.00390625, -5.416015625, -4.828125, -4.240234375, -3.65234375, -3.064453125, -2.4765625, -1.888671875, -1.30078125, -0.712890625, -0.125, 0.462890625, 1.05078125, 1.638671875, 2.2265625, 2.814453125, 3.40234375, 3.990234375, 4.578125, 5.166015625, 5.75390625, 6.341796875, 6.9296875, 7.517578125, 8.10546875, 8.693359375, 9.28125, 9.869140625, 10.45703125, 11.044921875, 11.6328125, 12.220703125, 12.80859375, 13.396484375, 13.984375, 14.572265625, 15.16015625, 15.748046875, 16.3359375, 16.923828125, 17.51171875, 18.099609375, 18.6875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 15.0, 14.0, 20.0, 31.0, 37.0, 64.0, 56.0, 76.0, 82.0, 77.0, 80.0, 91.0, 67.0, 71.0, 57.0, 45.0, 37.0, 24.0, 30.0, 14.0, 7.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.38031005859375, -3.2410888671875, -3.10186767578125, -2.962646484375, -2.82342529296875, -2.6842041015625, -2.54498291015625, -2.40576171875, -2.26654052734375, -2.1273193359375, -1.98809814453125, -1.848876953125, -1.70965576171875, -1.5704345703125, -1.43121337890625, -1.2919921875, -1.15277099609375, -1.0135498046875, -0.87432861328125, -0.735107421875, -0.59588623046875, -0.4566650390625, -0.31744384765625, -0.17822265625, -0.03900146484375, 0.1002197265625, 0.23944091796875, 0.378662109375, 0.51788330078125, 0.6571044921875, 0.79632568359375, 0.935546875, 1.07476806640625, 1.2139892578125, 1.35321044921875, 1.492431640625, 1.63165283203125, 1.7708740234375, 1.91009521484375, 2.04931640625, 2.18853759765625, 2.3277587890625, 2.46697998046875, 2.606201171875, 2.74542236328125, 2.8846435546875, 3.02386474609375, 3.1630859375, 3.30230712890625, 3.4415283203125, 3.58074951171875, 3.719970703125, 3.85919189453125, 3.9984130859375, 4.13763427734375, 4.27685546875, 4.41607666015625, 4.5552978515625, 4.69451904296875, 4.833740234375, 4.97296142578125, 5.1121826171875, 5.25140380859375, 5.390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 8.0, 12.0, 22.0, 35.0, 49.0, 72.0, 117.0, 189.0, 320.0, 602.0, 1199.0, 2543.0, 5775.0, 16417.0, 60752.0, 364859.0, 485012.0, 78431.0, 19703.0, 6848.0, 2774.0, 1286.0, 619.0, 351.0, 183.0, 132.0, 88.0, 51.0, 23.0, 26.0, 10.0, 11.0, 4.0, 10.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.0230712890625, -8.663330078125, -8.3035888671875, -7.94384765625, -7.5841064453125, -7.224365234375, -6.8646240234375, -6.5048828125, -6.1451416015625, -5.785400390625, -5.4256591796875, -5.06591796875, -4.7061767578125, -4.346435546875, -3.9866943359375, -3.626953125, -3.2672119140625, -2.907470703125, -2.5477294921875, -2.18798828125, -1.8282470703125, -1.468505859375, -1.1087646484375, -0.7490234375, -0.3892822265625, -0.029541015625, 0.3302001953125, 0.68994140625, 1.0496826171875, 1.409423828125, 1.7691650390625, 2.12890625, 2.4886474609375, 2.848388671875, 3.2081298828125, 3.56787109375, 3.9276123046875, 4.287353515625, 4.6470947265625, 5.0068359375, 5.3665771484375, 5.726318359375, 6.0860595703125, 6.44580078125, 6.8055419921875, 7.165283203125, 7.5250244140625, 7.884765625, 8.2445068359375, 8.604248046875, 8.9639892578125, 9.32373046875, 9.6834716796875, 10.043212890625, 10.4029541015625, 10.7626953125, 11.1224365234375, 11.482177734375, 11.8419189453125, 12.20166015625, 12.5614013671875, 12.921142578125, 13.2808837890625, 13.640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 8.0, 15.0, 16.0, 23.0, 21.0, 24.0, 32.0, 31.0, 41.0, 50.0, 57.0, 63.0, 75.0, 66.0, 71.0, 67.0, 49.0, 61.0, 45.0, 37.0, 31.0, 23.0, 21.0, 8.0, 11.0, 6.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-20.4375, -19.9178466796875, -19.398193359375, -18.8785400390625, -18.35888671875, -17.8392333984375, -17.319580078125, -16.7999267578125, -16.2802734375, -15.7606201171875, -15.240966796875, -14.7213134765625, -14.20166015625, -13.6820068359375, -13.162353515625, -12.6427001953125, -12.123046875, -11.6033935546875, -11.083740234375, -10.5640869140625, -10.04443359375, -9.5247802734375, -9.005126953125, -8.4854736328125, -7.9658203125, -7.4461669921875, -6.926513671875, -6.4068603515625, -5.88720703125, -5.3675537109375, -4.847900390625, -4.3282470703125, -3.80859375, -3.2889404296875, -2.769287109375, -2.2496337890625, -1.72998046875, -1.2103271484375, -0.690673828125, -0.1710205078125, 0.3486328125, 0.8682861328125, 1.387939453125, 1.9075927734375, 2.42724609375, 2.9468994140625, 3.466552734375, 3.9862060546875, 4.505859375, 5.0255126953125, 5.545166015625, 6.0648193359375, 6.58447265625, 7.1041259765625, 7.623779296875, 8.1434326171875, 8.6630859375, 9.1827392578125, 9.702392578125, 10.2220458984375, 10.74169921875, 11.2613525390625, 11.781005859375, 12.3006591796875, 12.8203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 12.0, 15.0, 25.0, 32.0, 47.0, 48.0, 72.0, 131.0, 201.0, 403.0, 895.0, 2565.0, 10222.0, 84859.0, 888666.0, 49094.0, 7604.0, 2000.0, 764.0, 353.0, 191.0, 103.0, 64.0, 47.0, 30.0, 21.0, 23.0, 17.0, 12.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.140625, -15.67138671875, -15.2021484375, -14.73291015625, -14.263671875, -13.79443359375, -13.3251953125, -12.85595703125, -12.38671875, -11.91748046875, -11.4482421875, -10.97900390625, -10.509765625, -10.04052734375, -9.5712890625, -9.10205078125, -8.6328125, -8.16357421875, -7.6943359375, -7.22509765625, -6.755859375, -6.28662109375, -5.8173828125, -5.34814453125, -4.87890625, -4.40966796875, -3.9404296875, -3.47119140625, -3.001953125, -2.53271484375, -2.0634765625, -1.59423828125, -1.125, -0.65576171875, -0.1865234375, 0.28271484375, 0.751953125, 1.22119140625, 1.6904296875, 2.15966796875, 2.62890625, 3.09814453125, 3.5673828125, 4.03662109375, 4.505859375, 4.97509765625, 5.4443359375, 5.91357421875, 6.3828125, 6.85205078125, 7.3212890625, 7.79052734375, 8.259765625, 8.72900390625, 9.1982421875, 9.66748046875, 10.13671875, 10.60595703125, 11.0751953125, 11.54443359375, 12.013671875, 12.48291015625, 12.9521484375, 13.42138671875, 13.890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 7.0, 6.0, 13.0, 17.0, 30.0, 50.0, 46.0, 109.0, 230.0, 212.0, 88.0, 58.0, 46.0, 28.0, 16.0, 10.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008792877197265625, -0.0008303225040435791, -0.0007813572883605957, -0.0007323920726776123, -0.0006834268569946289, -0.0006344616413116455, -0.0005854964256286621, -0.0005365312099456787, -0.0004875659942626953, -0.0004386007785797119, -0.0003896355628967285, -0.0003406703472137451, -0.0002917051315307617, -0.00024273991584777832, -0.00019377470016479492, -0.00014480948448181152, -9.584426879882812e-05, -4.6879053115844727e-05, 2.086162567138672e-06, 5.105137825012207e-05, 0.00010001659393310547, 0.00014898180961608887, 0.00019794702529907227, 0.00024691224098205566, 0.00029587745666503906, 0.00034484267234802246, 0.00039380788803100586, 0.00044277310371398926, 0.0004917383193969727, 0.0005407035350799561, 0.0005896687507629395, 0.0006386339664459229, 0.0006875991821289062, 0.0007365643978118896, 0.000785529613494873, 0.0008344948291778564, 0.0008834600448608398, 0.0009324252605438232, 0.0009813904762268066, 0.00103035569190979, 0.0010793209075927734, 0.0011282861232757568, 0.0011772513389587402, 0.0012262165546417236, 0.001275181770324707, 0.0013241469860076904, 0.0013731122016906738, 0.0014220774173736572, 0.0014710426330566406, 0.001520007848739624, 0.0015689730644226074, 0.0016179382801055908, 0.0016669034957885742, 0.0017158687114715576, 0.001764833927154541, 0.0018137991428375244, 0.0018627643585205078, 0.0019117295742034912, 0.0019606947898864746, 0.002009660005569458, 0.0020586252212524414, 0.002107590436935425, 0.002156555652618408, 0.0022055208683013916, 0.002254486083984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 5.0, 7.0, 8.0, 13.0, 17.0, 48.0, 62.0, 125.0, 233.0, 517.0, 1231.0, 2922.0, 9237.0, 45317.0, 795543.0, 166127.0, 18964.0, 4898.0, 1709.0, 779.0, 350.0, 202.0, 90.0, 52.0, 42.0, 14.0, 10.0, 7.0, 2.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-18.203125, -17.7564697265625, -17.309814453125, -16.8631591796875, -16.41650390625, -15.9698486328125, -15.523193359375, -15.0765380859375, -14.6298828125, -14.1832275390625, -13.736572265625, -13.2899169921875, -12.84326171875, -12.3966064453125, -11.949951171875, -11.5032958984375, -11.056640625, -10.6099853515625, -10.163330078125, -9.7166748046875, -9.27001953125, -8.8233642578125, -8.376708984375, -7.9300537109375, -7.4833984375, -7.0367431640625, -6.590087890625, -6.1434326171875, -5.69677734375, -5.2501220703125, -4.803466796875, -4.3568115234375, -3.91015625, -3.4635009765625, -3.016845703125, -2.5701904296875, -2.12353515625, -1.6768798828125, -1.230224609375, -0.7835693359375, -0.3369140625, 0.1097412109375, 0.556396484375, 1.0030517578125, 1.44970703125, 1.8963623046875, 2.343017578125, 2.7896728515625, 3.236328125, 3.6829833984375, 4.129638671875, 4.5762939453125, 5.02294921875, 5.4696044921875, 5.916259765625, 6.3629150390625, 6.8095703125, 7.2562255859375, 7.702880859375, 8.1495361328125, 8.59619140625, 9.0428466796875, 9.489501953125, 9.9361572265625, 10.3828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 12.0, 8.0, 16.0, 17.0, 35.0, 63.0, 109.0, 269.0, 197.0, 97.0, 49.0, 28.0, 22.0, 14.0, 9.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.515625, -16.0423583984375, -15.569091796875, -15.0958251953125, -14.62255859375, -14.1492919921875, -13.676025390625, -13.2027587890625, -12.7294921875, -12.2562255859375, -11.782958984375, -11.3096923828125, -10.83642578125, -10.3631591796875, -9.889892578125, -9.4166259765625, -8.943359375, -8.4700927734375, -7.996826171875, -7.5235595703125, -7.05029296875, -6.5770263671875, -6.103759765625, -5.6304931640625, -5.1572265625, -4.6839599609375, -4.210693359375, -3.7374267578125, -3.26416015625, -2.7908935546875, -2.317626953125, -1.8443603515625, -1.37109375, -0.8978271484375, -0.424560546875, 0.0487060546875, 0.52197265625, 0.9952392578125, 1.468505859375, 1.9417724609375, 2.4150390625, 2.8883056640625, 3.361572265625, 3.8348388671875, 4.30810546875, 4.7813720703125, 5.254638671875, 5.7279052734375, 6.201171875, 6.6744384765625, 7.147705078125, 7.6209716796875, 8.09423828125, 8.5675048828125, 9.040771484375, 9.5140380859375, 9.9873046875, 10.4605712890625, 10.933837890625, 11.4071044921875, 11.88037109375, 12.3536376953125, 12.826904296875, 13.3001708984375, 13.7734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 10.0, 11.0, 25.0, 27.0, 47.0, 82.0, 115.0, 141.0, 137.0, 135.0, 74.0, 79.0, 33.0, 32.0, 18.0, 16.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.53411865234375, -126.13600158691406, -122.73788452148438, -119.33977508544922, -115.94165802001953, -112.54354095458984, -109.14543151855469, -105.747314453125, -102.34919738769531, -98.95108032226562, -95.55296325683594, -92.15485382080078, -88.7567367553711, -85.3586196899414, -81.96051025390625, -78.56239318847656, -75.16427612304688, -71.76615905761719, -68.3680419921875, -64.96993255615234, -61.571815490722656, -58.17369842529297, -54.77558517456055, -51.377471923828125, -47.97935485839844, -44.58123779296875, -41.18312454223633, -37.785011291503906, -34.38689422607422, -30.988779067993164, -27.59066390991211, -24.192548751831055, -20.79443359375, -17.396318435668945, -13.99820327758789, -10.600088119506836, -7.201972961425781, -3.8038578033447266, -0.4057426452636719, 2.992372512817383, 6.3904876708984375, 9.788602828979492, 13.186717987060547, 16.5848331451416, 19.982948303222656, 23.38106346130371, 26.779178619384766, 30.17729377746582, 33.575408935546875, 36.97352600097656, 40.371639251708984, 43.769752502441406, 47.167869567871094, 50.56598663330078, 53.9640998840332, 57.362213134765625, 60.76033020019531, 64.158447265625, 67.55656433105469, 70.95467376708984, 74.35279083251953, 77.75090789794922, 81.14901733398438, 84.54713439941406, 87.94525146484375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 8.0, 9.0, 14.0, 13.0, 19.0, 20.0, 34.0, 24.0, 32.0, 36.0, 55.0, 53.0, 47.0, 51.0, 71.0, 49.0, 59.0, 53.0, 57.0, 42.0, 49.0, 42.0, 36.0, 27.0, 20.0, 19.0, 16.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.43598937988281, -84.06910705566406, -80.70222473144531, -77.33534240722656, -73.96846008300781, -70.60157775878906, -67.23469543457031, -63.867820739746094, -60.500938415527344, -57.134056091308594, -53.767173767089844, -50.400291442871094, -47.03341293334961, -43.66653060913086, -40.29964828491211, -36.932769775390625, -33.56588363647461, -30.19900131225586, -26.832120895385742, -23.465238571166992, -20.098358154296875, -16.731475830078125, -13.364593505859375, -9.997713088989258, -6.630830764770508, -3.263949155807495, 0.10293245315551758, 3.4698143005371094, 6.836695671081543, 10.203577041625977, 13.570459365844727, 16.937339782714844, 20.304222106933594, 23.671104431152344, 27.03798484802246, 30.40486717224121, 33.77174758911133, 37.13862991333008, 40.50551223754883, 43.87239074707031, 47.23927307128906, 50.60615539550781, 53.97303771972656, 57.33992004394531, 60.7067985534668, 64.07368469238281, 67.44056701660156, 70.80744171142578, 74.17433166503906, 77.54121398925781, 80.90809631347656, 84.27497863769531, 87.64186096191406, 91.00874328613281, 94.37562561035156, 97.74250030517578, 101.10938262939453, 104.47626495361328, 107.84314727783203, 111.21002960205078, 114.57691192626953, 117.94378662109375, 121.3106689453125, 124.67755126953125, 128.04443359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 6.0, 11.0, 14.0, 30.0, 34.0, 47.0, 86.0, 130.0, 201.0, 317.0, 584.0, 1162.0, 2741.0, 9951.0, 70775.0, 3984229.0, 105639.0, 12277.0, 3235.0, 1231.0, 607.0, 348.0, 195.0, 138.0, 80.0, 74.0, 40.0, 26.0, 14.0, 16.0, 8.0, 5.0, 2.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.546875, -18.751220703125, -17.95556640625, -17.159912109375, -16.3642578125, -15.568603515625, -14.77294921875, -13.977294921875, -13.181640625, -12.385986328125, -11.59033203125, -10.794677734375, -9.9990234375, -9.203369140625, -8.40771484375, -7.612060546875, -6.81640625, -6.020751953125, -5.22509765625, -4.429443359375, -3.6337890625, -2.838134765625, -2.04248046875, -1.246826171875, -0.451171875, 0.344482421875, 1.14013671875, 1.935791015625, 2.7314453125, 3.527099609375, 4.32275390625, 5.118408203125, 5.9140625, 6.709716796875, 7.50537109375, 8.301025390625, 9.0966796875, 9.892333984375, 10.68798828125, 11.483642578125, 12.279296875, 13.074951171875, 13.87060546875, 14.666259765625, 15.4619140625, 16.257568359375, 17.05322265625, 17.848876953125, 18.64453125, 19.440185546875, 20.23583984375, 21.031494140625, 21.8271484375, 22.622802734375, 23.41845703125, 24.214111328125, 25.009765625, 25.805419921875, 26.60107421875, 27.396728515625, 28.1923828125, 28.988037109375, 29.78369140625, 30.579345703125, 31.375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 10.0, 13.0, 21.0, 19.0, 20.0, 40.0, 27.0, 41.0, 33.0, 48.0, 49.0, 53.0, 80.0, 62.0, 66.0, 68.0, 59.0, 48.0, 56.0, 31.0, 31.0, 23.0, 17.0, 26.0, 18.0, 10.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.425506591796875, -3.29046630859375, -3.155426025390625, -3.0203857421875, -2.885345458984375, -2.75030517578125, -2.615264892578125, -2.480224609375, -2.345184326171875, -2.21014404296875, -2.075103759765625, -1.9400634765625, -1.805023193359375, -1.66998291015625, -1.534942626953125, -1.39990234375, -1.264862060546875, -1.12982177734375, -0.994781494140625, -0.8597412109375, -0.724700927734375, -0.58966064453125, -0.454620361328125, -0.319580078125, -0.184539794921875, -0.04949951171875, 0.085540771484375, 0.2205810546875, 0.355621337890625, 0.49066162109375, 0.625701904296875, 0.7607421875, 0.895782470703125, 1.03082275390625, 1.165863037109375, 1.3009033203125, 1.435943603515625, 1.57098388671875, 1.706024169921875, 1.841064453125, 1.976104736328125, 2.11114501953125, 2.246185302734375, 2.3812255859375, 2.516265869140625, 2.65130615234375, 2.786346435546875, 2.92138671875, 3.056427001953125, 3.19146728515625, 3.326507568359375, 3.4615478515625, 3.596588134765625, 3.73162841796875, 3.866668701171875, 4.001708984375, 4.136749267578125, 4.27178955078125, 4.406829833984375, 4.5418701171875, 4.676910400390625, 4.81195068359375, 4.946990966796875, 5.08203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 8.0, 10.0, 22.0, 22.0, 58.0, 87.0, 138.0, 274.0, 561.0, 1185.0, 2870.0, 9100.0, 40450.0, 616122.0, 3436778.0, 67298.0, 12542.0, 3860.0, 1448.0, 678.0, 343.0, 192.0, 98.0, 49.0, 36.0, 19.0, 14.0, 6.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.734375, -21.11572265625, -20.4970703125, -19.87841796875, -19.259765625, -18.64111328125, -18.0224609375, -17.40380859375, -16.78515625, -16.16650390625, -15.5478515625, -14.92919921875, -14.310546875, -13.69189453125, -13.0732421875, -12.45458984375, -11.8359375, -11.21728515625, -10.5986328125, -9.97998046875, -9.361328125, -8.74267578125, -8.1240234375, -7.50537109375, -6.88671875, -6.26806640625, -5.6494140625, -5.03076171875, -4.412109375, -3.79345703125, -3.1748046875, -2.55615234375, -1.9375, -1.31884765625, -0.7001953125, -0.08154296875, 0.537109375, 1.15576171875, 1.7744140625, 2.39306640625, 3.01171875, 3.63037109375, 4.2490234375, 4.86767578125, 5.486328125, 6.10498046875, 6.7236328125, 7.34228515625, 7.9609375, 8.57958984375, 9.1982421875, 9.81689453125, 10.435546875, 11.05419921875, 11.6728515625, 12.29150390625, 12.91015625, 13.52880859375, 14.1474609375, 14.76611328125, 15.384765625, 16.00341796875, 16.6220703125, 17.24072265625, 17.859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 13.0, 18.0, 26.0, 42.0, 59.0, 119.0, 290.0, 2277.0, 776.0, 194.0, 92.0, 49.0, 31.0, 23.0, 17.0, 10.0, 10.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.078125, -12.7410888671875, -12.404052734375, -12.0670166015625, -11.72998046875, -11.3929443359375, -11.055908203125, -10.7188720703125, -10.3818359375, -10.0447998046875, -9.707763671875, -9.3707275390625, -9.03369140625, -8.6966552734375, -8.359619140625, -8.0225830078125, -7.685546875, -7.3485107421875, -7.011474609375, -6.6744384765625, -6.33740234375, -6.0003662109375, -5.663330078125, -5.3262939453125, -4.9892578125, -4.6522216796875, -4.315185546875, -3.9781494140625, -3.64111328125, -3.3040771484375, -2.967041015625, -2.6300048828125, -2.29296875, -1.9559326171875, -1.618896484375, -1.2818603515625, -0.94482421875, -0.6077880859375, -0.270751953125, 0.0662841796875, 0.4033203125, 0.7403564453125, 1.077392578125, 1.4144287109375, 1.75146484375, 2.0885009765625, 2.425537109375, 2.7625732421875, 3.099609375, 3.4366455078125, 3.773681640625, 4.1107177734375, 4.44775390625, 4.7847900390625, 5.121826171875, 5.4588623046875, 5.7958984375, 6.1329345703125, 6.469970703125, 6.8070068359375, 7.14404296875, 7.4810791015625, 7.818115234375, 8.1551513671875, 8.4921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 24.0, 64.0, 159.0, 239.0, 246.0, 133.0, 68.0, 29.0, 20.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.79466247558594, -68.25247955322266, -65.71029663085938, -63.16810989379883, -60.62592315673828, -58.083740234375, -55.54155731201172, -52.99937438964844, -50.45718765258789, -47.91500473022461, -45.37281799316406, -42.83063507080078, -40.2884521484375, -37.74626541137695, -35.20408248901367, -32.661895751953125, -30.119712829589844, -27.57752799987793, -25.035343170166016, -22.493160247802734, -19.95097541809082, -17.408790588378906, -14.866606712341309, -12.324422836303711, -9.782238006591797, -7.240053653717041, -4.697869300842285, -2.1556849479675293, 0.38649940490722656, 2.9286842346191406, 5.470868110656738, 8.013051986694336, 10.555229187011719, 13.097414016723633, 15.63959789276123, 18.181781768798828, 20.723966598510742, 23.266151428222656, 25.808334350585938, 28.35051918029785, 30.892704010009766, 33.43488693237305, 35.977073669433594, 38.519256591796875, 41.061439514160156, 43.6036262512207, 46.145809173583984, 48.68799591064453, 51.23017883300781, 53.772361755371094, 56.31454849243164, 58.85673141479492, 61.39891815185547, 63.94110107421875, 66.48328399658203, 69.02546691894531, 71.56765747070312, 74.1098403930664, 76.65202331542969, 79.1942138671875, 81.73639678955078, 84.27857971191406, 86.82076263427734, 89.36294555664062, 91.9051284790039]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 9.0, 13.0, 14.0, 19.0, 14.0, 26.0, 20.0, 27.0, 34.0, 40.0, 38.0, 39.0, 48.0, 54.0, 33.0, 43.0, 60.0, 47.0, 46.0, 44.0, 45.0, 42.0, 38.0, 33.0, 27.0, 19.0, 24.0, 18.0, 9.0, 12.0, 16.0, 5.0, 10.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-23.774707794189453, -22.93950080871582, -22.104293823242188, -21.269084930419922, -20.43387794494629, -19.598670959472656, -18.763463973999023, -17.92825698852539, -17.093050003051758, -16.257843017578125, -15.422635078430176, -14.587428092956543, -13.75222110748291, -12.917013168334961, -12.081806182861328, -11.246599197387695, -10.411391258239746, -9.576184272766113, -8.740976333618164, -7.905769348144531, -7.070562362670898, -6.235354900360107, -5.400147438049316, -4.564940452575684, -3.7297329902648926, -2.8945257663726807, -2.0593185424804688, -1.2241110801696777, -0.3889038562774658, 0.4463033676147461, 1.281510829925537, 2.11671781539917, 2.951925277709961, 3.787132501602173, 4.622339725494385, 5.457547187805176, 6.292754173278809, 7.1279616355896, 7.963169097900391, 8.798376083374023, 9.633583068847656, 10.468790054321289, 11.303997993469238, 12.139204978942871, 12.974411964416504, 13.809619903564453, 14.644826889038086, 15.480033874511719, 16.315242767333984, 17.150449752807617, 17.98565673828125, 18.820865631103516, 19.65607261657715, 20.49127960205078, 21.326486587524414, 22.161693572998047, 22.99690055847168, 23.832107543945312, 24.667314529418945, 25.502521514892578, 26.337730407714844, 27.172937393188477, 28.00814437866211, 28.843351364135742, 29.678558349609375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 18.0, 25.0, 44.0, 66.0, 107.0, 170.0, 258.0, 431.0, 680.0, 1281.0, 2470.0, 5155.0, 12159.0, 31342.0, 94671.0, 292989.0, 383402.0, 146120.0, 46266.0, 16824.0, 6938.0, 3263.0, 1647.0, 869.0, 495.0, 300.0, 197.0, 129.0, 71.0, 45.0, 29.0, 21.0, 18.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.40185546875, -8.0927734375, -7.78369140625, -7.474609375, -7.16552734375, -6.8564453125, -6.54736328125, -6.23828125, -5.92919921875, -5.6201171875, -5.31103515625, -5.001953125, -4.69287109375, -4.3837890625, -4.07470703125, -3.765625, -3.45654296875, -3.1474609375, -2.83837890625, -2.529296875, -2.22021484375, -1.9111328125, -1.60205078125, -1.29296875, -0.98388671875, -0.6748046875, -0.36572265625, -0.056640625, 0.25244140625, 0.5615234375, 0.87060546875, 1.1796875, 1.48876953125, 1.7978515625, 2.10693359375, 2.416015625, 2.72509765625, 3.0341796875, 3.34326171875, 3.65234375, 3.96142578125, 4.2705078125, 4.57958984375, 4.888671875, 5.19775390625, 5.5068359375, 5.81591796875, 6.125, 6.43408203125, 6.7431640625, 7.05224609375, 7.361328125, 7.67041015625, 7.9794921875, 8.28857421875, 8.59765625, 8.90673828125, 9.2158203125, 9.52490234375, 9.833984375, 10.14306640625, 10.4521484375, 10.76123046875, 11.0703125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 4.0, 12.0, 8.0, 20.0, 19.0, 21.0, 22.0, 26.0, 30.0, 35.0, 42.0, 54.0, 34.0, 41.0, 61.0, 56.0, 69.0, 63.0, 44.0, 48.0, 39.0, 42.0, 36.0, 31.0, 20.0, 29.0, 15.0, 21.0, 11.0, 11.0, 2.0, 6.0, 11.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.107513427734375, -2.98260498046875, -2.857696533203125, -2.7327880859375, -2.607879638671875, -2.48297119140625, -2.358062744140625, -2.233154296875, -2.108245849609375, -1.98333740234375, -1.858428955078125, -1.7335205078125, -1.608612060546875, -1.48370361328125, -1.358795166015625, -1.23388671875, -1.108978271484375, -0.98406982421875, -0.859161376953125, -0.7342529296875, -0.609344482421875, -0.48443603515625, -0.359527587890625, -0.234619140625, -0.109710693359375, 0.01519775390625, 0.140106201171875, 0.2650146484375, 0.389923095703125, 0.51483154296875, 0.639739990234375, 0.7646484375, 0.889556884765625, 1.01446533203125, 1.139373779296875, 1.2642822265625, 1.389190673828125, 1.51409912109375, 1.639007568359375, 1.763916015625, 1.888824462890625, 2.01373291015625, 2.138641357421875, 2.2635498046875, 2.388458251953125, 2.51336669921875, 2.638275146484375, 2.76318359375, 2.888092041015625, 3.01300048828125, 3.137908935546875, 3.2628173828125, 3.387725830078125, 3.51263427734375, 3.637542724609375, 3.762451171875, 3.887359619140625, 4.01226806640625, 4.137176513671875, 4.2620849609375, 4.386993408203125, 4.51190185546875, 4.636810302734375, 4.76171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 5.0, 8.0, 8.0, 8.0, 18.0, 17.0, 32.0, 49.0, 82.0, 160.0, 298.0, 638.0, 1364.0, 3659.0, 11269.0, 47120.0, 295498.0, 561518.0, 97285.0, 19964.0, 5780.0, 2049.0, 832.0, 407.0, 182.0, 102.0, 63.0, 37.0, 31.0, 16.0, 11.0, 15.0, 4.0, 9.0, 5.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.21875, -15.66357421875, -15.1083984375, -14.55322265625, -13.998046875, -13.44287109375, -12.8876953125, -12.33251953125, -11.77734375, -11.22216796875, -10.6669921875, -10.11181640625, -9.556640625, -9.00146484375, -8.4462890625, -7.89111328125, -7.3359375, -6.78076171875, -6.2255859375, -5.67041015625, -5.115234375, -4.56005859375, -4.0048828125, -3.44970703125, -2.89453125, -2.33935546875, -1.7841796875, -1.22900390625, -0.673828125, -0.11865234375, 0.4365234375, 0.99169921875, 1.546875, 2.10205078125, 2.6572265625, 3.21240234375, 3.767578125, 4.32275390625, 4.8779296875, 5.43310546875, 5.98828125, 6.54345703125, 7.0986328125, 7.65380859375, 8.208984375, 8.76416015625, 9.3193359375, 9.87451171875, 10.4296875, 10.98486328125, 11.5400390625, 12.09521484375, 12.650390625, 13.20556640625, 13.7607421875, 14.31591796875, 14.87109375, 15.42626953125, 15.9814453125, 16.53662109375, 17.091796875, 17.64697265625, 18.2021484375, 18.75732421875, 19.3125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 10.0, 5.0, 7.0, 8.0, 9.0, 22.0, 17.0, 18.0, 24.0, 28.0, 25.0, 32.0, 49.0, 44.0, 47.0, 60.0, 51.0, 56.0, 51.0, 83.0, 61.0, 36.0, 35.0, 37.0, 30.0, 39.0, 16.0, 22.0, 18.0, 15.0, 10.0, 12.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.171875, -24.321044921875, -23.47021484375, -22.619384765625, -21.7685546875, -20.917724609375, -20.06689453125, -19.216064453125, -18.365234375, -17.514404296875, -16.66357421875, -15.812744140625, -14.9619140625, -14.111083984375, -13.26025390625, -12.409423828125, -11.55859375, -10.707763671875, -9.85693359375, -9.006103515625, -8.1552734375, -7.304443359375, -6.45361328125, -5.602783203125, -4.751953125, -3.901123046875, -3.05029296875, -2.199462890625, -1.3486328125, -0.497802734375, 0.35302734375, 1.203857421875, 2.0546875, 2.905517578125, 3.75634765625, 4.607177734375, 5.4580078125, 6.308837890625, 7.15966796875, 8.010498046875, 8.861328125, 9.712158203125, 10.56298828125, 11.413818359375, 12.2646484375, 13.115478515625, 13.96630859375, 14.817138671875, 15.66796875, 16.518798828125, 17.36962890625, 18.220458984375, 19.0712890625, 19.922119140625, 20.77294921875, 21.623779296875, 22.474609375, 23.325439453125, 24.17626953125, 25.027099609375, 25.8779296875, 26.728759765625, 27.57958984375, 28.430419921875, 29.28125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 6.0, 19.0, 11.0, 23.0, 29.0, 76.0, 88.0, 193.0, 386.0, 1062.0, 3287.0, 19247.0, 349832.0, 633895.0, 33478.0, 4621.0, 1287.0, 478.0, 235.0, 121.0, 56.0, 34.0, 26.0, 21.0, 9.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.866943359375, -11.44482421875, -11.022705078125, -10.6005859375, -10.178466796875, -9.75634765625, -9.334228515625, -8.912109375, -8.489990234375, -8.06787109375, -7.645751953125, -7.2236328125, -6.801513671875, -6.37939453125, -5.957275390625, -5.53515625, -5.113037109375, -4.69091796875, -4.268798828125, -3.8466796875, -3.424560546875, -3.00244140625, -2.580322265625, -2.158203125, -1.736083984375, -1.31396484375, -0.891845703125, -0.4697265625, -0.047607421875, 0.37451171875, 0.796630859375, 1.21875, 1.640869140625, 2.06298828125, 2.485107421875, 2.9072265625, 3.329345703125, 3.75146484375, 4.173583984375, 4.595703125, 5.017822265625, 5.43994140625, 5.862060546875, 6.2841796875, 6.706298828125, 7.12841796875, 7.550537109375, 7.97265625, 8.394775390625, 8.81689453125, 9.239013671875, 9.6611328125, 10.083251953125, 10.50537109375, 10.927490234375, 11.349609375, 11.771728515625, 12.19384765625, 12.615966796875, 13.0380859375, 13.460205078125, 13.88232421875, 14.304443359375, 14.7265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 2.0, 10.0, 11.0, 16.0, 21.0, 48.0, 51.0, 84.0, 119.0, 140.0, 125.0, 110.0, 75.0, 60.0, 37.0, 32.0, 19.0, 9.0, 7.0, 2.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010900497436523438, -0.0010421723127365112, -0.0009942948818206787, -0.0009464174509048462, -0.0008985400199890137, -0.0008506625890731812, -0.0008027851581573486, -0.0007549077272415161, -0.0007070302963256836, -0.0006591528654098511, -0.0006112754344940186, -0.000563398003578186, -0.0005155205726623535, -0.000467643141746521, -0.0004197657108306885, -0.00037188827991485596, -0.00032401084899902344, -0.0002761334180831909, -0.0002282559871673584, -0.00018037855625152588, -0.00013250112533569336, -8.462369441986084e-05, -3.674626350402832e-05, 1.11311674118042e-05, 5.900859832763672e-05, 0.00010688602924346924, 0.00015476346015930176, 0.00020264089107513428, 0.0002505183219909668, 0.0002983957529067993, 0.00034627318382263184, 0.00039415061473846436, 0.0004420280456542969, 0.0004899054765701294, 0.0005377829074859619, 0.0005856603384017944, 0.000633537769317627, 0.0006814152002334595, 0.000729292631149292, 0.0007771700620651245, 0.000825047492980957, 0.0008729249238967896, 0.0009208023548126221, 0.0009686797857284546, 0.0010165572166442871, 0.0010644346475601196, 0.0011123120784759521, 0.0011601895093917847, 0.0012080669403076172, 0.0012559443712234497, 0.0013038218021392822, 0.0013516992330551147, 0.0013995766639709473, 0.0014474540948867798, 0.0014953315258026123, 0.0015432089567184448, 0.0015910863876342773, 0.0016389638185501099, 0.0016868412494659424, 0.001734718680381775, 0.0017825961112976074, 0.00183047354221344, 0.0018783509731292725, 0.001926228404045105, 0.0019741058349609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 10.0, 16.0, 37.0, 35.0, 62.0, 117.0, 234.0, 456.0, 971.0, 2649.0, 8756.0, 42813.0, 291677.0, 575172.0, 100742.0, 17616.0, 4367.0, 1514.0, 626.0, 284.0, 139.0, 94.0, 58.0, 41.0, 23.0, 20.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9705810546875, -8.683349609375, -8.3961181640625, -8.10888671875, -7.8216552734375, -7.534423828125, -7.2471923828125, -6.9599609375, -6.6727294921875, -6.385498046875, -6.0982666015625, -5.81103515625, -5.5238037109375, -5.236572265625, -4.9493408203125, -4.662109375, -4.3748779296875, -4.087646484375, -3.8004150390625, -3.51318359375, -3.2259521484375, -2.938720703125, -2.6514892578125, -2.3642578125, -2.0770263671875, -1.789794921875, -1.5025634765625, -1.21533203125, -0.9281005859375, -0.640869140625, -0.3536376953125, -0.06640625, 0.2208251953125, 0.508056640625, 0.7952880859375, 1.08251953125, 1.3697509765625, 1.656982421875, 1.9442138671875, 2.2314453125, 2.5186767578125, 2.805908203125, 3.0931396484375, 3.38037109375, 3.6676025390625, 3.954833984375, 4.2420654296875, 4.529296875, 4.8165283203125, 5.103759765625, 5.3909912109375, 5.67822265625, 5.9654541015625, 6.252685546875, 6.5399169921875, 6.8271484375, 7.1143798828125, 7.401611328125, 7.6888427734375, 7.97607421875, 8.2633056640625, 8.550537109375, 8.8377685546875, 9.125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 7.0, 4.0, 9.0, 11.0, 18.0, 16.0, 24.0, 35.0, 45.0, 60.0, 96.0, 101.0, 109.0, 127.0, 84.0, 75.0, 49.0, 39.0, 27.0, 23.0, 16.0, 13.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.579833984375, -12.18310546875, -11.786376953125, -11.3896484375, -10.992919921875, -10.59619140625, -10.199462890625, -9.802734375, -9.406005859375, -9.00927734375, -8.612548828125, -8.2158203125, -7.819091796875, -7.42236328125, -7.025634765625, -6.62890625, -6.232177734375, -5.83544921875, -5.438720703125, -5.0419921875, -4.645263671875, -4.24853515625, -3.851806640625, -3.455078125, -3.058349609375, -2.66162109375, -2.264892578125, -1.8681640625, -1.471435546875, -1.07470703125, -0.677978515625, -0.28125, 0.115478515625, 0.51220703125, 0.908935546875, 1.3056640625, 1.702392578125, 2.09912109375, 2.495849609375, 2.892578125, 3.289306640625, 3.68603515625, 4.082763671875, 4.4794921875, 4.876220703125, 5.27294921875, 5.669677734375, 6.06640625, 6.463134765625, 6.85986328125, 7.256591796875, 7.6533203125, 8.050048828125, 8.44677734375, 8.843505859375, 9.240234375, 9.636962890625, 10.03369140625, 10.430419921875, 10.8271484375, 11.223876953125, 11.62060546875, 12.017333984375, 12.4140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 13.0, 62.0, 168.0, 283.0, 267.0, 136.0, 52.0, 15.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-411.8455810546875, -403.589111328125, -395.3326416015625, -387.076171875, -378.8197021484375, -370.563232421875, -362.3067626953125, -354.05029296875, -345.7938232421875, -337.537353515625, -329.2808837890625, -321.0244140625, -312.7679443359375, -304.511474609375, -296.2550048828125, -287.99853515625, -279.7420349121094, -271.4855651855469, -263.2290954589844, -254.97262573242188, -246.71615600585938, -238.45968627929688, -230.2032012939453, -221.9467315673828, -213.6902618408203, -205.4337921142578, -197.1773223876953, -188.9208526611328, -180.66436767578125, -172.40789794921875, -164.15142822265625, -155.89495849609375, -147.63851928710938, -139.38204956054688, -131.12557983398438, -122.86910247802734, -114.61263275146484, -106.35616302490234, -98.09968566894531, -89.84321594238281, -81.58674621582031, -73.33027648925781, -65.07380676269531, -56.81732940673828, -48.56085968017578, -40.30438995361328, -32.047916412353516, -23.79144287109375, -15.53497314453125, -7.278501510620117, 0.9779701232910156, 9.234441757202148, 17.49091339111328, 25.74738311767578, 34.00385665893555, 42.26033020019531, 50.51679992675781, 58.77326965332031, 67.02973937988281, 75.28621673583984, 83.54268646240234, 91.79915618896484, 100.05563354492188, 108.31210327148438, 116.56857299804688]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 9.0, 9.0, 17.0, 21.0, 14.0, 16.0, 21.0, 25.0, 25.0, 32.0, 33.0, 42.0, 39.0, 47.0, 38.0, 50.0, 48.0, 52.0, 43.0, 38.0, 42.0, 44.0, 43.0, 31.0, 35.0, 28.0, 19.0, 27.0, 19.0, 16.0, 14.0, 8.0, 9.0, 10.0, 3.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-120.56280517578125, -116.78648376464844, -113.01016998291016, -109.23384857177734, -105.45753479003906, -101.68121337890625, -97.90489196777344, -94.12857818603516, -90.35226440429688, -86.57594299316406, -82.79962921142578, -79.02330780029297, -75.24699401855469, -71.47067260742188, -67.69435119628906, -63.91803741455078, -60.14171600341797, -56.36539840698242, -52.589080810546875, -48.81275939941406, -45.03644561767578, -41.26012420654297, -37.48380661010742, -33.707489013671875, -29.931171417236328, -26.15485382080078, -22.378536224365234, -18.602216720581055, -14.825899124145508, -11.049581527709961, -7.273262023925781, -3.4969444274902344, 0.27938079833984375, 4.055698871612549, 7.832016944885254, 11.608335494995117, 15.384653091430664, 19.16097068786621, 22.93729019165039, 26.713607788085938, 30.489925384521484, 34.26624298095703, 38.04256057739258, 41.818878173828125, 45.59519958496094, 49.37151336669922, 53.14783477783203, 56.92415237426758, 60.700469970703125, 64.47679138183594, 68.25310516357422, 72.02942657470703, 75.80574035644531, 79.58206176757812, 83.35838317871094, 87.13469696044922, 90.9110107421875, 94.68733215332031, 98.4636459350586, 102.2399673461914, 106.01628112792969, 109.7926025390625, 113.56892395019531, 117.3452377319336, 121.1215591430664]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 9.0, 8.0, 5.0, 10.0, 18.0, 30.0, 27.0, 54.0, 62.0, 83.0, 138.0, 193.0, 333.0, 579.0, 1010.0, 2132.0, 5747.0, 24085.0, 3901866.0, 233662.0, 15801.0, 4360.0, 1799.0, 878.0, 491.0, 304.0, 181.0, 119.0, 93.0, 66.0, 32.0, 28.0, 19.0, 16.0, 17.0, 4.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.046875, -15.47119140625, -14.8955078125, -14.31982421875, -13.744140625, -13.16845703125, -12.5927734375, -12.01708984375, -11.44140625, -10.86572265625, -10.2900390625, -9.71435546875, -9.138671875, -8.56298828125, -7.9873046875, -7.41162109375, -6.8359375, -6.26025390625, -5.6845703125, -5.10888671875, -4.533203125, -3.95751953125, -3.3818359375, -2.80615234375, -2.23046875, -1.65478515625, -1.0791015625, -0.50341796875, 0.072265625, 0.64794921875, 1.2236328125, 1.79931640625, 2.375, 2.95068359375, 3.5263671875, 4.10205078125, 4.677734375, 5.25341796875, 5.8291015625, 6.40478515625, 6.98046875, 7.55615234375, 8.1318359375, 8.70751953125, 9.283203125, 9.85888671875, 10.4345703125, 11.01025390625, 11.5859375, 12.16162109375, 12.7373046875, 13.31298828125, 13.888671875, 14.46435546875, 15.0400390625, 15.61572265625, 16.19140625, 16.76708984375, 17.3427734375, 17.91845703125, 18.494140625, 19.06982421875, 19.6455078125, 20.22119140625, 20.796875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 8.0, 7.0, 14.0, 19.0, 21.0, 41.0, 37.0, 44.0, 45.0, 44.0, 68.0, 63.0, 84.0, 68.0, 72.0, 77.0, 43.0, 48.0, 51.0, 30.0, 28.0, 16.0, 17.0, 11.0, 8.0, 7.0, 10.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.07952880859375, -4.8660888671875, -4.65264892578125, -4.439208984375, -4.22576904296875, -4.0123291015625, -3.79888916015625, -3.58544921875, -3.37200927734375, -3.1585693359375, -2.94512939453125, -2.731689453125, -2.51824951171875, -2.3048095703125, -2.09136962890625, -1.8779296875, -1.66448974609375, -1.4510498046875, -1.23760986328125, -1.024169921875, -0.81072998046875, -0.5972900390625, -0.38385009765625, -0.17041015625, 0.04302978515625, 0.2564697265625, 0.46990966796875, 0.683349609375, 0.89678955078125, 1.1102294921875, 1.32366943359375, 1.537109375, 1.75054931640625, 1.9639892578125, 2.17742919921875, 2.390869140625, 2.60430908203125, 2.8177490234375, 3.03118896484375, 3.24462890625, 3.45806884765625, 3.6715087890625, 3.88494873046875, 4.098388671875, 4.31182861328125, 4.5252685546875, 4.73870849609375, 4.9521484375, 5.16558837890625, 5.3790283203125, 5.59246826171875, 5.805908203125, 6.01934814453125, 6.2327880859375, 6.44622802734375, 6.65966796875, 6.87310791015625, 7.0865478515625, 7.29998779296875, 7.513427734375, 7.72686767578125, 7.9403076171875, 8.15374755859375, 8.3671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 7.0, 11.0, 20.0, 27.0, 28.0, 55.0, 55.0, 78.0, 134.0, 179.0, 257.0, 367.0, 627.0, 961.0, 1449.0, 2447.0, 4113.0, 8271.0, 19687.0, 87157.0, 3879941.0, 141732.0, 25287.0, 9668.0, 4588.0, 2673.0, 1611.0, 937.0, 680.0, 377.0, 246.0, 163.0, 124.0, 90.0, 59.0, 44.0, 36.0, 22.0, 23.0, 16.0, 7.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.375, -12.9378662109375, -12.500732421875, -12.0635986328125, -11.62646484375, -11.1893310546875, -10.752197265625, -10.3150634765625, -9.8779296875, -9.4407958984375, -9.003662109375, -8.5665283203125, -8.12939453125, -7.6922607421875, -7.255126953125, -6.8179931640625, -6.380859375, -5.9437255859375, -5.506591796875, -5.0694580078125, -4.63232421875, -4.1951904296875, -3.758056640625, -3.3209228515625, -2.8837890625, -2.4466552734375, -2.009521484375, -1.5723876953125, -1.13525390625, -0.6981201171875, -0.260986328125, 0.1761474609375, 0.61328125, 1.0504150390625, 1.487548828125, 1.9246826171875, 2.36181640625, 2.7989501953125, 3.236083984375, 3.6732177734375, 4.1103515625, 4.5474853515625, 4.984619140625, 5.4217529296875, 5.85888671875, 6.2960205078125, 6.733154296875, 7.1702880859375, 7.607421875, 8.0445556640625, 8.481689453125, 8.9188232421875, 9.35595703125, 9.7930908203125, 10.230224609375, 10.6673583984375, 11.1044921875, 11.5416259765625, 11.978759765625, 12.4158935546875, 12.85302734375, 13.2901611328125, 13.727294921875, 14.1644287109375, 14.6015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 6.0, 11.0, 14.0, 31.0, 104.0, 3213.0, 501.0, 81.0, 33.0, 25.0, 12.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.02734375, -6.831298828125, -6.63525390625, -6.439208984375, -6.2431640625, -6.047119140625, -5.85107421875, -5.655029296875, -5.458984375, -5.262939453125, -5.06689453125, -4.870849609375, -4.6748046875, -4.478759765625, -4.28271484375, -4.086669921875, -3.890625, -3.694580078125, -3.49853515625, -3.302490234375, -3.1064453125, -2.910400390625, -2.71435546875, -2.518310546875, -2.322265625, -2.126220703125, -1.93017578125, -1.734130859375, -1.5380859375, -1.342041015625, -1.14599609375, -0.949951171875, -0.75390625, -0.557861328125, -0.36181640625, -0.165771484375, 0.0302734375, 0.226318359375, 0.42236328125, 0.618408203125, 0.814453125, 1.010498046875, 1.20654296875, 1.402587890625, 1.5986328125, 1.794677734375, 1.99072265625, 2.186767578125, 2.3828125, 2.578857421875, 2.77490234375, 2.970947265625, 3.1669921875, 3.363037109375, 3.55908203125, 3.755126953125, 3.951171875, 4.147216796875, 4.34326171875, 4.539306640625, 4.7353515625, 4.931396484375, 5.12744140625, 5.323486328125, 5.51953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 5.0, 12.0, 20.0, 27.0, 51.0, 86.0, 154.0, 181.0, 177.0, 129.0, 68.0, 38.0, 20.0, 15.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.427258491516113, -10.73616886138916, -10.045079231262207, -9.353989601135254, -8.6628999710083, -7.971810340881348, -7.280721187591553, -6.5896315574646, -5.8985419273376465, -5.207452297210693, -4.51636266708374, -3.825273275375366, -3.134183645248413, -2.44309401512146, -1.752004623413086, -1.0609149932861328, -0.3698253631591797, 0.32126420736312866, 1.012353777885437, 1.7034432888031006, 2.3945329189300537, 3.085622549057007, 3.776711940765381, 4.467801570892334, 5.158891201019287, 5.84998083114624, 6.541070461273193, 7.232159614562988, 7.923249244689941, 8.614338874816895, 9.305428504943848, 9.9965181350708, 10.68760871887207, 11.378698348999023, 12.069787979125977, 12.76087760925293, 13.451967239379883, 14.143056869506836, 14.834146499633789, 15.525236129760742, 16.216325759887695, 16.90741539001465, 17.5985050201416, 18.289594650268555, 18.980684280395508, 19.67177391052246, 20.362863540649414, 21.053953170776367, 21.745040893554688, 22.43613052368164, 23.127220153808594, 23.818309783935547, 24.5093994140625, 25.200489044189453, 25.891578674316406, 26.58266830444336, 27.273757934570312, 27.964847564697266, 28.65593719482422, 29.347026824951172, 30.038116455078125, 30.729206085205078, 31.42029571533203, 32.111385345458984, 32.80247497558594]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 10.0, 5.0, 5.0, 14.0, 14.0, 17.0, 15.0, 21.0, 21.0, 22.0, 24.0, 24.0, 26.0, 29.0, 31.0, 39.0, 33.0, 53.0, 31.0, 44.0, 37.0, 33.0, 28.0, 40.0, 49.0, 36.0, 37.0, 27.0, 33.0, 26.0, 19.0, 21.0, 22.0, 17.0, 9.0, 17.0, 14.0, 11.0, 8.0, 5.0, 7.0, 3.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.024789810180664, -7.766061782836914, -7.507333755493164, -7.248605728149414, -6.989877700805664, -6.731149673461914, -6.472421646118164, -6.213693618774414, -5.954965591430664, -5.696237564086914, -5.437509536743164, -5.178781509399414, -4.920053482055664, -4.661325454711914, -4.402597427368164, -4.143869400024414, -3.885141372680664, -3.626413345336914, -3.367685317993164, -3.108957290649414, -2.850229263305664, -2.591501235961914, -2.332773208618164, -2.074045181274414, -1.815317153930664, -1.556589126586914, -1.297861099243164, -1.039133071899414, -0.7804050445556641, -0.5216770172119141, -0.26294898986816406, -0.0042209625244140625, 0.25450801849365234, 0.5132360458374023, 0.7719640731811523, 1.0306921005249023, 1.2894201278686523, 1.5481481552124023, 1.8068761825561523, 2.0656042098999023, 2.3243322372436523, 2.5830602645874023, 2.8417882919311523, 3.1005163192749023, 3.3592443466186523, 3.6179723739624023, 3.8767004013061523, 4.135428428649902, 4.394156455993652, 4.652884483337402, 4.911612510681152, 5.170340538024902, 5.429068565368652, 5.687796592712402, 5.946524620056152, 6.205252647399902, 6.463980674743652, 6.722708702087402, 6.981436729431152, 7.240164756774902, 7.498892784118652, 7.757620811462402, 8.016348838806152, 8.275076866149902, 8.533804893493652]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 9.0, 8.0, 13.0, 27.0, 33.0, 35.0, 71.0, 129.0, 225.0, 426.0, 844.0, 1740.0, 3913.0, 9854.0, 26797.0, 83816.0, 261960.0, 400992.0, 173231.0, 53821.0, 18033.0, 6821.0, 2895.0, 1389.0, 689.0, 341.0, 172.0, 103.0, 58.0, 40.0, 20.0, 15.0, 11.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.541259765625, -9.19189453125, -8.842529296875, -8.4931640625, -8.143798828125, -7.79443359375, -7.445068359375, -7.095703125, -6.746337890625, -6.39697265625, -6.047607421875, -5.6982421875, -5.348876953125, -4.99951171875, -4.650146484375, -4.30078125, -3.951416015625, -3.60205078125, -3.252685546875, -2.9033203125, -2.553955078125, -2.20458984375, -1.855224609375, -1.505859375, -1.156494140625, -0.80712890625, -0.457763671875, -0.1083984375, 0.240966796875, 0.59033203125, 0.939697265625, 1.2890625, 1.638427734375, 1.98779296875, 2.337158203125, 2.6865234375, 3.035888671875, 3.38525390625, 3.734619140625, 4.083984375, 4.433349609375, 4.78271484375, 5.132080078125, 5.4814453125, 5.830810546875, 6.18017578125, 6.529541015625, 6.87890625, 7.228271484375, 7.57763671875, 7.927001953125, 8.2763671875, 8.625732421875, 8.97509765625, 9.324462890625, 9.673828125, 10.023193359375, 10.37255859375, 10.721923828125, 11.0712890625, 11.420654296875, 11.77001953125, 12.119384765625, 12.46875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 10.0, 4.0, 12.0, 6.0, 12.0, 18.0, 23.0, 29.0, 48.0, 35.0, 39.0, 47.0, 50.0, 58.0, 56.0, 54.0, 59.0, 63.0, 67.0, 45.0, 49.0, 50.0, 27.0, 31.0, 23.0, 21.0, 12.0, 11.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.60528564453125, -4.4176025390625, -4.22991943359375, -4.042236328125, -3.85455322265625, -3.6668701171875, -3.47918701171875, -3.29150390625, -3.10382080078125, -2.9161376953125, -2.72845458984375, -2.540771484375, -2.35308837890625, -2.1654052734375, -1.97772216796875, -1.7900390625, -1.60235595703125, -1.4146728515625, -1.22698974609375, -1.039306640625, -0.85162353515625, -0.6639404296875, -0.47625732421875, -0.28857421875, -0.10089111328125, 0.0867919921875, 0.27447509765625, 0.462158203125, 0.64984130859375, 0.8375244140625, 1.02520751953125, 1.212890625, 1.40057373046875, 1.5882568359375, 1.77593994140625, 1.963623046875, 2.15130615234375, 2.3389892578125, 2.52667236328125, 2.71435546875, 2.90203857421875, 3.0897216796875, 3.27740478515625, 3.465087890625, 3.65277099609375, 3.8404541015625, 4.02813720703125, 4.2158203125, 4.40350341796875, 4.5911865234375, 4.77886962890625, 4.966552734375, 5.15423583984375, 5.3419189453125, 5.52960205078125, 5.71728515625, 5.90496826171875, 6.0926513671875, 6.28033447265625, 6.468017578125, 6.65570068359375, 6.8433837890625, 7.03106689453125, 7.21875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 16.0, 17.0, 38.0, 47.0, 75.0, 136.0, 281.0, 574.0, 1391.0, 3976.0, 13138.0, 61301.0, 438157.0, 446490.0, 62896.0, 13399.0, 3892.0, 1467.0, 601.0, 291.0, 148.0, 82.0, 54.0, 17.0, 17.0, 14.0, 17.0, 5.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.248291015625, -19.65283203125, -19.057373046875, -18.4619140625, -17.866455078125, -17.27099609375, -16.675537109375, -16.080078125, -15.484619140625, -14.88916015625, -14.293701171875, -13.6982421875, -13.102783203125, -12.50732421875, -11.911865234375, -11.31640625, -10.720947265625, -10.12548828125, -9.530029296875, -8.9345703125, -8.339111328125, -7.74365234375, -7.148193359375, -6.552734375, -5.957275390625, -5.36181640625, -4.766357421875, -4.1708984375, -3.575439453125, -2.97998046875, -2.384521484375, -1.7890625, -1.193603515625, -0.59814453125, -0.002685546875, 0.5927734375, 1.188232421875, 1.78369140625, 2.379150390625, 2.974609375, 3.570068359375, 4.16552734375, 4.760986328125, 5.3564453125, 5.951904296875, 6.54736328125, 7.142822265625, 7.73828125, 8.333740234375, 8.92919921875, 9.524658203125, 10.1201171875, 10.715576171875, 11.31103515625, 11.906494140625, 12.501953125, 13.097412109375, 13.69287109375, 14.288330078125, 14.8837890625, 15.479248046875, 16.07470703125, 16.670166015625, 17.265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 4.0, 8.0, 9.0, 5.0, 19.0, 15.0, 24.0, 17.0, 33.0, 31.0, 28.0, 41.0, 51.0, 48.0, 53.0, 67.0, 29.0, 55.0, 47.0, 55.0, 41.0, 36.0, 51.0, 33.0, 39.0, 22.0, 24.0, 19.0, 16.0, 18.0, 13.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.46875, -29.512939453125, -28.55712890625, -27.601318359375, -26.6455078125, -25.689697265625, -24.73388671875, -23.778076171875, -22.822265625, -21.866455078125, -20.91064453125, -19.954833984375, -18.9990234375, -18.043212890625, -17.08740234375, -16.131591796875, -15.17578125, -14.219970703125, -13.26416015625, -12.308349609375, -11.3525390625, -10.396728515625, -9.44091796875, -8.485107421875, -7.529296875, -6.573486328125, -5.61767578125, -4.661865234375, -3.7060546875, -2.750244140625, -1.79443359375, -0.838623046875, 0.1171875, 1.072998046875, 2.02880859375, 2.984619140625, 3.9404296875, 4.896240234375, 5.85205078125, 6.807861328125, 7.763671875, 8.719482421875, 9.67529296875, 10.631103515625, 11.5869140625, 12.542724609375, 13.49853515625, 14.454345703125, 15.41015625, 16.365966796875, 17.32177734375, 18.277587890625, 19.2333984375, 20.189208984375, 21.14501953125, 22.100830078125, 23.056640625, 24.012451171875, 24.96826171875, 25.924072265625, 26.8798828125, 27.835693359375, 28.79150390625, 29.747314453125, 30.703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 5.0, 11.0, 10.0, 29.0, 46.0, 59.0, 107.0, 217.0, 446.0, 1106.0, 3069.0, 14161.0, 126259.0, 712414.0, 167122.0, 17671.0, 3617.0, 1132.0, 512.0, 232.0, 134.0, 71.0, 42.0, 24.0, 17.0, 12.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.11328125, -6.86419677734375, -6.6151123046875, -6.36602783203125, -6.116943359375, -5.86785888671875, -5.6187744140625, -5.36968994140625, -5.12060546875, -4.87152099609375, -4.6224365234375, -4.37335205078125, -4.124267578125, -3.87518310546875, -3.6260986328125, -3.37701416015625, -3.1279296875, -2.87884521484375, -2.6297607421875, -2.38067626953125, -2.131591796875, -1.88250732421875, -1.6334228515625, -1.38433837890625, -1.13525390625, -0.88616943359375, -0.6370849609375, -0.38800048828125, -0.138916015625, 0.11016845703125, 0.3592529296875, 0.60833740234375, 0.857421875, 1.10650634765625, 1.3555908203125, 1.60467529296875, 1.853759765625, 2.10284423828125, 2.3519287109375, 2.60101318359375, 2.85009765625, 3.09918212890625, 3.3482666015625, 3.59735107421875, 3.846435546875, 4.09552001953125, 4.3446044921875, 4.59368896484375, 4.8427734375, 5.09185791015625, 5.3409423828125, 5.59002685546875, 5.839111328125, 6.08819580078125, 6.3372802734375, 6.58636474609375, 6.83544921875, 7.08453369140625, 7.3336181640625, 7.58270263671875, 7.831787109375, 8.08087158203125, 8.3299560546875, 8.57904052734375, 8.828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 2.0, 9.0, 9.0, 11.0, 20.0, 20.0, 25.0, 32.0, 24.0, 54.0, 49.0, 74.0, 60.0, 69.0, 74.0, 70.0, 72.0, 59.0, 51.0, 35.0, 35.0, 41.0, 28.0, 16.0, 17.0, 8.0, 10.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007123947143554688, -0.0006897896528244019, -0.000667184591293335, -0.0006445795297622681, -0.0006219744682312012, -0.0005993694067001343, -0.0005767643451690674, -0.0005541592836380005, -0.0005315542221069336, -0.0005089491605758667, -0.0004863440990447998, -0.0004637390375137329, -0.000441133975982666, -0.0004185289144515991, -0.0003959238529205322, -0.00037331879138946533, -0.00035071372985839844, -0.00032810866832733154, -0.00030550360679626465, -0.00028289854526519775, -0.00026029348373413086, -0.00023768842220306396, -0.00021508336067199707, -0.00019247829914093018, -0.00016987323760986328, -0.0001472681760787964, -0.0001246631145477295, -0.0001020580530166626, -7.94529914855957e-05, -5.684792995452881e-05, -3.4242868423461914e-05, -1.163780689239502e-05, 1.0967254638671875e-05, 3.357231616973877e-05, 5.6177377700805664e-05, 7.878243923187256e-05, 0.00010138750076293945, 0.00012399256229400635, 0.00014659762382507324, 0.00016920268535614014, 0.00019180774688720703, 0.00021441280841827393, 0.00023701786994934082, 0.0002596229314804077, 0.0002822279930114746, 0.0003048330545425415, 0.0003274381160736084, 0.0003500431776046753, 0.0003726482391357422, 0.0003952533006668091, 0.000417858362197876, 0.00044046342372894287, 0.00046306848526000977, 0.00048567354679107666, 0.0005082786083221436, 0.0005308836698532104, 0.0005534887313842773, 0.0005760937929153442, 0.0005986988544464111, 0.000621303915977478, 0.0006439089775085449, 0.0006665140390396118, 0.0006891191005706787, 0.0007117241621017456, 0.0007343292236328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 11.0, 19.0, 19.0, 21.0, 45.0, 80.0, 135.0, 246.0, 480.0, 1020.0, 2300.0, 7290.0, 33893.0, 239688.0, 613818.0, 122121.0, 19326.0, 4651.0, 1730.0, 724.0, 399.0, 195.0, 131.0, 55.0, 42.0, 31.0, 13.0, 12.0, 11.0, 7.0, 7.0, 2.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.05859375, -6.83331298828125, -6.6080322265625, -6.38275146484375, -6.157470703125, -5.93218994140625, -5.7069091796875, -5.48162841796875, -5.25634765625, -5.03106689453125, -4.8057861328125, -4.58050537109375, -4.355224609375, -4.12994384765625, -3.9046630859375, -3.67938232421875, -3.4541015625, -3.22882080078125, -3.0035400390625, -2.77825927734375, -2.552978515625, -2.32769775390625, -2.1024169921875, -1.87713623046875, -1.65185546875, -1.42657470703125, -1.2012939453125, -0.97601318359375, -0.750732421875, -0.52545166015625, -0.3001708984375, -0.07489013671875, 0.150390625, 0.37567138671875, 0.6009521484375, 0.82623291015625, 1.051513671875, 1.27679443359375, 1.5020751953125, 1.72735595703125, 1.95263671875, 2.17791748046875, 2.4031982421875, 2.62847900390625, 2.853759765625, 3.07904052734375, 3.3043212890625, 3.52960205078125, 3.7548828125, 3.98016357421875, 4.2054443359375, 4.43072509765625, 4.656005859375, 4.88128662109375, 5.1065673828125, 5.33184814453125, 5.55712890625, 5.78240966796875, 6.0076904296875, 6.23297119140625, 6.458251953125, 6.68353271484375, 6.9088134765625, 7.13409423828125, 7.359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 9.0, 9.0, 12.0, 13.0, 25.0, 37.0, 56.0, 83.0, 95.0, 132.0, 118.0, 122.0, 98.0, 60.0, 40.0, 30.0, 18.0, 13.0, 12.0, 6.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8984375, -10.512939453125, -10.12744140625, -9.741943359375, -9.3564453125, -8.970947265625, -8.58544921875, -8.199951171875, -7.814453125, -7.428955078125, -7.04345703125, -6.657958984375, -6.2724609375, -5.886962890625, -5.50146484375, -5.115966796875, -4.73046875, -4.344970703125, -3.95947265625, -3.573974609375, -3.1884765625, -2.802978515625, -2.41748046875, -2.031982421875, -1.646484375, -1.260986328125, -0.87548828125, -0.489990234375, -0.1044921875, 0.281005859375, 0.66650390625, 1.052001953125, 1.4375, 1.822998046875, 2.20849609375, 2.593994140625, 2.9794921875, 3.364990234375, 3.75048828125, 4.135986328125, 4.521484375, 4.906982421875, 5.29248046875, 5.677978515625, 6.0634765625, 6.448974609375, 6.83447265625, 7.219970703125, 7.60546875, 7.990966796875, 8.37646484375, 8.761962890625, 9.1474609375, 9.532958984375, 9.91845703125, 10.303955078125, 10.689453125, 11.074951171875, 11.46044921875, 11.845947265625, 12.2314453125, 12.616943359375, 13.00244140625, 13.387939453125, 13.7734375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 16.0, 29.0, 105.0, 223.0, 271.0, 190.0, 88.0, 37.0, 21.0, 11.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.9130554199219, -271.9813232421875, -265.049560546875, -258.1178283691406, -251.1860809326172, -244.25433349609375, -237.3225860595703, -230.39083862304688, -223.4591064453125, -216.52735900878906, -209.59561157226562, -202.66387939453125, -195.7321319580078, -188.80038452148438, -181.86863708496094, -174.9368896484375, -168.00515747070312, -161.0734100341797, -154.14166259765625, -147.20993041992188, -140.27818298339844, -133.346435546875, -126.41468811035156, -119.48294830322266, -112.55119323730469, -105.61944580078125, -98.68770599365234, -91.7559585571289, -84.82421875, -77.89247131347656, -70.96072387695312, -64.02898406982422, -57.09724426269531, -50.16550064086914, -43.23375701904297, -36.30200958251953, -29.370267868041992, -22.438522338867188, -15.506778717041016, -8.575035095214844, -1.6432914733886719, 5.288452625274658, 12.220196723937988, 19.151941299438477, 26.08368492126465, 33.01543045043945, 39.947174072265625, 46.8789176940918, 53.81066131591797, 60.74240493774414, 67.67414855957031, 74.60589599609375, 81.53763580322266, 88.4693832397461, 95.401123046875, 102.33287048339844, 109.26461791992188, 116.19636535644531, 123.12810516357422, 130.05984497070312, 136.99159240722656, 143.92333984375, 150.85508728027344, 157.78683471679688, 164.71856689453125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 3.0, 8.0, 3.0, 11.0, 11.0, 12.0, 18.0, 19.0, 18.0, 22.0, 18.0, 25.0, 28.0, 41.0, 44.0, 47.0, 56.0, 47.0, 56.0, 60.0, 62.0, 52.0, 35.0, 51.0, 35.0, 36.0, 30.0, 33.0, 22.0, 14.0, 18.0, 14.0, 12.0, 8.0, 3.0, 7.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-156.32781982421875, -152.07965087890625, -147.83148193359375, -143.5832977294922, -139.3351287841797, -135.0869598388672, -130.8387908935547, -126.59062194824219, -122.34244537353516, -118.09427642822266, -113.84609985351562, -109.59793090820312, -105.34976196289062, -101.1015853881836, -96.8534164428711, -92.60523986816406, -88.35707092285156, -84.10890197753906, -79.86072540283203, -75.61255645751953, -71.3643798828125, -67.1162109375, -62.8680419921875, -58.619869232177734, -54.37169647216797, -50.1235237121582, -45.87535095214844, -41.62718200683594, -37.37900924682617, -33.130836486816406, -28.882665634155273, -24.63449478149414, -20.386337280273438, -16.138164520263672, -11.889993667602539, -7.64182186126709, -3.3936500549316406, 0.854522705078125, 5.102693557739258, 9.35086441040039, 13.599037170410156, 17.847209930419922, 22.095380783081055, 26.343551635742188, 30.591724395751953, 34.83989715576172, 39.08806610107422, 43.336238861083984, 47.58441162109375, 51.832584381103516, 56.08075714111328, 60.32892608642578, 64.57710266113281, 68.82527160644531, 73.07344055175781, 77.32160949707031, 81.56978607177734, 85.81795501708984, 90.06613159179688, 94.31430053710938, 98.56246948242188, 102.8106460571289, 107.0588150024414, 111.30699157714844, 115.55516052246094]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 13.0, 11.0, 11.0, 14.0, 20.0, 30.0, 35.0, 42.0, 61.0, 76.0, 86.0, 121.0, 227.0, 374.0, 1128.0, 4032.0, 33027.0, 4111410.0, 36752.0, 4344.0, 1207.0, 467.0, 237.0, 126.0, 100.0, 67.0, 48.0, 39.0, 33.0, 26.0, 23.0, 25.0, 16.0, 14.0, 8.0, 7.0, 1.0, 8.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.40625, -24.57373046875, -23.7412109375, -22.90869140625, -22.076171875, -21.24365234375, -20.4111328125, -19.57861328125, -18.74609375, -17.91357421875, -17.0810546875, -16.24853515625, -15.416015625, -14.58349609375, -13.7509765625, -12.91845703125, -12.0859375, -11.25341796875, -10.4208984375, -9.58837890625, -8.755859375, -7.92333984375, -7.0908203125, -6.25830078125, -5.42578125, -4.59326171875, -3.7607421875, -2.92822265625, -2.095703125, -1.26318359375, -0.4306640625, 0.40185546875, 1.234375, 2.06689453125, 2.8994140625, 3.73193359375, 4.564453125, 5.39697265625, 6.2294921875, 7.06201171875, 7.89453125, 8.72705078125, 9.5595703125, 10.39208984375, 11.224609375, 12.05712890625, 12.8896484375, 13.72216796875, 14.5546875, 15.38720703125, 16.2197265625, 17.05224609375, 17.884765625, 18.71728515625, 19.5498046875, 20.38232421875, 21.21484375, 22.04736328125, 22.8798828125, 23.71240234375, 24.544921875, 25.37744140625, 26.2099609375, 27.04248046875, 27.875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 8.0, 4.0, 8.0, 8.0, 12.0, 18.0, 21.0, 24.0, 32.0, 32.0, 33.0, 36.0, 37.0, 46.0, 60.0, 49.0, 86.0, 52.0, 55.0, 46.0, 50.0, 47.0, 34.0, 37.0, 32.0, 27.0, 23.0, 17.0, 11.0, 9.0, 11.0, 7.0, 5.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0], "bins": [-7.71484375, -7.52978515625, -7.3447265625, -7.15966796875, -6.974609375, -6.78955078125, -6.6044921875, -6.41943359375, -6.234375, -6.04931640625, -5.8642578125, -5.67919921875, -5.494140625, -5.30908203125, -5.1240234375, -4.93896484375, -4.75390625, -4.56884765625, -4.3837890625, -4.19873046875, -4.013671875, -3.82861328125, -3.6435546875, -3.45849609375, -3.2734375, -3.08837890625, -2.9033203125, -2.71826171875, -2.533203125, -2.34814453125, -2.1630859375, -1.97802734375, -1.79296875, -1.60791015625, -1.4228515625, -1.23779296875, -1.052734375, -0.86767578125, -0.6826171875, -0.49755859375, -0.3125, -0.12744140625, 0.0576171875, 0.24267578125, 0.427734375, 0.61279296875, 0.7978515625, 0.98291015625, 1.16796875, 1.35302734375, 1.5380859375, 1.72314453125, 1.908203125, 2.09326171875, 2.2783203125, 2.46337890625, 2.6484375, 2.83349609375, 3.0185546875, 3.20361328125, 3.388671875, 3.57373046875, 3.7587890625, 3.94384765625, 4.12890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 4.0, 8.0, 7.0, 12.0, 15.0, 39.0, 20.0, 41.0, 46.0, 83.0, 104.0, 128.0, 185.0, 295.0, 438.0, 659.0, 1093.0, 1850.0, 3570.0, 8478.0, 26347.0, 233906.0, 3817566.0, 71594.0, 15224.0, 5690.0, 2724.0, 1509.0, 866.0, 588.0, 368.0, 208.0, 140.0, 129.0, 101.0, 65.0, 41.0, 44.0, 29.0, 21.0, 8.0, 10.0, 7.0, 2.0, 11.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.1171875, -14.67626953125, -14.2353515625, -13.79443359375, -13.353515625, -12.91259765625, -12.4716796875, -12.03076171875, -11.58984375, -11.14892578125, -10.7080078125, -10.26708984375, -9.826171875, -9.38525390625, -8.9443359375, -8.50341796875, -8.0625, -7.62158203125, -7.1806640625, -6.73974609375, -6.298828125, -5.85791015625, -5.4169921875, -4.97607421875, -4.53515625, -4.09423828125, -3.6533203125, -3.21240234375, -2.771484375, -2.33056640625, -1.8896484375, -1.44873046875, -1.0078125, -0.56689453125, -0.1259765625, 0.31494140625, 0.755859375, 1.19677734375, 1.6376953125, 2.07861328125, 2.51953125, 2.96044921875, 3.4013671875, 3.84228515625, 4.283203125, 4.72412109375, 5.1650390625, 5.60595703125, 6.046875, 6.48779296875, 6.9287109375, 7.36962890625, 7.810546875, 8.25146484375, 8.6923828125, 9.13330078125, 9.57421875, 10.01513671875, 10.4560546875, 10.89697265625, 11.337890625, 11.77880859375, 12.2197265625, 12.66064453125, 13.1015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 11.0, 12.0, 15.0, 31.0, 46.0, 201.0, 3202.0, 406.0, 79.0, 34.0, 13.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3828125, -8.16619873046875, -7.9495849609375, -7.73297119140625, -7.516357421875, -7.29974365234375, -7.0831298828125, -6.86651611328125, -6.64990234375, -6.43328857421875, -6.2166748046875, -6.00006103515625, -5.783447265625, -5.56683349609375, -5.3502197265625, -5.13360595703125, -4.9169921875, -4.70037841796875, -4.4837646484375, -4.26715087890625, -4.050537109375, -3.83392333984375, -3.6173095703125, -3.40069580078125, -3.18408203125, -2.96746826171875, -2.7508544921875, -2.53424072265625, -2.317626953125, -2.10101318359375, -1.8843994140625, -1.66778564453125, -1.451171875, -1.23455810546875, -1.0179443359375, -0.80133056640625, -0.584716796875, -0.36810302734375, -0.1514892578125, 0.06512451171875, 0.28173828125, 0.49835205078125, 0.7149658203125, 0.93157958984375, 1.148193359375, 1.36480712890625, 1.5814208984375, 1.79803466796875, 2.0146484375, 2.23126220703125, 2.4478759765625, 2.66448974609375, 2.881103515625, 3.09771728515625, 3.3143310546875, 3.53094482421875, 3.74755859375, 3.96417236328125, 4.1807861328125, 4.39739990234375, 4.614013671875, 4.83062744140625, 5.0472412109375, 5.26385498046875, 5.48046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 12.0, 12.0, 28.0, 35.0, 66.0, 86.0, 108.0, 142.0, 145.0, 140.0, 85.0, 56.0, 32.0, 20.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.008729934692383, -20.412391662597656, -19.816055297851562, -19.219717025756836, -18.62337875366211, -18.027042388916016, -17.43070411682129, -16.834365844726562, -16.23802947998047, -15.641692161560059, -15.045353889465332, -14.449016571044922, -13.852678298950195, -13.256340980529785, -12.660003662109375, -12.063665390014648, -11.467327117919922, -10.870989799499512, -10.274651527404785, -9.678314208984375, -9.081975936889648, -8.485638618469238, -7.889301300048828, -7.29296350479126, -6.696625709533691, -6.100287914276123, -5.503950119018555, -4.9076128005981445, -4.311275005340576, -3.714937210083008, -3.1185996532440186, -2.5222620964050293, -1.9259262084960938, -1.329588532447815, -0.7332508563995361, -0.13691318035125732, 0.4594244956970215, 1.0557622909545898, 1.652099847793579, 2.2484374046325684, 2.8447751998901367, 3.441112995147705, 4.037450790405273, 4.633788108825684, 5.230125904083252, 5.82646369934082, 6.4228010177612305, 7.019138813018799, 7.615476608276367, 8.211813926696777, 8.808152198791504, 9.404489517211914, 10.00082778930664, 10.59716510772705, 11.193502426147461, 11.789840698242188, 12.386178016662598, 12.982515335083008, 13.578853607177734, 14.175190925598145, 14.771528244018555, 15.367866516113281, 15.964203834533691, 16.5605411529541, 17.156879425048828]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 8.0, 11.0, 5.0, 11.0, 9.0, 13.0, 16.0, 25.0, 17.0, 29.0, 25.0, 28.0, 34.0, 27.0, 40.0, 37.0, 42.0, 48.0, 35.0, 52.0, 41.0, 41.0, 35.0, 47.0, 41.0, 37.0, 31.0, 27.0, 30.0, 20.0, 23.0, 21.0, 22.0, 10.0, 11.0, 9.0, 12.0, 11.0, 5.0, 4.0, 2.0, 2.0, 8.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.277486801147461, -8.947338104248047, -8.617189407348633, -8.287041664123535, -7.956892967224121, -7.626744270324707, -7.296595573425293, -6.966446876525879, -6.636298656463623, -6.306149959564209, -5.976001739501953, -5.645853042602539, -5.315704345703125, -4.985556125640869, -4.655407428741455, -4.325259208679199, -3.995110511779785, -3.66496205329895, -3.3348135948181152, -3.004664897918701, -2.674516439437866, -2.3443679809570312, -2.014219284057617, -1.6840708255767822, -1.3539223670959473, -1.0237739086151123, -0.6936253309249878, -0.36347681283950806, -0.03332829475402832, 0.29682016372680664, 0.6269687414169312, 0.9571173191070557, 1.2872648239135742, 1.6174132823944092, 1.9475618600845337, 2.277710437774658, 2.607858896255493, 2.938007354736328, 3.268156051635742, 3.598304510116577, 3.928452968597412, 4.258601665496826, 4.588749885559082, 4.918898582458496, 5.24904727935791, 5.579195499420166, 5.90934419631958, 6.239492416381836, 6.56964111328125, 6.899789810180664, 7.22993803024292, 7.560086727142334, 7.89023494720459, 8.220383644104004, 8.550532341003418, 8.880681037902832, 9.21082878112793, 9.540977478027344, 9.871126174926758, 10.201273918151855, 10.53142261505127, 10.861571311950684, 11.191720008850098, 11.521868705749512, 11.852017402648926]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 13.0, 20.0, 25.0, 41.0, 60.0, 106.0, 137.0, 245.0, 415.0, 685.0, 1252.0, 2601.0, 5721.0, 14299.0, 39410.0, 119624.0, 316177.0, 338669.0, 136059.0, 44668.0, 15835.0, 6445.0, 2844.0, 1364.0, 728.0, 400.0, 254.0, 138.0, 91.0, 58.0, 49.0, 23.0, 14.0, 20.0, 12.0, 13.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.765625, -8.4921875, -8.21875, -7.9453125, -7.671875, -7.3984375, -7.125, -6.8515625, -6.578125, -6.3046875, -6.03125, -5.7578125, -5.484375, -5.2109375, -4.9375, -4.6640625, -4.390625, -4.1171875, -3.84375, -3.5703125, -3.296875, -3.0234375, -2.75, -2.4765625, -2.203125, -1.9296875, -1.65625, -1.3828125, -1.109375, -0.8359375, -0.5625, -0.2890625, -0.015625, 0.2578125, 0.53125, 0.8046875, 1.078125, 1.3515625, 1.625, 1.8984375, 2.171875, 2.4453125, 2.71875, 2.9921875, 3.265625, 3.5390625, 3.8125, 4.0859375, 4.359375, 4.6328125, 4.90625, 5.1796875, 5.453125, 5.7265625, 6.0, 6.2734375, 6.546875, 6.8203125, 7.09375, 7.3671875, 7.640625, 7.9140625, 8.1875, 8.4609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 5.0, 6.0, 16.0, 19.0, 15.0, 20.0, 21.0, 27.0, 28.0, 38.0, 44.0, 30.0, 33.0, 56.0, 48.0, 55.0, 37.0, 44.0, 50.0, 43.0, 42.0, 42.0, 43.0, 42.0, 25.0, 24.0, 28.0, 25.0, 13.0, 16.0, 7.0, 7.0, 8.0, 3.0, 6.0, 4.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0], "bins": [-6.171875, -6.0108642578125, -5.849853515625, -5.6888427734375, -5.52783203125, -5.3668212890625, -5.205810546875, -5.0447998046875, -4.8837890625, -4.7227783203125, -4.561767578125, -4.4007568359375, -4.23974609375, -4.0787353515625, -3.917724609375, -3.7567138671875, -3.595703125, -3.4346923828125, -3.273681640625, -3.1126708984375, -2.95166015625, -2.7906494140625, -2.629638671875, -2.4686279296875, -2.3076171875, -2.1466064453125, -1.985595703125, -1.8245849609375, -1.66357421875, -1.5025634765625, -1.341552734375, -1.1805419921875, -1.01953125, -0.8585205078125, -0.697509765625, -0.5364990234375, -0.37548828125, -0.2144775390625, -0.053466796875, 0.1075439453125, 0.2685546875, 0.4295654296875, 0.590576171875, 0.7515869140625, 0.91259765625, 1.0736083984375, 1.234619140625, 1.3956298828125, 1.556640625, 1.7176513671875, 1.878662109375, 2.0396728515625, 2.20068359375, 2.3616943359375, 2.522705078125, 2.6837158203125, 2.8447265625, 3.0057373046875, 3.166748046875, 3.3277587890625, 3.48876953125, 3.6497802734375, 3.810791015625, 3.9718017578125, 4.1328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 10.0, 19.0, 29.0, 41.0, 70.0, 134.0, 253.0, 632.0, 1698.0, 6447.0, 44812.0, 614629.0, 346959.0, 26100.0, 4481.0, 1256.0, 494.0, 193.0, 128.0, 63.0, 36.0, 16.0, 22.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.484375, -17.796630859375, -17.10888671875, -16.421142578125, -15.7333984375, -15.045654296875, -14.35791015625, -13.670166015625, -12.982421875, -12.294677734375, -11.60693359375, -10.919189453125, -10.2314453125, -9.543701171875, -8.85595703125, -8.168212890625, -7.48046875, -6.792724609375, -6.10498046875, -5.417236328125, -4.7294921875, -4.041748046875, -3.35400390625, -2.666259765625, -1.978515625, -1.290771484375, -0.60302734375, 0.084716796875, 0.7724609375, 1.460205078125, 2.14794921875, 2.835693359375, 3.5234375, 4.211181640625, 4.89892578125, 5.586669921875, 6.2744140625, 6.962158203125, 7.64990234375, 8.337646484375, 9.025390625, 9.713134765625, 10.40087890625, 11.088623046875, 11.7763671875, 12.464111328125, 13.15185546875, 13.839599609375, 14.52734375, 15.215087890625, 15.90283203125, 16.590576171875, 17.2783203125, 17.966064453125, 18.65380859375, 19.341552734375, 20.029296875, 20.717041015625, 21.40478515625, 22.092529296875, 22.7802734375, 23.468017578125, 24.15576171875, 24.843505859375, 25.53125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 13.0, 21.0, 23.0, 29.0, 25.0, 27.0, 39.0, 42.0, 45.0, 57.0, 44.0, 40.0, 65.0, 54.0, 39.0, 39.0, 48.0, 40.0, 42.0, 33.0, 30.0, 31.0, 28.0, 27.0, 16.0, 16.0, 10.0, 7.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.296875, -24.46240234375, -23.6279296875, -22.79345703125, -21.958984375, -21.12451171875, -20.2900390625, -19.45556640625, -18.62109375, -17.78662109375, -16.9521484375, -16.11767578125, -15.283203125, -14.44873046875, -13.6142578125, -12.77978515625, -11.9453125, -11.11083984375, -10.2763671875, -9.44189453125, -8.607421875, -7.77294921875, -6.9384765625, -6.10400390625, -5.26953125, -4.43505859375, -3.6005859375, -2.76611328125, -1.931640625, -1.09716796875, -0.2626953125, 0.57177734375, 1.40625, 2.24072265625, 3.0751953125, 3.90966796875, 4.744140625, 5.57861328125, 6.4130859375, 7.24755859375, 8.08203125, 8.91650390625, 9.7509765625, 10.58544921875, 11.419921875, 12.25439453125, 13.0888671875, 13.92333984375, 14.7578125, 15.59228515625, 16.4267578125, 17.26123046875, 18.095703125, 18.93017578125, 19.7646484375, 20.59912109375, 21.43359375, 22.26806640625, 23.1025390625, 23.93701171875, 24.771484375, 25.60595703125, 26.4404296875, 27.27490234375, 28.109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 2.0, 2.0, 10.0, 8.0, 8.0, 15.0, 12.0, 15.0, 24.0, 51.0, 69.0, 121.0, 263.0, 699.0, 2644.0, 22429.0, 797491.0, 213513.0, 8661.0, 1543.0, 452.0, 203.0, 112.0, 53.0, 35.0, 22.0, 17.0, 17.0, 12.0, 7.0, 10.0, 6.0, 5.0, 3.0, 4.0, 5.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.921875, -14.4931640625, -14.064453125, -13.6357421875, -13.20703125, -12.7783203125, -12.349609375, -11.9208984375, -11.4921875, -11.0634765625, -10.634765625, -10.2060546875, -9.77734375, -9.3486328125, -8.919921875, -8.4912109375, -8.0625, -7.6337890625, -7.205078125, -6.7763671875, -6.34765625, -5.9189453125, -5.490234375, -5.0615234375, -4.6328125, -4.2041015625, -3.775390625, -3.3466796875, -2.91796875, -2.4892578125, -2.060546875, -1.6318359375, -1.203125, -0.7744140625, -0.345703125, 0.0830078125, 0.51171875, 0.9404296875, 1.369140625, 1.7978515625, 2.2265625, 2.6552734375, 3.083984375, 3.5126953125, 3.94140625, 4.3701171875, 4.798828125, 5.2275390625, 5.65625, 6.0849609375, 6.513671875, 6.9423828125, 7.37109375, 7.7998046875, 8.228515625, 8.6572265625, 9.0859375, 9.5146484375, 9.943359375, 10.3720703125, 10.80078125, 11.2294921875, 11.658203125, 12.0869140625, 12.515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 10.0, 17.0, 25.0, 37.0, 54.0, 78.0, 88.0, 128.0, 131.0, 115.0, 100.0, 71.0, 40.0, 28.0, 23.0, 17.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001277923583984375, -0.0012341439723968506, -0.0011903643608093262, -0.0011465847492218018, -0.0011028051376342773, -0.001059025526046753, -0.0010152459144592285, -0.0009714663028717041, -0.0009276866912841797, -0.0008839070796966553, -0.0008401274681091309, -0.0007963478565216064, -0.000752568244934082, -0.0007087886333465576, -0.0006650090217590332, -0.0006212294101715088, -0.0005774497985839844, -0.00053367018699646, -0.0004898905754089355, -0.00044611096382141113, -0.0004023313522338867, -0.0003585517406463623, -0.0003147721290588379, -0.0002709925174713135, -0.00022721290588378906, -0.00018343329429626465, -0.00013965368270874023, -9.587407112121582e-05, -5.2094459533691406e-05, -8.314847946166992e-06, 3.546476364135742e-05, 7.924437522888184e-05, 0.00012302398681640625, 0.00016680359840393066, 0.00021058320999145508, 0.0002543628215789795, 0.0002981424331665039, 0.0003419220447540283, 0.00038570165634155273, 0.00042948126792907715, 0.00047326087951660156, 0.000517040491104126, 0.0005608201026916504, 0.0006045997142791748, 0.0006483793258666992, 0.0006921589374542236, 0.000735938549041748, 0.0007797181606292725, 0.0008234977722167969, 0.0008672773838043213, 0.0009110569953918457, 0.0009548366069793701, 0.0009986162185668945, 0.001042395830154419, 0.0010861754417419434, 0.0011299550533294678, 0.0011737346649169922, 0.0012175142765045166, 0.001261293888092041, 0.0013050734996795654, 0.0013488531112670898, 0.0013926327228546143, 0.0014364123344421387, 0.001480191946029663, 0.0015239715576171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 12.0, 12.0, 31.0, 44.0, 79.0, 175.0, 476.0, 2005.0, 22144.0, 951248.0, 67992.0, 3261.0, 672.0, 222.0, 92.0, 39.0, 30.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.3878173828125, -13.752197265625, -13.1165771484375, -12.48095703125, -11.8453369140625, -11.209716796875, -10.5740966796875, -9.9384765625, -9.3028564453125, -8.667236328125, -8.0316162109375, -7.39599609375, -6.7603759765625, -6.124755859375, -5.4891357421875, -4.853515625, -4.2178955078125, -3.582275390625, -2.9466552734375, -2.31103515625, -1.6754150390625, -1.039794921875, -0.4041748046875, 0.2314453125, 0.8670654296875, 1.502685546875, 2.1383056640625, 2.77392578125, 3.4095458984375, 4.045166015625, 4.6807861328125, 5.31640625, 5.9520263671875, 6.587646484375, 7.2232666015625, 7.85888671875, 8.4945068359375, 9.130126953125, 9.7657470703125, 10.4013671875, 11.0369873046875, 11.672607421875, 12.3082275390625, 12.94384765625, 13.5794677734375, 14.215087890625, 14.8507080078125, 15.486328125, 16.1219482421875, 16.757568359375, 17.3931884765625, 18.02880859375, 18.6644287109375, 19.300048828125, 19.9356689453125, 20.5712890625, 21.2069091796875, 21.842529296875, 22.4781494140625, 23.11376953125, 23.7493896484375, 24.385009765625, 25.0206298828125, 25.65625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 8.0, 8.0, 22.0, 19.0, 42.0, 67.0, 85.0, 133.0, 143.0, 115.0, 113.0, 85.0, 56.0, 32.0, 12.0, 13.0, 10.0, 12.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1015625, -13.7470703125, -13.392578125, -13.0380859375, -12.68359375, -12.3291015625, -11.974609375, -11.6201171875, -11.265625, -10.9111328125, -10.556640625, -10.2021484375, -9.84765625, -9.4931640625, -9.138671875, -8.7841796875, -8.4296875, -8.0751953125, -7.720703125, -7.3662109375, -7.01171875, -6.6572265625, -6.302734375, -5.9482421875, -5.59375, -5.2392578125, -4.884765625, -4.5302734375, -4.17578125, -3.8212890625, -3.466796875, -3.1123046875, -2.7578125, -2.4033203125, -2.048828125, -1.6943359375, -1.33984375, -0.9853515625, -0.630859375, -0.2763671875, 0.078125, 0.4326171875, 0.787109375, 1.1416015625, 1.49609375, 1.8505859375, 2.205078125, 2.5595703125, 2.9140625, 3.2685546875, 3.623046875, 3.9775390625, 4.33203125, 4.6865234375, 5.041015625, 5.3955078125, 5.75, 6.1044921875, 6.458984375, 6.8134765625, 7.16796875, 7.5224609375, 7.876953125, 8.2314453125, 8.5859375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 21.0, 58.0, 304.0, 449.0, 137.0, 25.0, 2.0, 3.0, 2.0, 4.0], "bins": [-755.94287109375, -742.769287109375, -729.595703125, -716.422119140625, -703.24853515625, -690.074951171875, -676.9013671875, -663.7278442382812, -650.5542602539062, -637.3806762695312, -624.2070922851562, -611.0335083007812, -597.8599243164062, -584.6864013671875, -571.5128173828125, -558.3392333984375, -545.1656494140625, -531.9920654296875, -518.8184814453125, -505.6448974609375, -492.4713439941406, -479.2977600097656, -466.1241760253906, -452.9505920410156, -439.7769775390625, -426.6033935546875, -413.4298095703125, -400.2562255859375, -387.0826721191406, -373.9090881347656, -360.7355041503906, -347.5619201660156, -334.38836669921875, -321.21478271484375, -308.04119873046875, -294.86761474609375, -281.6940612792969, -268.5204772949219, -255.34689331054688, -242.17330932617188, -228.99972534179688, -215.82614135742188, -202.65257263183594, -189.47898864746094, -176.305419921875, -163.1318359375, -149.958251953125, -136.78466796875, -123.61109924316406, -110.4375228881836, -97.26394653320312, -84.09036254882812, -70.91678619384766, -57.74320983886719, -44.56962585449219, -31.39604949951172, -18.22247314453125, -5.048894882202148, 8.124683380126953, 21.298263549804688, 34.471839904785156, 47.645416259765625, 60.819000244140625, 73.9925765991211, 87.16615295410156]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 11.0, 4.0, 12.0, 14.0, 16.0, 19.0, 27.0, 25.0, 37.0, 55.0, 49.0, 68.0, 59.0, 74.0, 68.0, 54.0, 64.0, 64.0, 42.0, 53.0, 32.0, 36.0, 31.0, 27.0, 12.0, 16.0, 9.0, 6.0, 8.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-200.82382202148438, -195.7283477783203, -190.6328582763672, -185.53738403320312, -180.44190979003906, -175.346435546875, -170.25094604492188, -165.1554718017578, -160.05999755859375, -154.9645233154297, -149.86903381347656, -144.7735595703125, -139.67808532714844, -134.58261108398438, -129.48712158203125, -124.39164733886719, -119.29615783691406, -114.20067596435547, -109.1052017211914, -104.00971984863281, -98.91424560546875, -93.81876373291016, -88.72328186035156, -83.6278076171875, -78.5323257446289, -73.43684387207031, -68.34136962890625, -63.245887756347656, -58.15040969848633, -53.054931640625, -47.959449768066406, -42.86397171020508, -37.76847839355469, -32.67300033569336, -27.5775203704834, -22.482040405273438, -17.38656234741211, -12.291084289550781, -7.19560432434082, -2.1001243591308594, 2.9953536987304688, 8.090832710266113, 13.186311721801758, 18.28179168701172, 23.377269744873047, 28.472747802734375, 33.56822967529297, 38.6637077331543, 43.759185791015625, 48.85466384887695, 53.95014190673828, 59.045623779296875, 64.14109802246094, 69.23657989501953, 74.33206176757812, 79.42753601074219, 84.52301788330078, 89.61849975585938, 94.71397399902344, 99.80945587158203, 104.90493774414062, 110.00041198730469, 115.09589385986328, 120.19137573242188, 125.28684997558594]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 5.0, 8.0, 16.0, 23.0, 18.0, 54.0, 55.0, 83.0, 136.0, 232.0, 358.0, 583.0, 930.0, 1648.0, 3245.0, 7260.0, 21701.0, 148895.0, 3940536.0, 46002.0, 12078.0, 4839.0, 2396.0, 1278.0, 733.0, 410.0, 269.0, 180.0, 103.0, 72.0, 44.0, 36.0, 20.0, 16.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.9375, -11.6170654296875, -11.296630859375, -10.9761962890625, -10.65576171875, -10.3353271484375, -10.014892578125, -9.6944580078125, -9.3740234375, -9.0535888671875, -8.733154296875, -8.4127197265625, -8.09228515625, -7.7718505859375, -7.451416015625, -7.1309814453125, -6.810546875, -6.4901123046875, -6.169677734375, -5.8492431640625, -5.52880859375, -5.2083740234375, -4.887939453125, -4.5675048828125, -4.2470703125, -3.9266357421875, -3.606201171875, -3.2857666015625, -2.96533203125, -2.6448974609375, -2.324462890625, -2.0040283203125, -1.68359375, -1.3631591796875, -1.042724609375, -0.7222900390625, -0.40185546875, -0.0814208984375, 0.239013671875, 0.5594482421875, 0.8798828125, 1.2003173828125, 1.520751953125, 1.8411865234375, 2.16162109375, 2.4820556640625, 2.802490234375, 3.1229248046875, 3.443359375, 3.7637939453125, 4.084228515625, 4.4046630859375, 4.72509765625, 5.0455322265625, 5.365966796875, 5.6864013671875, 6.0068359375, 6.3272705078125, 6.647705078125, 6.9681396484375, 7.28857421875, 7.6090087890625, 7.929443359375, 8.2498779296875, 8.5703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 13.0, 21.0, 31.0, 36.0, 49.0, 46.0, 47.0, 53.0, 83.0, 72.0, 74.0, 69.0, 74.0, 53.0, 71.0, 55.0, 34.0, 25.0, 30.0, 22.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.1231689453125, -8.871337890625, -8.6195068359375, -8.36767578125, -8.1158447265625, -7.864013671875, -7.6121826171875, -7.3603515625, -7.1085205078125, -6.856689453125, -6.6048583984375, -6.35302734375, -6.1011962890625, -5.849365234375, -5.5975341796875, -5.345703125, -5.0938720703125, -4.842041015625, -4.5902099609375, -4.33837890625, -4.0865478515625, -3.834716796875, -3.5828857421875, -3.3310546875, -3.0792236328125, -2.827392578125, -2.5755615234375, -2.32373046875, -2.0718994140625, -1.820068359375, -1.5682373046875, -1.31640625, -1.0645751953125, -0.812744140625, -0.5609130859375, -0.30908203125, -0.0572509765625, 0.194580078125, 0.4464111328125, 0.6982421875, 0.9500732421875, 1.201904296875, 1.4537353515625, 1.70556640625, 1.9573974609375, 2.209228515625, 2.4610595703125, 2.712890625, 2.9647216796875, 3.216552734375, 3.4683837890625, 3.72021484375, 3.9720458984375, 4.223876953125, 4.4757080078125, 4.7275390625, 4.9793701171875, 5.231201171875, 5.4830322265625, 5.73486328125, 5.9866943359375, 6.238525390625, 6.4903564453125, 6.7421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 12.0, 10.0, 8.0, 22.0, 32.0, 41.0, 53.0, 60.0, 88.0, 98.0, 182.0, 243.0, 369.0, 663.0, 1465.0, 3455.0, 11201.0, 70694.0, 4004215.0, 81947.0, 12170.0, 3727.0, 1512.0, 700.0, 376.0, 240.0, 164.0, 106.0, 73.0, 69.0, 69.0, 45.0, 32.0, 32.0, 22.0, 19.0, 15.0, 4.0, 12.0, 8.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.640625, -16.144287109375, -15.64794921875, -15.151611328125, -14.6552734375, -14.158935546875, -13.66259765625, -13.166259765625, -12.669921875, -12.173583984375, -11.67724609375, -11.180908203125, -10.6845703125, -10.188232421875, -9.69189453125, -9.195556640625, -8.69921875, -8.202880859375, -7.70654296875, -7.210205078125, -6.7138671875, -6.217529296875, -5.72119140625, -5.224853515625, -4.728515625, -4.232177734375, -3.73583984375, -3.239501953125, -2.7431640625, -2.246826171875, -1.75048828125, -1.254150390625, -0.7578125, -0.261474609375, 0.23486328125, 0.731201171875, 1.2275390625, 1.723876953125, 2.22021484375, 2.716552734375, 3.212890625, 3.709228515625, 4.20556640625, 4.701904296875, 5.1982421875, 5.694580078125, 6.19091796875, 6.687255859375, 7.18359375, 7.679931640625, 8.17626953125, 8.672607421875, 9.1689453125, 9.665283203125, 10.16162109375, 10.657958984375, 11.154296875, 11.650634765625, 12.14697265625, 12.643310546875, 13.1396484375, 13.635986328125, 14.13232421875, 14.628662109375, 15.125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 1.0, 1.0, 9.0, 5.0, 2.0, 15.0, 23.0, 48.0, 76.0, 235.0, 3245.0, 231.0, 80.0, 32.0, 19.0, 18.0, 10.0, 3.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.2442626953125, -2.129150390625, -2.0140380859375, -1.89892578125, -1.7838134765625, -1.668701171875, -1.5535888671875, -1.4384765625, -1.3233642578125, -1.208251953125, -1.0931396484375, -0.97802734375, -0.8629150390625, -0.747802734375, -0.6326904296875, -0.517578125, -0.4024658203125, -0.287353515625, -0.1722412109375, -0.05712890625, 0.0579833984375, 0.173095703125, 0.2882080078125, 0.4033203125, 0.5184326171875, 0.633544921875, 0.7486572265625, 0.86376953125, 0.9788818359375, 1.093994140625, 1.2091064453125, 1.32421875, 1.4393310546875, 1.554443359375, 1.6695556640625, 1.78466796875, 1.8997802734375, 2.014892578125, 2.1300048828125, 2.2451171875, 2.3602294921875, 2.475341796875, 2.5904541015625, 2.70556640625, 2.8206787109375, 2.935791015625, 3.0509033203125, 3.166015625, 3.2811279296875, 3.396240234375, 3.5113525390625, 3.62646484375, 3.7415771484375, 3.856689453125, 3.9718017578125, 4.0869140625, 4.2020263671875, 4.317138671875, 4.4322509765625, 4.54736328125, 4.6624755859375, 4.777587890625, 4.8927001953125, 5.0078125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 12.0, 26.0, 41.0, 71.0, 109.0, 159.0, 119.0, 142.0, 102.0, 68.0, 57.0, 34.0, 11.0, 8.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03124713897705, -9.516375541687012, -9.001503944396973, -8.486631393432617, -7.971759796142578, -7.456888198852539, -6.9420166015625, -6.427145004272461, -5.912272930145264, -5.397401332855225, -4.882529258728027, -4.367657661437988, -3.85278582572937, -3.337913990020752, -2.823042392730713, -2.3081705570220947, -1.7932987213134766, -1.2784268856048584, -0.7635551691055298, -0.24868345260620117, 0.266188383102417, 0.7810602188110352, 1.2959318161010742, 1.8108036518096924, 2.3256754875183105, 2.8405473232269287, 3.355419158935547, 3.870290756225586, 4.385162353515625, 4.900034427642822, 5.414906024932861, 5.929778099060059, 6.444648742675781, 6.95952033996582, 7.474392414093018, 7.989264011383057, 8.504136085510254, 9.019007682800293, 9.533879280090332, 10.048750877380371, 10.563623428344727, 11.078495025634766, 11.593366622924805, 12.108238220214844, 12.6231107711792, 13.137982368469238, 13.652853965759277, 14.167725563049316, 14.682597160339355, 15.197468757629395, 15.712340354919434, 16.22721290588379, 16.742084503173828, 17.256956100463867, 17.771827697753906, 18.286699295043945, 18.801570892333984, 19.316442489624023, 19.831314086914062, 20.3461856842041, 20.86105728149414, 21.375930786132812, 21.89080047607422, 22.40567398071289, 22.92054557800293]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 8.0, 6.0, 8.0, 17.0, 14.0, 13.0, 11.0, 15.0, 23.0, 31.0, 30.0, 33.0, 40.0, 41.0, 34.0, 33.0, 36.0, 52.0, 40.0, 39.0, 41.0, 37.0, 40.0, 42.0, 36.0, 46.0, 25.0, 30.0, 23.0, 22.0, 24.0, 18.0, 15.0, 11.0, 10.0, 12.0, 7.0, 10.0, 4.0, 5.0, 2.0, 0.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.5951948165893555, -5.411416530609131, -5.227637767791748, -5.043859481811523, -4.860081195831299, -4.676302909851074, -4.492524147033691, -4.308745861053467, -4.124967575073242, -3.9411890506744385, -3.757410764694214, -3.57363224029541, -3.3898539543151855, -3.206075429916382, -3.022296905517578, -2.8385186195373535, -2.6547398567199707, -2.470961332321167, -2.2871830463409424, -2.1034045219421387, -1.9196261167526245, -1.7358477115631104, -1.5520691871643066, -1.3682907819747925, -1.1845123767852783, -1.0007339715957642, -0.8169555068016052, -0.6331770420074463, -0.44939863681793213, -0.26562023162841797, -0.08184170722961426, 0.1019366979598999, 0.28571510314941406, 0.4694935381412506, 0.6532719731330872, 0.8370504379272461, 1.0208288431167603, 1.2046072483062744, 1.3883857727050781, 1.5721641778945923, 1.7559425830841064, 1.9397209882736206, 2.1234993934631348, 2.3072779178619385, 2.491056442260742, 2.674834728240967, 2.8586132526397705, 3.042391777038574, 3.226170063018799, 3.4099485874176025, 3.593726873397827, 3.777505397796631, 3.9612836837768555, 4.145062446594238, 4.328840732574463, 4.5126190185546875, 4.69639778137207, 4.880176067352295, 5.063954830169678, 5.247733116149902, 5.431511402130127, 5.615289688110352, 5.799068450927734, 5.982846736907959, 6.166625022888184]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 12.0, 13.0, 15.0, 28.0, 37.0, 60.0, 109.0, 199.0, 278.0, 524.0, 1055.0, 2143.0, 4987.0, 12508.0, 35257.0, 108838.0, 306704.0, 361673.0, 141077.0, 45877.0, 15878.0, 6048.0, 2572.0, 1225.0, 586.0, 322.0, 211.0, 123.0, 61.0, 54.0, 21.0, 22.0, 10.0, 13.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91015625, -6.64556884765625, -6.3809814453125, -6.11639404296875, -5.851806640625, -5.58721923828125, -5.3226318359375, -5.05804443359375, -4.79345703125, -4.52886962890625, -4.2642822265625, -3.99969482421875, -3.735107421875, -3.47052001953125, -3.2059326171875, -2.94134521484375, -2.6767578125, -2.41217041015625, -2.1475830078125, -1.88299560546875, -1.618408203125, -1.35382080078125, -1.0892333984375, -0.82464599609375, -0.56005859375, -0.29547119140625, -0.0308837890625, 0.23370361328125, 0.498291015625, 0.76287841796875, 1.0274658203125, 1.29205322265625, 1.556640625, 1.82122802734375, 2.0858154296875, 2.35040283203125, 2.614990234375, 2.87957763671875, 3.1441650390625, 3.40875244140625, 3.67333984375, 3.93792724609375, 4.2025146484375, 4.46710205078125, 4.731689453125, 4.99627685546875, 5.2608642578125, 5.52545166015625, 5.7900390625, 6.05462646484375, 6.3192138671875, 6.58380126953125, 6.848388671875, 7.11297607421875, 7.3775634765625, 7.64215087890625, 7.90673828125, 8.17132568359375, 8.4359130859375, 8.70050048828125, 8.965087890625, 9.22967529296875, 9.4942626953125, 9.75885009765625, 10.0234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 9.0, 16.0, 15.0, 32.0, 23.0, 43.0, 41.0, 54.0, 62.0, 65.0, 74.0, 66.0, 80.0, 72.0, 66.0, 61.0, 48.0, 50.0, 33.0, 20.0, 22.0, 16.0, 4.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.8695068359375, -9.614013671875, -9.3585205078125, -9.10302734375, -8.8475341796875, -8.592041015625, -8.3365478515625, -8.0810546875, -7.8255615234375, -7.570068359375, -7.3145751953125, -7.05908203125, -6.8035888671875, -6.548095703125, -6.2926025390625, -6.037109375, -5.7816162109375, -5.526123046875, -5.2706298828125, -5.01513671875, -4.7596435546875, -4.504150390625, -4.2486572265625, -3.9931640625, -3.7376708984375, -3.482177734375, -3.2266845703125, -2.97119140625, -2.7156982421875, -2.460205078125, -2.2047119140625, -1.94921875, -1.6937255859375, -1.438232421875, -1.1827392578125, -0.92724609375, -0.6717529296875, -0.416259765625, -0.1607666015625, 0.0947265625, 0.3502197265625, 0.605712890625, 0.8612060546875, 1.11669921875, 1.3721923828125, 1.627685546875, 1.8831787109375, 2.138671875, 2.3941650390625, 2.649658203125, 2.9051513671875, 3.16064453125, 3.4161376953125, 3.671630859375, 3.9271240234375, 4.1826171875, 4.4381103515625, 4.693603515625, 4.9490966796875, 5.20458984375, 5.4600830078125, 5.715576171875, 5.9710693359375, 6.2265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 7.0, 12.0, 13.0, 11.0, 23.0, 23.0, 43.0, 76.0, 121.0, 229.0, 472.0, 1609.0, 7665.0, 91835.0, 846145.0, 90022.0, 7531.0, 1569.0, 545.0, 248.0, 134.0, 68.0, 49.0, 25.0, 23.0, 11.0, 15.0, 10.0, 6.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.71875, -20.016357421875, -19.31396484375, -18.611572265625, -17.9091796875, -17.206787109375, -16.50439453125, -15.802001953125, -15.099609375, -14.397216796875, -13.69482421875, -12.992431640625, -12.2900390625, -11.587646484375, -10.88525390625, -10.182861328125, -9.48046875, -8.778076171875, -8.07568359375, -7.373291015625, -6.6708984375, -5.968505859375, -5.26611328125, -4.563720703125, -3.861328125, -3.158935546875, -2.45654296875, -1.754150390625, -1.0517578125, -0.349365234375, 0.35302734375, 1.055419921875, 1.7578125, 2.460205078125, 3.16259765625, 3.864990234375, 4.5673828125, 5.269775390625, 5.97216796875, 6.674560546875, 7.376953125, 8.079345703125, 8.78173828125, 9.484130859375, 10.1865234375, 10.888916015625, 11.59130859375, 12.293701171875, 12.99609375, 13.698486328125, 14.40087890625, 15.103271484375, 15.8056640625, 16.508056640625, 17.21044921875, 17.912841796875, 18.615234375, 19.317626953125, 20.02001953125, 20.722412109375, 21.4248046875, 22.127197265625, 22.82958984375, 23.531982421875, 24.234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 7.0, 8.0, 10.0, 12.0, 16.0, 15.0, 22.0, 22.0, 32.0, 26.0, 38.0, 37.0, 32.0, 42.0, 40.0, 47.0, 38.0, 34.0, 34.0, 41.0, 41.0, 44.0, 28.0, 36.0, 41.0, 26.0, 26.0, 29.0, 22.0, 20.0, 14.0, 19.0, 14.0, 7.0, 10.0, 11.0, 10.0, 6.0, 2.0, 3.0, 4.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-23.265625, -22.579833984375, -21.89404296875, -21.208251953125, -20.5224609375, -19.836669921875, -19.15087890625, -18.465087890625, -17.779296875, -17.093505859375, -16.40771484375, -15.721923828125, -15.0361328125, -14.350341796875, -13.66455078125, -12.978759765625, -12.29296875, -11.607177734375, -10.92138671875, -10.235595703125, -9.5498046875, -8.864013671875, -8.17822265625, -7.492431640625, -6.806640625, -6.120849609375, -5.43505859375, -4.749267578125, -4.0634765625, -3.377685546875, -2.69189453125, -2.006103515625, -1.3203125, -0.634521484375, 0.05126953125, 0.737060546875, 1.4228515625, 2.108642578125, 2.79443359375, 3.480224609375, 4.166015625, 4.851806640625, 5.53759765625, 6.223388671875, 6.9091796875, 7.594970703125, 8.28076171875, 8.966552734375, 9.65234375, 10.338134765625, 11.02392578125, 11.709716796875, 12.3955078125, 13.081298828125, 13.76708984375, 14.452880859375, 15.138671875, 15.824462890625, 16.51025390625, 17.196044921875, 17.8818359375, 18.567626953125, 19.25341796875, 19.939208984375, 20.625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 16.0, 28.0, 54.0, 110.0, 267.0, 817.0, 4167.0, 166633.0, 865119.0, 9480.0, 1240.0, 365.0, 109.0, 54.0, 36.0, 17.0, 15.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.84375, -23.3038330078125, -22.763916015625, -22.2239990234375, -21.68408203125, -21.1441650390625, -20.604248046875, -20.0643310546875, -19.5244140625, -18.9844970703125, -18.444580078125, -17.9046630859375, -17.36474609375, -16.8248291015625, -16.284912109375, -15.7449951171875, -15.205078125, -14.6651611328125, -14.125244140625, -13.5853271484375, -13.04541015625, -12.5054931640625, -11.965576171875, -11.4256591796875, -10.8857421875, -10.3458251953125, -9.805908203125, -9.2659912109375, -8.72607421875, -8.1861572265625, -7.646240234375, -7.1063232421875, -6.56640625, -6.0264892578125, -5.486572265625, -4.9466552734375, -4.40673828125, -3.8668212890625, -3.326904296875, -2.7869873046875, -2.2470703125, -1.7071533203125, -1.167236328125, -0.6273193359375, -0.08740234375, 0.4525146484375, 0.992431640625, 1.5323486328125, 2.072265625, 2.6121826171875, 3.152099609375, 3.6920166015625, 4.23193359375, 4.7718505859375, 5.311767578125, 5.8516845703125, 6.3916015625, 6.9315185546875, 7.471435546875, 8.0113525390625, 8.55126953125, 9.0911865234375, 9.631103515625, 10.1710205078125, 10.7109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 16.0, 23.0, 48.0, 100.0, 151.0, 284.0, 163.0, 106.0, 49.0, 25.0, 17.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017795562744140625, -0.0017101466655731201, -0.0016407370567321777, -0.0015713274478912354, -0.001501917839050293, -0.0014325082302093506, -0.0013630986213684082, -0.0012936890125274658, -0.0012242794036865234, -0.001154869794845581, -0.0010854601860046387, -0.0010160505771636963, -0.0009466409683227539, -0.0008772313594818115, -0.0008078217506408691, -0.0007384121417999268, -0.0006690025329589844, -0.000599592924118042, -0.0005301833152770996, -0.0004607737064361572, -0.00039136409759521484, -0.00032195448875427246, -0.0002525448799133301, -0.0001831352710723877, -0.00011372566223144531, -4.431605339050293e-05, 2.5093555450439453e-05, 9.450316429138184e-05, 0.00016391277313232422, 0.0002333223819732666, 0.000302731990814209, 0.00037214159965515137, 0.00044155120849609375, 0.0005109608173370361, 0.0005803704261779785, 0.0006497800350189209, 0.0007191896438598633, 0.0007885992527008057, 0.000858008861541748, 0.0009274184703826904, 0.0009968280792236328, 0.0010662376880645752, 0.0011356472969055176, 0.00120505690574646, 0.0012744665145874023, 0.0013438761234283447, 0.0014132857322692871, 0.0014826953411102295, 0.0015521049499511719, 0.0016215145587921143, 0.0016909241676330566, 0.001760333776473999, 0.0018297433853149414, 0.0018991529941558838, 0.001968562602996826, 0.0020379722118377686, 0.002107381820678711, 0.0021767914295196533, 0.0022462010383605957, 0.002315610647201538, 0.0023850202560424805, 0.002454429864883423, 0.0025238394737243652, 0.0025932490825653076, 0.00266265869140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 8.0, 4.0, 6.0, 10.0, 14.0, 20.0, 22.0, 39.0, 64.0, 71.0, 102.0, 183.0, 289.0, 640.0, 1312.0, 3539.0, 12615.0, 78548.0, 701639.0, 214865.0, 24930.0, 5737.0, 1995.0, 869.0, 439.0, 210.0, 126.0, 69.0, 50.0, 34.0, 19.0, 20.0, 12.0, 11.0, 8.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.55859375, -6.33782958984375, -6.1170654296875, -5.89630126953125, -5.675537109375, -5.45477294921875, -5.2340087890625, -5.01324462890625, -4.79248046875, -4.57171630859375, -4.3509521484375, -4.13018798828125, -3.909423828125, -3.68865966796875, -3.4678955078125, -3.24713134765625, -3.0263671875, -2.80560302734375, -2.5848388671875, -2.36407470703125, -2.143310546875, -1.92254638671875, -1.7017822265625, -1.48101806640625, -1.26025390625, -1.03948974609375, -0.8187255859375, -0.59796142578125, -0.377197265625, -0.15643310546875, 0.0643310546875, 0.28509521484375, 0.505859375, 0.72662353515625, 0.9473876953125, 1.16815185546875, 1.388916015625, 1.60968017578125, 1.8304443359375, 2.05120849609375, 2.27197265625, 2.49273681640625, 2.7135009765625, 2.93426513671875, 3.155029296875, 3.37579345703125, 3.5965576171875, 3.81732177734375, 4.0380859375, 4.25885009765625, 4.4796142578125, 4.70037841796875, 4.921142578125, 5.14190673828125, 5.3626708984375, 5.58343505859375, 5.80419921875, 6.02496337890625, 6.2457275390625, 6.46649169921875, 6.687255859375, 6.90802001953125, 7.1287841796875, 7.34954833984375, 7.5703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 21.0, 14.0, 22.0, 25.0, 52.0, 67.0, 70.0, 92.0, 122.0, 112.0, 106.0, 58.0, 56.0, 50.0, 35.0, 23.0, 10.0, 11.0, 6.0, 12.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.93896484375, -7.6748046875, -7.41064453125, -7.146484375, -6.88232421875, -6.6181640625, -6.35400390625, -6.08984375, -5.82568359375, -5.5615234375, -5.29736328125, -5.033203125, -4.76904296875, -4.5048828125, -4.24072265625, -3.9765625, -3.71240234375, -3.4482421875, -3.18408203125, -2.919921875, -2.65576171875, -2.3916015625, -2.12744140625, -1.86328125, -1.59912109375, -1.3349609375, -1.07080078125, -0.806640625, -0.54248046875, -0.2783203125, -0.01416015625, 0.25, 0.51416015625, 0.7783203125, 1.04248046875, 1.306640625, 1.57080078125, 1.8349609375, 2.09912109375, 2.36328125, 2.62744140625, 2.8916015625, 3.15576171875, 3.419921875, 3.68408203125, 3.9482421875, 4.21240234375, 4.4765625, 4.74072265625, 5.0048828125, 5.26904296875, 5.533203125, 5.79736328125, 6.0615234375, 6.32568359375, 6.58984375, 6.85400390625, 7.1181640625, 7.38232421875, 7.646484375, 7.91064453125, 8.1748046875, 8.43896484375, 8.703125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 27.0, 112.0, 439.0, 324.0, 82.0, 18.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-580.33740234375, -568.9228515625, -557.5083618164062, -546.0938110351562, -534.6792602539062, -523.2647094726562, -511.8502197265625, -500.4356689453125, -489.0211181640625, -477.6065979003906, -466.1920471191406, -454.77752685546875, -443.36297607421875, -431.9484558105469, -420.533935546875, -409.119384765625, -397.7048645019531, -386.29034423828125, -374.87579345703125, -363.4612731933594, -352.0467224121094, -340.6322021484375, -329.2176513671875, -317.8031311035156, -306.38861083984375, -294.9740905761719, -283.5595397949219, -272.14501953125, -260.73046875, -249.31594848632812, -237.9014129638672, -226.48687744140625, -215.0723114013672, -203.65777587890625, -192.2432403564453, -180.82870483398438, -169.4141845703125, -157.9996337890625, -146.58511352539062, -135.1705780029297, -123.75604248046875, -112.34150695800781, -100.92697143554688, -89.51244354248047, -78.09790802001953, -66.6833724975586, -55.26884460449219, -43.85430908203125, -32.43977355957031, -21.025239944458008, -9.610706329345703, 1.8038253784179688, 13.218360900878906, 24.632896423339844, 36.04742431640625, 47.46195983886719, 58.876495361328125, 70.29103088378906, 81.70556640625, 93.1200942993164, 104.53462982177734, 115.94916534423828, 127.36369323730469, 138.77822875976562, 150.19276428222656]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 12.0, 19.0, 14.0, 16.0, 24.0, 25.0, 30.0, 27.0, 30.0, 38.0, 44.0, 44.0, 57.0, 62.0, 59.0, 70.0, 47.0, 54.0, 52.0, 45.0, 33.0, 42.0, 34.0, 18.0, 18.0, 18.0, 13.0, 12.0, 11.0, 4.0, 6.0, 1.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-172.0580596923828, -167.5946807861328, -163.1313018798828, -158.66790771484375, -154.20452880859375, -149.74114990234375, -145.27777099609375, -140.81439208984375, -136.35101318359375, -131.88763427734375, -127.42424774169922, -122.96086883544922, -118.49748992919922, -114.03410339355469, -109.57072448730469, -105.10734558105469, -100.64395904541016, -96.18058013916016, -91.71719360351562, -87.25381469726562, -82.79043579101562, -78.32705688476562, -73.8636703491211, -69.4002914428711, -64.93690490722656, -60.4735221862793, -56.0101432800293, -51.54676055908203, -47.08338165283203, -42.619998931884766, -38.1566162109375, -33.6932373046875, -29.2298583984375, -24.766477584838867, -20.303096771240234, -15.839714050292969, -11.376333236694336, -6.912952423095703, -2.4495697021484375, 2.0138111114501953, 6.477191925048828, 10.940572738647461, 15.40395450592041, 19.86733627319336, 24.330717086791992, 28.794097900390625, 33.25748062133789, 37.720863342285156, 42.184242248535156, 46.64762496948242, 51.11100387573242, 55.57438659667969, 60.03776550292969, 64.50114440917969, 68.96453094482422, 73.42790985107422, 77.89129638671875, 82.35467529296875, 86.81806182861328, 91.28144073486328, 95.74481964111328, 100.20820617675781, 104.67158508300781, 109.13496398925781, 113.59834289550781]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 13.0, 26.0, 24.0, 46.0, 70.0, 187.0, 436.0, 1389.0, 7204.0, 124636.0, 4036028.0, 20182.0, 2796.0, 679.0, 275.0, 113.0, 58.0, 41.0, 19.0, 18.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.41943359375, -16.6357421875, -15.85205078125, -15.068359375, -14.28466796875, -13.5009765625, -12.71728515625, -11.93359375, -11.14990234375, -10.3662109375, -9.58251953125, -8.798828125, -8.01513671875, -7.2314453125, -6.44775390625, -5.6640625, -4.88037109375, -4.0966796875, -3.31298828125, -2.529296875, -1.74560546875, -0.9619140625, -0.17822265625, 0.60546875, 1.38916015625, 2.1728515625, 2.95654296875, 3.740234375, 4.52392578125, 5.3076171875, 6.09130859375, 6.875, 7.65869140625, 8.4423828125, 9.22607421875, 10.009765625, 10.79345703125, 11.5771484375, 12.36083984375, 13.14453125, 13.92822265625, 14.7119140625, 15.49560546875, 16.279296875, 17.06298828125, 17.8466796875, 18.63037109375, 19.4140625, 20.19775390625, 20.9814453125, 21.76513671875, 22.548828125, 23.33251953125, 24.1162109375, 24.89990234375, 25.68359375, 26.46728515625, 27.2509765625, 28.03466796875, 28.818359375, 29.60205078125, 30.3857421875, 31.16943359375, 31.953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 9.0, 7.0, 13.0, 22.0, 24.0, 26.0, 41.0, 34.0, 54.0, 43.0, 45.0, 47.0, 61.0, 54.0, 61.0, 70.0, 46.0, 48.0, 49.0, 49.0, 29.0, 33.0, 19.0, 20.0, 24.0, 19.0, 11.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-7.22265625, -7.0313720703125, -6.840087890625, -6.6488037109375, -6.45751953125, -6.2662353515625, -6.074951171875, -5.8836669921875, -5.6923828125, -5.5010986328125, -5.309814453125, -5.1185302734375, -4.92724609375, -4.7359619140625, -4.544677734375, -4.3533935546875, -4.162109375, -3.9708251953125, -3.779541015625, -3.5882568359375, -3.39697265625, -3.2056884765625, -3.014404296875, -2.8231201171875, -2.6318359375, -2.4405517578125, -2.249267578125, -2.0579833984375, -1.86669921875, -1.6754150390625, -1.484130859375, -1.2928466796875, -1.1015625, -0.9102783203125, -0.718994140625, -0.5277099609375, -0.33642578125, -0.1451416015625, 0.046142578125, 0.2374267578125, 0.4287109375, 0.6199951171875, 0.811279296875, 1.0025634765625, 1.19384765625, 1.3851318359375, 1.576416015625, 1.7677001953125, 1.958984375, 2.1502685546875, 2.341552734375, 2.5328369140625, 2.72412109375, 2.9154052734375, 3.106689453125, 3.2979736328125, 3.4892578125, 3.6805419921875, 3.871826171875, 4.0631103515625, 4.25439453125, 4.4456787109375, 4.636962890625, 4.8282470703125, 5.01953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 10.0, 21.0, 32.0, 26.0, 48.0, 70.0, 95.0, 126.0, 185.0, 278.0, 456.0, 1165.0, 3515.0, 14701.0, 228286.0, 3900238.0, 35236.0, 6170.0, 1822.0, 710.0, 334.0, 200.0, 163.0, 87.0, 90.0, 57.0, 37.0, 34.0, 28.0, 18.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.734375, -21.1171875, -20.5, -19.8828125, -19.265625, -18.6484375, -18.03125, -17.4140625, -16.796875, -16.1796875, -15.5625, -14.9453125, -14.328125, -13.7109375, -13.09375, -12.4765625, -11.859375, -11.2421875, -10.625, -10.0078125, -9.390625, -8.7734375, -8.15625, -7.5390625, -6.921875, -6.3046875, -5.6875, -5.0703125, -4.453125, -3.8359375, -3.21875, -2.6015625, -1.984375, -1.3671875, -0.75, -0.1328125, 0.484375, 1.1015625, 1.71875, 2.3359375, 2.953125, 3.5703125, 4.1875, 4.8046875, 5.421875, 6.0390625, 6.65625, 7.2734375, 7.890625, 8.5078125, 9.125, 9.7421875, 10.359375, 10.9765625, 11.59375, 12.2109375, 12.828125, 13.4453125, 14.0625, 14.6796875, 15.296875, 15.9140625, 16.53125, 17.1484375, 17.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 5.0, 10.0, 26.0, 31.0, 45.0, 146.0, 569.0, 2714.0, 280.0, 95.0, 55.0, 21.0, 12.0, 14.0, 12.0, 9.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.359375, -4.14453125, -3.9296875, -3.71484375, -3.5, -3.28515625, -3.0703125, -2.85546875, -2.640625, -2.42578125, -2.2109375, -1.99609375, -1.78125, -1.56640625, -1.3515625, -1.13671875, -0.921875, -0.70703125, -0.4921875, -0.27734375, -0.0625, 0.15234375, 0.3671875, 0.58203125, 0.796875, 1.01171875, 1.2265625, 1.44140625, 1.65625, 1.87109375, 2.0859375, 2.30078125, 2.515625, 2.73046875, 2.9453125, 3.16015625, 3.375, 3.58984375, 3.8046875, 4.01953125, 4.234375, 4.44921875, 4.6640625, 4.87890625, 5.09375, 5.30859375, 5.5234375, 5.73828125, 5.953125, 6.16796875, 6.3828125, 6.59765625, 6.8125, 7.02734375, 7.2421875, 7.45703125, 7.671875, 7.88671875, 8.1015625, 8.31640625, 8.53125, 8.74609375, 8.9609375, 9.17578125, 9.390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 18.0, 43.0, 59.0, 111.0, 180.0, 178.0, 172.0, 105.0, 62.0, 24.0, 18.0, 14.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.73705291748047, -24.437726974487305, -23.13840103149414, -21.839075088500977, -20.539749145507812, -19.24042320251465, -17.941097259521484, -16.64177131652832, -15.342445373535156, -14.043119430541992, -12.743793487548828, -11.444467544555664, -10.1451416015625, -8.845815658569336, -7.546489715576172, -6.247163772583008, -4.947837829589844, -3.6485118865966797, -2.3491859436035156, -1.0498600006103516, 0.2494659423828125, 1.5487918853759766, 2.8481178283691406, 4.147443771362305, 5.446769714355469, 6.746095657348633, 8.045421600341797, 9.344747543334961, 10.644073486328125, 11.943399429321289, 13.242725372314453, 14.542051315307617, 15.841381072998047, 17.14070701599121, 18.440032958984375, 19.73935890197754, 21.038684844970703, 22.338010787963867, 23.63733673095703, 24.936662673950195, 26.23598861694336, 27.535314559936523, 28.834640502929688, 30.13396644592285, 31.433292388916016, 32.73262023925781, 34.031944274902344, 35.331268310546875, 36.63059616088867, 37.92992401123047, 39.229248046875, 40.52857208251953, 41.82789993286133, 43.127227783203125, 44.426551818847656, 45.72587585449219, 47.025203704833984, 48.32453155517578, 49.62385559082031, 50.923179626464844, 52.22250747680664, 53.52183532714844, 54.82115936279297, 56.1204833984375, 57.4198112487793]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 14.0, 11.0, 14.0, 17.0, 16.0, 34.0, 27.0, 29.0, 31.0, 38.0, 49.0, 48.0, 44.0, 49.0, 60.0, 43.0, 50.0, 38.0, 56.0, 37.0, 45.0, 27.0, 40.0, 24.0, 30.0, 29.0, 14.0, 13.0, 14.0, 8.0, 11.0, 8.0, 7.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.011672973632812, -14.417015075683594, -13.822356224060059, -13.227697372436523, -12.633039474487305, -12.038381576538086, -11.44372272491455, -10.849063873291016, -10.254405975341797, -9.659748077392578, -9.065089225769043, -8.470430374145508, -7.875772476196289, -7.281114101409912, -6.686455726623535, -6.091797351837158, -5.497138977050781, -4.902480602264404, -4.307822227478027, -3.7131638526916504, -3.1185054779052734, -2.5238471031188965, -1.9291887283325195, -1.3345303535461426, -0.7398719787597656, -0.14521360397338867, 0.4494447708129883, 1.0441031455993652, 1.6387615203857422, 2.233419895172119, 2.828078269958496, 3.422736644744873, 4.017393112182617, 4.612051486968994, 5.206709861755371, 5.801368236541748, 6.396026611328125, 6.990684986114502, 7.585343360900879, 8.180002212524414, 8.774660110473633, 9.369318008422852, 9.963976860046387, 10.558635711669922, 11.15329360961914, 11.74795150756836, 12.342610359191895, 12.93726921081543, 13.531927108764648, 14.126585006713867, 14.721243858337402, 15.315902709960938, 15.910560607910156, 16.505218505859375, 17.099876403808594, 17.694536209106445, 18.289194107055664, 18.883852005004883, 19.478511810302734, 20.073169708251953, 20.667827606201172, 21.26248550415039, 21.85714340209961, 22.45180320739746, 23.04646110534668]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 4.0, 7.0, 5.0, 14.0, 17.0, 35.0, 29.0, 55.0, 83.0, 122.0, 187.0, 249.0, 399.0, 639.0, 1141.0, 2219.0, 4517.0, 10278.0, 27920.0, 87801.0, 270955.0, 396687.0, 163082.0, 50667.0, 17272.0, 6848.0, 3133.0, 1647.0, 933.0, 586.0, 342.0, 214.0, 148.0, 99.0, 57.0, 37.0, 35.0, 17.0, 14.0, 13.0, 10.0, 10.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9140625, -8.6539306640625, -8.393798828125, -8.1336669921875, -7.87353515625, -7.6134033203125, -7.353271484375, -7.0931396484375, -6.8330078125, -6.5728759765625, -6.312744140625, -6.0526123046875, -5.79248046875, -5.5323486328125, -5.272216796875, -5.0120849609375, -4.751953125, -4.4918212890625, -4.231689453125, -3.9715576171875, -3.71142578125, -3.4512939453125, -3.191162109375, -2.9310302734375, -2.6708984375, -2.4107666015625, -2.150634765625, -1.8905029296875, -1.63037109375, -1.3702392578125, -1.110107421875, -0.8499755859375, -0.58984375, -0.3297119140625, -0.069580078125, 0.1905517578125, 0.45068359375, 0.7108154296875, 0.970947265625, 1.2310791015625, 1.4912109375, 1.7513427734375, 2.011474609375, 2.2716064453125, 2.53173828125, 2.7918701171875, 3.052001953125, 3.3121337890625, 3.572265625, 3.8323974609375, 4.092529296875, 4.3526611328125, 4.61279296875, 4.8729248046875, 5.133056640625, 5.3931884765625, 5.6533203125, 5.9134521484375, 6.173583984375, 6.4337158203125, 6.69384765625, 6.9539794921875, 7.214111328125, 7.4742431640625, 7.734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 0.0, 4.0, 2.0, 5.0, 3.0, 16.0, 4.0, 13.0, 10.0, 23.0, 30.0, 29.0, 41.0, 36.0, 52.0, 48.0, 60.0, 56.0, 69.0, 61.0, 58.0, 63.0, 50.0, 47.0, 40.0, 40.0, 38.0, 14.0, 22.0, 14.0, 7.0, 13.0, 15.0, 5.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5, -7.296142578125, -7.09228515625, -6.888427734375, -6.6845703125, -6.480712890625, -6.27685546875, -6.072998046875, -5.869140625, -5.665283203125, -5.46142578125, -5.257568359375, -5.0537109375, -4.849853515625, -4.64599609375, -4.442138671875, -4.23828125, -4.034423828125, -3.83056640625, -3.626708984375, -3.4228515625, -3.218994140625, -3.01513671875, -2.811279296875, -2.607421875, -2.403564453125, -2.19970703125, -1.995849609375, -1.7919921875, -1.588134765625, -1.38427734375, -1.180419921875, -0.9765625, -0.772705078125, -0.56884765625, -0.364990234375, -0.1611328125, 0.042724609375, 0.24658203125, 0.450439453125, 0.654296875, 0.858154296875, 1.06201171875, 1.265869140625, 1.4697265625, 1.673583984375, 1.87744140625, 2.081298828125, 2.28515625, 2.489013671875, 2.69287109375, 2.896728515625, 3.1005859375, 3.304443359375, 3.50830078125, 3.712158203125, 3.916015625, 4.119873046875, 4.32373046875, 4.527587890625, 4.7314453125, 4.935302734375, 5.13916015625, 5.343017578125, 5.546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 4.0, 9.0, 8.0, 12.0, 15.0, 22.0, 32.0, 50.0, 71.0, 127.0, 191.0, 390.0, 758.0, 2071.0, 8619.0, 100205.0, 835462.0, 89129.0, 7737.0, 1993.0, 746.0, 326.0, 185.0, 126.0, 78.0, 55.0, 36.0, 23.0, 17.0, 9.0, 12.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.015625, -18.37060546875, -17.7255859375, -17.08056640625, -16.435546875, -15.79052734375, -15.1455078125, -14.50048828125, -13.85546875, -13.21044921875, -12.5654296875, -11.92041015625, -11.275390625, -10.63037109375, -9.9853515625, -9.34033203125, -8.6953125, -8.05029296875, -7.4052734375, -6.76025390625, -6.115234375, -5.47021484375, -4.8251953125, -4.18017578125, -3.53515625, -2.89013671875, -2.2451171875, -1.60009765625, -0.955078125, -0.31005859375, 0.3349609375, 0.97998046875, 1.625, 2.27001953125, 2.9150390625, 3.56005859375, 4.205078125, 4.85009765625, 5.4951171875, 6.14013671875, 6.78515625, 7.43017578125, 8.0751953125, 8.72021484375, 9.365234375, 10.01025390625, 10.6552734375, 11.30029296875, 11.9453125, 12.59033203125, 13.2353515625, 13.88037109375, 14.525390625, 15.17041015625, 15.8154296875, 16.46044921875, 17.10546875, 17.75048828125, 18.3955078125, 19.04052734375, 19.685546875, 20.33056640625, 20.9755859375, 21.62060546875, 22.265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 9.0, 19.0, 26.0, 28.0, 25.0, 32.0, 48.0, 50.0, 46.0, 62.0, 48.0, 59.0, 56.0, 61.0, 45.0, 67.0, 54.0, 51.0, 32.0, 35.0, 18.0, 18.0, 25.0, 12.0, 12.0, 10.0, 13.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.921875, -29.079345703125, -28.23681640625, -27.394287109375, -26.5517578125, -25.709228515625, -24.86669921875, -24.024169921875, -23.181640625, -22.339111328125, -21.49658203125, -20.654052734375, -19.8115234375, -18.968994140625, -18.12646484375, -17.283935546875, -16.44140625, -15.598876953125, -14.75634765625, -13.913818359375, -13.0712890625, -12.228759765625, -11.38623046875, -10.543701171875, -9.701171875, -8.858642578125, -8.01611328125, -7.173583984375, -6.3310546875, -5.488525390625, -4.64599609375, -3.803466796875, -2.9609375, -2.118408203125, -1.27587890625, -0.433349609375, 0.4091796875, 1.251708984375, 2.09423828125, 2.936767578125, 3.779296875, 4.621826171875, 5.46435546875, 6.306884765625, 7.1494140625, 7.991943359375, 8.83447265625, 9.677001953125, 10.51953125, 11.362060546875, 12.20458984375, 13.047119140625, 13.8896484375, 14.732177734375, 15.57470703125, 16.417236328125, 17.259765625, 18.102294921875, 18.94482421875, 19.787353515625, 20.6298828125, 21.472412109375, 22.31494140625, 23.157470703125, 24.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 6.0, 13.0, 19.0, 15.0, 46.0, 68.0, 158.0, 375.0, 1175.0, 6710.0, 181758.0, 836023.0, 19009.0, 2147.0, 548.0, 215.0, 94.0, 52.0, 35.0, 15.0, 19.0, 10.0, 3.0, 11.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.3203125, -10.96875, -10.6171875, -10.265625, -9.9140625, -9.5625, -9.2109375, -8.859375, -8.5078125, -8.15625, -7.8046875, -7.453125, -7.1015625, -6.75, -6.3984375, -6.046875, -5.6953125, -5.34375, -4.9921875, -4.640625, -4.2890625, -3.9375, -3.5859375, -3.234375, -2.8828125, -2.53125, -2.1796875, -1.828125, -1.4765625, -1.125, -0.7734375, -0.421875, -0.0703125, 0.28125, 0.6328125, 0.984375, 1.3359375, 1.6875, 2.0390625, 2.390625, 2.7421875, 3.09375, 3.4453125, 3.796875, 4.1484375, 4.5, 4.8515625, 5.203125, 5.5546875, 5.90625, 6.2578125, 6.609375, 6.9609375, 7.3125, 7.6640625, 8.015625, 8.3671875, 8.71875, 9.0703125, 9.421875, 9.7734375, 10.125, 10.4765625, 10.828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 6.0, 6.0, 4.0, 4.0, 12.0, 8.0, 23.0, 16.0, 30.0, 36.0, 44.0, 59.0, 80.0, 100.0, 117.0, 102.0, 70.0, 68.0, 49.0, 33.0, 37.0, 21.0, 18.0, 15.0, 6.0, 3.0, 4.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.001312255859375, -0.0012772083282470703, -0.0012421607971191406, -0.001207113265991211, -0.0011720657348632812, -0.0011370182037353516, -0.0011019706726074219, -0.0010669231414794922, -0.0010318756103515625, -0.0009968280792236328, -0.0009617805480957031, -0.0009267330169677734, -0.0008916854858398438, -0.0008566379547119141, -0.0008215904235839844, -0.0007865428924560547, -0.000751495361328125, -0.0007164478302001953, -0.0006814002990722656, -0.0006463527679443359, -0.0006113052368164062, -0.0005762577056884766, -0.0005412101745605469, -0.0005061626434326172, -0.0004711151123046875, -0.0004360675811767578, -0.0004010200500488281, -0.00036597251892089844, -0.00033092498779296875, -0.00029587745666503906, -0.0002608299255371094, -0.0002257823944091797, -0.00019073486328125, -0.0001556873321533203, -0.00012063980102539062, -8.559226989746094e-05, -5.054473876953125e-05, -1.5497207641601562e-05, 1.9550323486328125e-05, 5.459785461425781e-05, 8.96453857421875e-05, 0.0001246929168701172, 0.00015974044799804688, 0.00019478797912597656, 0.00022983551025390625, 0.00026488304138183594, 0.0002999305725097656, 0.0003349781036376953, 0.000370025634765625, 0.0004050731658935547, 0.0004401206970214844, 0.00047516822814941406, 0.0005102157592773438, 0.0005452632904052734, 0.0005803108215332031, 0.0006153583526611328, 0.0006504058837890625, 0.0006854534149169922, 0.0007205009460449219, 0.0007555484771728516, 0.0007905960083007812, 0.0008256435394287109, 0.0008606910705566406, 0.0008957386016845703, 0.0009307861328125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 9.0, 26.0, 42.0, 117.0, 264.0, 705.0, 4349.0, 344566.0, 691064.0, 6067.0, 837.0, 271.0, 119.0, 46.0, 34.0, 15.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.158447265625, -15.58251953125, -15.006591796875, -14.4306640625, -13.854736328125, -13.27880859375, -12.702880859375, -12.126953125, -11.551025390625, -10.97509765625, -10.399169921875, -9.8232421875, -9.247314453125, -8.67138671875, -8.095458984375, -7.51953125, -6.943603515625, -6.36767578125, -5.791748046875, -5.2158203125, -4.639892578125, -4.06396484375, -3.488037109375, -2.912109375, -2.336181640625, -1.76025390625, -1.184326171875, -0.6083984375, -0.032470703125, 0.54345703125, 1.119384765625, 1.6953125, 2.271240234375, 2.84716796875, 3.423095703125, 3.9990234375, 4.574951171875, 5.15087890625, 5.726806640625, 6.302734375, 6.878662109375, 7.45458984375, 8.030517578125, 8.6064453125, 9.182373046875, 9.75830078125, 10.334228515625, 10.91015625, 11.486083984375, 12.06201171875, 12.637939453125, 13.2138671875, 13.789794921875, 14.36572265625, 14.941650390625, 15.517578125, 16.093505859375, 16.66943359375, 17.245361328125, 17.8212890625, 18.397216796875, 18.97314453125, 19.549072265625, 20.125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 12.0, 10.0, 43.0, 155.0, 335.0, 286.0, 113.0, 37.0, 14.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890625, -19.1767578125, -18.462890625, -17.7490234375, -17.03515625, -16.3212890625, -15.607421875, -14.8935546875, -14.1796875, -13.4658203125, -12.751953125, -12.0380859375, -11.32421875, -10.6103515625, -9.896484375, -9.1826171875, -8.46875, -7.7548828125, -7.041015625, -6.3271484375, -5.61328125, -4.8994140625, -4.185546875, -3.4716796875, -2.7578125, -2.0439453125, -1.330078125, -0.6162109375, 0.09765625, 0.8115234375, 1.525390625, 2.2392578125, 2.953125, 3.6669921875, 4.380859375, 5.0947265625, 5.80859375, 6.5224609375, 7.236328125, 7.9501953125, 8.6640625, 9.3779296875, 10.091796875, 10.8056640625, 11.51953125, 12.2333984375, 12.947265625, 13.6611328125, 14.375, 15.0888671875, 15.802734375, 16.5166015625, 17.23046875, 17.9443359375, 18.658203125, 19.3720703125, 20.0859375, 20.7998046875, 21.513671875, 22.2275390625, 22.94140625, 23.6552734375, 24.369140625, 25.0830078125, 25.796875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 16.0, 19.0, 47.0, 90.0, 152.0, 203.0, 211.0, 115.0, 70.0, 33.0, 15.0, 8.0, 10.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.285888671875, -169.7859344482422, -165.2859649658203, -160.7860107421875, -156.28604125976562, -151.7860870361328, -147.2861328125, -142.78616333007812, -138.2862091064453, -133.7862548828125, -129.28628540039062, -124.78633117675781, -120.28636932373047, -115.78640747070312, -111.28645324707031, -106.78649139404297, -102.28652954101562, -97.78656768798828, -93.28660583496094, -88.78665161132812, -84.28668975830078, -79.78672790527344, -75.28677368164062, -70.78681182861328, -66.28684997558594, -61.786888122558594, -57.286930084228516, -52.78697204589844, -48.287010192871094, -43.78704833984375, -39.28709030151367, -34.787132263183594, -30.28717041015625, -25.78721046447754, -21.287250518798828, -16.787290573120117, -12.287330627441406, -7.787370681762695, -3.2874107360839844, 1.2125492095947266, 5.7125091552734375, 10.212469100952148, 14.71242904663086, 19.21238899230957, 23.71234893798828, 28.212308883666992, 32.7122688293457, 37.21222686767578, 41.712188720703125, 46.21215057373047, 50.71210861206055, 55.212066650390625, 59.71202850341797, 64.21199035644531, 68.71194458007812, 73.21190643310547, 77.71186828613281, 82.21183013916016, 86.7117919921875, 91.21174621582031, 95.71170806884766, 100.211669921875, 104.71162414550781, 109.21158599853516, 113.7115478515625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 0.0, 5.0, 11.0, 8.0, 12.0, 18.0, 25.0, 20.0, 19.0, 23.0, 43.0, 38.0, 34.0, 56.0, 47.0, 68.0, 56.0, 64.0, 47.0, 62.0, 45.0, 54.0, 40.0, 37.0, 21.0, 30.0, 27.0, 17.0, 23.0, 11.0, 6.0, 6.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.69227600097656, -105.95861053466797, -102.22493743896484, -98.49127197265625, -94.75760650634766, -91.02393341064453, -87.29026794433594, -83.55659484863281, -79.82292938232422, -76.08926391601562, -72.3555908203125, -68.6219253540039, -64.88825988769531, -61.15458679199219, -57.420921325683594, -53.687252044677734, -49.95358657836914, -46.21991729736328, -42.48625183105469, -38.75258255004883, -35.01891326904297, -31.285245895385742, -27.551578521728516, -23.817909240722656, -20.08424186706543, -16.350574493408203, -12.616905212402344, -8.883237838745117, -5.149569511413574, -1.4159011840820312, 2.3177661895751953, 6.051435470581055, 9.785102844238281, 13.518771171569824, 17.252439498901367, 20.986106872558594, 24.719776153564453, 28.45344352722168, 32.187110900878906, 35.920780181884766, 39.654449462890625, 43.388118743896484, 47.12178421020508, 50.85545349121094, 54.5891227722168, 58.322792053222656, 62.05645751953125, 65.79013061523438, 69.52378845214844, 73.25745391845703, 76.99112701416016, 80.72479248046875, 84.45845794677734, 88.19213104248047, 91.92579650878906, 95.65946960449219, 99.39313507080078, 103.12680053710938, 106.8604736328125, 110.5941390991211, 114.32780456542969, 118.06147766113281, 121.7951431274414, 125.52880859375, 129.26248168945312]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 4.0, 7.0, 9.0, 19.0, 24.0, 39.0, 61.0, 119.0, 199.0, 368.0, 635.0, 1314.0, 2826.0, 7158.0, 22599.0, 147180.0, 2919787.0, 1007230.0, 61262.0, 14128.0, 5019.0, 2096.0, 1013.0, 544.0, 260.0, 159.0, 89.0, 56.0, 26.0, 20.0, 9.0, 9.0, 7.0, 3.0, 2.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.34100341796875, -9.0726318359375, -8.80426025390625, -8.535888671875, -8.26751708984375, -7.9991455078125, -7.73077392578125, -7.46240234375, -7.19403076171875, -6.9256591796875, -6.65728759765625, -6.388916015625, -6.12054443359375, -5.8521728515625, -5.58380126953125, -5.3154296875, -5.04705810546875, -4.7786865234375, -4.51031494140625, -4.241943359375, -3.97357177734375, -3.7052001953125, -3.43682861328125, -3.16845703125, -2.90008544921875, -2.6317138671875, -2.36334228515625, -2.094970703125, -1.82659912109375, -1.5582275390625, -1.28985595703125, -1.021484375, -0.75311279296875, -0.4847412109375, -0.21636962890625, 0.052001953125, 0.32037353515625, 0.5887451171875, 0.85711669921875, 1.12548828125, 1.39385986328125, 1.6622314453125, 1.93060302734375, 2.198974609375, 2.46734619140625, 2.7357177734375, 3.00408935546875, 3.2724609375, 3.54083251953125, 3.8092041015625, 4.07757568359375, 4.345947265625, 4.61431884765625, 4.8826904296875, 5.15106201171875, 5.41943359375, 5.68780517578125, 5.9561767578125, 6.22454833984375, 6.492919921875, 6.76129150390625, 7.0296630859375, 7.29803466796875, 7.56640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 1.0, 10.0, 6.0, 12.0, 17.0, 16.0, 19.0, 17.0, 21.0, 47.0, 37.0, 34.0, 39.0, 60.0, 58.0, 48.0, 51.0, 48.0, 65.0, 56.0, 39.0, 38.0, 37.0, 37.0, 40.0, 28.0, 23.0, 27.0, 15.0, 17.0, 9.0, 6.0, 7.0, 8.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-5.64453125, -5.483154296875, -5.32177734375, -5.160400390625, -4.9990234375, -4.837646484375, -4.67626953125, -4.514892578125, -4.353515625, -4.192138671875, -4.03076171875, -3.869384765625, -3.7080078125, -3.546630859375, -3.38525390625, -3.223876953125, -3.0625, -2.901123046875, -2.73974609375, -2.578369140625, -2.4169921875, -2.255615234375, -2.09423828125, -1.932861328125, -1.771484375, -1.610107421875, -1.44873046875, -1.287353515625, -1.1259765625, -0.964599609375, -0.80322265625, -0.641845703125, -0.48046875, -0.319091796875, -0.15771484375, 0.003662109375, 0.1650390625, 0.326416015625, 0.48779296875, 0.649169921875, 0.810546875, 0.971923828125, 1.13330078125, 1.294677734375, 1.4560546875, 1.617431640625, 1.77880859375, 1.940185546875, 2.1015625, 2.262939453125, 2.42431640625, 2.585693359375, 2.7470703125, 2.908447265625, 3.06982421875, 3.231201171875, 3.392578125, 3.553955078125, 3.71533203125, 3.876708984375, 4.0380859375, 4.199462890625, 4.36083984375, 4.522216796875, 4.68359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 16.0, 14.0, 18.0, 23.0, 40.0, 62.0, 103.0, 182.0, 327.0, 650.0, 1552.0, 4005.0, 12067.0, 48019.0, 487735.0, 3435559.0, 162891.0, 27475.0, 8111.0, 2952.0, 1268.0, 555.0, 246.0, 128.0, 74.0, 64.0, 28.0, 19.0, 21.0, 15.0, 3.0, 11.0, 5.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.5579833984375, -10.209716796875, -9.8614501953125, -9.51318359375, -9.1649169921875, -8.816650390625, -8.4683837890625, -8.1201171875, -7.7718505859375, -7.423583984375, -7.0753173828125, -6.72705078125, -6.3787841796875, -6.030517578125, -5.6822509765625, -5.333984375, -4.9857177734375, -4.637451171875, -4.2891845703125, -3.94091796875, -3.5926513671875, -3.244384765625, -2.8961181640625, -2.5478515625, -2.1995849609375, -1.851318359375, -1.5030517578125, -1.15478515625, -0.8065185546875, -0.458251953125, -0.1099853515625, 0.23828125, 0.5865478515625, 0.934814453125, 1.2830810546875, 1.63134765625, 1.9796142578125, 2.327880859375, 2.6761474609375, 3.0244140625, 3.3726806640625, 3.720947265625, 4.0692138671875, 4.41748046875, 4.7657470703125, 5.114013671875, 5.4622802734375, 5.810546875, 6.1588134765625, 6.507080078125, 6.8553466796875, 7.20361328125, 7.5518798828125, 7.900146484375, 8.2484130859375, 8.5966796875, 8.9449462890625, 9.293212890625, 9.6414794921875, 9.98974609375, 10.3380126953125, 10.686279296875, 11.0345458984375, 11.3828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 4.0, 15.0, 24.0, 21.0, 46.0, 64.0, 86.0, 142.0, 232.0, 483.0, 842.0, 889.0, 516.0, 256.0, 151.0, 66.0, 47.0, 35.0, 31.0, 22.0, 20.0, 11.0, 9.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.1578369140625, -7.831298828125, -7.5047607421875, -7.17822265625, -6.8516845703125, -6.525146484375, -6.1986083984375, -5.8720703125, -5.5455322265625, -5.218994140625, -4.8924560546875, -4.56591796875, -4.2393798828125, -3.912841796875, -3.5863037109375, -3.259765625, -2.9332275390625, -2.606689453125, -2.2801513671875, -1.95361328125, -1.6270751953125, -1.300537109375, -0.9739990234375, -0.6474609375, -0.3209228515625, 0.005615234375, 0.3321533203125, 0.65869140625, 0.9852294921875, 1.311767578125, 1.6383056640625, 1.96484375, 2.2913818359375, 2.617919921875, 2.9444580078125, 3.27099609375, 3.5975341796875, 3.924072265625, 4.2506103515625, 4.5771484375, 4.9036865234375, 5.230224609375, 5.5567626953125, 5.88330078125, 6.2098388671875, 6.536376953125, 6.8629150390625, 7.189453125, 7.5159912109375, 7.842529296875, 8.1690673828125, 8.49560546875, 8.8221435546875, 9.148681640625, 9.4752197265625, 9.8017578125, 10.1282958984375, 10.454833984375, 10.7813720703125, 11.10791015625, 11.4344482421875, 11.760986328125, 12.0875244140625, 12.4140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 32.0, 125.0, 244.0, 333.0, 188.0, 39.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-301.28814697265625, -295.3007507324219, -289.3133850097656, -283.32598876953125, -277.338623046875, -271.3512268066406, -265.36383056640625, -259.37646484375, -253.38906860351562, -247.4016876220703, -241.414306640625, -235.42691040039062, -229.4395294189453, -223.4521484375, -217.46475219726562, -211.4773712158203, -205.489990234375, -199.5026092529297, -193.51522827148438, -187.52783203125, -181.5404510498047, -175.55307006835938, -169.565673828125, -163.5782928466797, -157.59091186523438, -151.60353088378906, -145.61614990234375, -139.62875366210938, -133.64137268066406, -127.65399169921875, -121.6666030883789, -115.67921447753906, -109.69182586669922, -103.70443725585938, -97.71705627441406, -91.72967529296875, -85.7422866821289, -79.75489807128906, -73.76751708984375, -67.78013610839844, -61.792747497558594, -55.805362701416016, -49.81797790527344, -43.83059310913086, -37.84320831298828, -31.855823516845703, -25.868438720703125, -19.881053924560547, -13.893669128417969, -7.906284332275391, -1.9188995361328125, 4.068485260009766, 10.055870056152344, 16.043254852294922, 22.0306396484375, 28.018024444580078, 34.005409240722656, 39.992794036865234, 45.98017883300781, 51.96756362915039, 57.95494842529297, 63.94233322143555, 69.92971801757812, 75.91709899902344, 81.90448760986328]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 8.0, 9.0, 13.0, 12.0, 11.0, 24.0, 27.0, 21.0, 28.0, 49.0, 28.0, 51.0, 35.0, 43.0, 51.0, 47.0, 32.0, 41.0, 63.0, 58.0, 40.0, 30.0, 33.0, 36.0, 38.0, 34.0, 25.0, 23.0, 19.0, 11.0, 10.0, 4.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.74684524536133, -46.208980560302734, -44.671119689941406, -43.13325500488281, -41.59539031982422, -40.057525634765625, -38.51966094970703, -36.9818000793457, -35.44393539428711, -33.906070709228516, -32.36820983886719, -30.830345153808594, -29.29248046875, -27.754615783691406, -26.216753005981445, -24.678890228271484, -23.14102554321289, -21.603160858154297, -20.065298080444336, -18.527435302734375, -16.98957061767578, -15.451706886291504, -13.913843154907227, -12.37597942352295, -10.838115692138672, -9.300251960754395, -7.762388229370117, -6.22452449798584, -4.6866607666015625, -3.148797035217285, -1.6109333038330078, -0.07306957244873047, 1.4647903442382812, 3.0026540756225586, 4.540517807006836, 6.078381538391113, 7.616245269775391, 9.154109001159668, 10.691972732543945, 12.229836463928223, 13.7677001953125, 15.305563926696777, 16.843427658081055, 18.381290435791016, 19.91915512084961, 21.457019805908203, 22.994882583618164, 24.532745361328125, 26.07061004638672, 27.608474731445312, 29.146337509155273, 30.684200286865234, 32.22206497192383, 33.75992965698242, 35.29779052734375, 36.835655212402344, 38.37351989746094, 39.91138458251953, 41.449249267578125, 42.98711013793945, 44.52497482299805, 46.06283950805664, 47.60070037841797, 49.13856506347656, 50.676429748535156]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 12.0, 6.0, 12.0, 19.0, 38.0, 51.0, 80.0, 106.0, 143.0, 239.0, 321.0, 531.0, 878.0, 1612.0, 2673.0, 4711.0, 8903.0, 17802.0, 35865.0, 73589.0, 151784.0, 272341.0, 237262.0, 121259.0, 58674.0, 28477.0, 14252.0, 7248.0, 3973.0, 2182.0, 1308.0, 762.0, 455.0, 345.0, 209.0, 151.0, 92.0, 52.0, 40.0, 29.0, 25.0, 11.0, 9.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.80078125, -4.65460205078125, -4.5084228515625, -4.36224365234375, -4.216064453125, -4.06988525390625, -3.9237060546875, -3.77752685546875, -3.63134765625, -3.48516845703125, -3.3389892578125, -3.19281005859375, -3.046630859375, -2.90045166015625, -2.7542724609375, -2.60809326171875, -2.4619140625, -2.31573486328125, -2.1695556640625, -2.02337646484375, -1.877197265625, -1.73101806640625, -1.5848388671875, -1.43865966796875, -1.29248046875, -1.14630126953125, -1.0001220703125, -0.85394287109375, -0.707763671875, -0.56158447265625, -0.4154052734375, -0.26922607421875, -0.123046875, 0.02313232421875, 0.1693115234375, 0.31549072265625, 0.461669921875, 0.60784912109375, 0.7540283203125, 0.90020751953125, 1.04638671875, 1.19256591796875, 1.3387451171875, 1.48492431640625, 1.631103515625, 1.77728271484375, 1.9234619140625, 2.06964111328125, 2.2158203125, 2.36199951171875, 2.5081787109375, 2.65435791015625, 2.800537109375, 2.94671630859375, 3.0928955078125, 3.23907470703125, 3.38525390625, 3.53143310546875, 3.6776123046875, 3.82379150390625, 3.969970703125, 4.11614990234375, 4.2623291015625, 4.40850830078125, 4.5546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 9.0, 6.0, 6.0, 15.0, 10.0, 16.0, 19.0, 21.0, 28.0, 24.0, 30.0, 30.0, 36.0, 33.0, 37.0, 52.0, 50.0, 43.0, 47.0, 45.0, 43.0, 51.0, 39.0, 41.0, 39.0, 24.0, 36.0, 23.0, 28.0, 18.0, 22.0, 24.0, 17.0, 9.0, 13.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.62109375, -4.4796142578125, -4.338134765625, -4.1966552734375, -4.05517578125, -3.9136962890625, -3.772216796875, -3.6307373046875, -3.4892578125, -3.3477783203125, -3.206298828125, -3.0648193359375, -2.92333984375, -2.7818603515625, -2.640380859375, -2.4989013671875, -2.357421875, -2.2159423828125, -2.074462890625, -1.9329833984375, -1.79150390625, -1.6500244140625, -1.508544921875, -1.3670654296875, -1.2255859375, -1.0841064453125, -0.942626953125, -0.8011474609375, -0.65966796875, -0.5181884765625, -0.376708984375, -0.2352294921875, -0.09375, 0.0477294921875, 0.189208984375, 0.3306884765625, 0.47216796875, 0.6136474609375, 0.755126953125, 0.8966064453125, 1.0380859375, 1.1795654296875, 1.321044921875, 1.4625244140625, 1.60400390625, 1.7454833984375, 1.886962890625, 2.0284423828125, 2.169921875, 2.3114013671875, 2.452880859375, 2.5943603515625, 2.73583984375, 2.8773193359375, 3.018798828125, 3.1602783203125, 3.3017578125, 3.4432373046875, 3.584716796875, 3.7261962890625, 3.86767578125, 4.0091552734375, 4.150634765625, 4.2921142578125, 4.43359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 6.0, 12.0, 11.0, 18.0, 49.0, 41.0, 91.0, 169.0, 282.0, 492.0, 1114.0, 3025.0, 19929.0, 469168.0, 527873.0, 20706.0, 3192.0, 1092.0, 518.0, 292.0, 162.0, 97.0, 59.0, 30.0, 25.0, 20.0, 19.0, 12.0, 14.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.078125, -21.428955078125, -20.77978515625, -20.130615234375, -19.4814453125, -18.832275390625, -18.18310546875, -17.533935546875, -16.884765625, -16.235595703125, -15.58642578125, -14.937255859375, -14.2880859375, -13.638916015625, -12.98974609375, -12.340576171875, -11.69140625, -11.042236328125, -10.39306640625, -9.743896484375, -9.0947265625, -8.445556640625, -7.79638671875, -7.147216796875, -6.498046875, -5.848876953125, -5.19970703125, -4.550537109375, -3.9013671875, -3.252197265625, -2.60302734375, -1.953857421875, -1.3046875, -0.655517578125, -0.00634765625, 0.642822265625, 1.2919921875, 1.941162109375, 2.59033203125, 3.239501953125, 3.888671875, 4.537841796875, 5.18701171875, 5.836181640625, 6.4853515625, 7.134521484375, 7.78369140625, 8.432861328125, 9.08203125, 9.731201171875, 10.38037109375, 11.029541015625, 11.6787109375, 12.327880859375, 12.97705078125, 13.626220703125, 14.275390625, 14.924560546875, 15.57373046875, 16.222900390625, 16.8720703125, 17.521240234375, 18.17041015625, 18.819580078125, 19.46875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 10.0, 4.0, 8.0, 14.0, 4.0, 14.0, 14.0, 19.0, 13.0, 23.0, 26.0, 36.0, 32.0, 44.0, 42.0, 52.0, 49.0, 50.0, 48.0, 47.0, 44.0, 56.0, 48.0, 51.0, 36.0, 39.0, 31.0, 27.0, 17.0, 18.0, 14.0, 17.0, 12.0, 10.0, 8.0, 4.0, 1.0, 4.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.734375, -21.07275390625, -20.4111328125, -19.74951171875, -19.087890625, -18.42626953125, -17.7646484375, -17.10302734375, -16.44140625, -15.77978515625, -15.1181640625, -14.45654296875, -13.794921875, -13.13330078125, -12.4716796875, -11.81005859375, -11.1484375, -10.48681640625, -9.8251953125, -9.16357421875, -8.501953125, -7.84033203125, -7.1787109375, -6.51708984375, -5.85546875, -5.19384765625, -4.5322265625, -3.87060546875, -3.208984375, -2.54736328125, -1.8857421875, -1.22412109375, -0.5625, 0.09912109375, 0.7607421875, 1.42236328125, 2.083984375, 2.74560546875, 3.4072265625, 4.06884765625, 4.73046875, 5.39208984375, 6.0537109375, 6.71533203125, 7.376953125, 8.03857421875, 8.7001953125, 9.36181640625, 10.0234375, 10.68505859375, 11.3466796875, 12.00830078125, 12.669921875, 13.33154296875, 13.9931640625, 14.65478515625, 15.31640625, 15.97802734375, 16.6396484375, 17.30126953125, 17.962890625, 18.62451171875, 19.2861328125, 19.94775390625, 20.609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 6.0, 12.0, 24.0, 26.0, 44.0, 81.0, 118.0, 255.0, 626.0, 2045.0, 12326.0, 279040.0, 729075.0, 20539.0, 2851.0, 808.0, 304.0, 152.0, 68.0, 47.0, 45.0, 11.0, 15.0, 10.0, 4.0, 5.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.256591796875, -8.92724609375, -8.597900390625, -8.2685546875, -7.939208984375, -7.60986328125, -7.280517578125, -6.951171875, -6.621826171875, -6.29248046875, -5.963134765625, -5.6337890625, -5.304443359375, -4.97509765625, -4.645751953125, -4.31640625, -3.987060546875, -3.65771484375, -3.328369140625, -2.9990234375, -2.669677734375, -2.34033203125, -2.010986328125, -1.681640625, -1.352294921875, -1.02294921875, -0.693603515625, -0.3642578125, -0.034912109375, 0.29443359375, 0.623779296875, 0.953125, 1.282470703125, 1.61181640625, 1.941162109375, 2.2705078125, 2.599853515625, 2.92919921875, 3.258544921875, 3.587890625, 3.917236328125, 4.24658203125, 4.575927734375, 4.9052734375, 5.234619140625, 5.56396484375, 5.893310546875, 6.22265625, 6.552001953125, 6.88134765625, 7.210693359375, 7.5400390625, 7.869384765625, 8.19873046875, 8.528076171875, 8.857421875, 9.186767578125, 9.51611328125, 9.845458984375, 10.1748046875, 10.504150390625, 10.83349609375, 11.162841796875, 11.4921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 7.0, 20.0, 12.0, 13.0, 32.0, 35.0, 46.0, 64.0, 103.0, 170.0, 148.0, 84.0, 64.0, 43.0, 33.0, 19.0, 18.0, 18.0, 13.0, 12.0, 8.0, 10.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016412734985351562, -0.001597866415977478, -0.0015544593334197998, -0.0015110522508621216, -0.0014676451683044434, -0.0014242380857467651, -0.001380831003189087, -0.0013374239206314087, -0.0012940168380737305, -0.0012506097555160522, -0.001207202672958374, -0.0011637955904006958, -0.0011203885078430176, -0.0010769814252853394, -0.0010335743427276611, -0.000990167260169983, -0.0009467601776123047, -0.0009033530950546265, -0.0008599460124969482, -0.00081653892993927, -0.0007731318473815918, -0.0007297247648239136, -0.0006863176822662354, -0.0006429105997085571, -0.0005995035171508789, -0.0005560964345932007, -0.0005126893520355225, -0.00046928226947784424, -0.000425875186920166, -0.0003824681043624878, -0.00033906102180480957, -0.00029565393924713135, -0.0002522468566894531, -0.0002088397741317749, -0.00016543269157409668, -0.00012202560901641846, -7.861852645874023e-05, -3.521144390106201e-05, 8.195638656616211e-06, 5.1602721214294434e-05, 9.500980377197266e-05, 0.00013841688632965088, 0.0001818239688873291, 0.00022523105144500732, 0.00026863813400268555, 0.00031204521656036377, 0.000355452299118042, 0.0003988593816757202, 0.00044226646423339844, 0.00048567354679107666, 0.0005290806293487549, 0.0005724877119064331, 0.0006158947944641113, 0.0006593018770217896, 0.0007027089595794678, 0.000746116042137146, 0.0007895231246948242, 0.0008329302072525024, 0.0008763372898101807, 0.0009197443723678589, 0.0009631514549255371, 0.0010065585374832153, 0.0010499656200408936, 0.0010933727025985718, 0.00113677978515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 16.0, 17.0, 43.0, 43.0, 73.0, 144.0, 225.0, 448.0, 945.0, 2598.0, 10818.0, 85530.0, 829588.0, 100775.0, 12385.0, 2791.0, 1022.0, 471.0, 259.0, 144.0, 76.0, 39.0, 28.0, 23.0, 17.0, 10.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1796875, -8.8790283203125, -8.578369140625, -8.2777099609375, -7.97705078125, -7.6763916015625, -7.375732421875, -7.0750732421875, -6.7744140625, -6.4737548828125, -6.173095703125, -5.8724365234375, -5.57177734375, -5.2711181640625, -4.970458984375, -4.6697998046875, -4.369140625, -4.0684814453125, -3.767822265625, -3.4671630859375, -3.16650390625, -2.8658447265625, -2.565185546875, -2.2645263671875, -1.9638671875, -1.6632080078125, -1.362548828125, -1.0618896484375, -0.76123046875, -0.4605712890625, -0.159912109375, 0.1407470703125, 0.44140625, 0.7420654296875, 1.042724609375, 1.3433837890625, 1.64404296875, 1.9447021484375, 2.245361328125, 2.5460205078125, 2.8466796875, 3.1473388671875, 3.447998046875, 3.7486572265625, 4.04931640625, 4.3499755859375, 4.650634765625, 4.9512939453125, 5.251953125, 5.5526123046875, 5.853271484375, 6.1539306640625, 6.45458984375, 6.7552490234375, 7.055908203125, 7.3565673828125, 7.6572265625, 7.9578857421875, 8.258544921875, 8.5592041015625, 8.85986328125, 9.1605224609375, 9.461181640625, 9.7618408203125, 10.0625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 12.0, 11.0, 19.0, 21.0, 37.0, 61.0, 69.0, 95.0, 124.0, 128.0, 103.0, 91.0, 58.0, 51.0, 32.0, 19.0, 20.0, 13.0, 12.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.75262451171875, -11.4739990234375, -11.19537353515625, -10.916748046875, -10.63812255859375, -10.3594970703125, -10.08087158203125, -9.80224609375, -9.52362060546875, -9.2449951171875, -8.96636962890625, -8.687744140625, -8.40911865234375, -8.1304931640625, -7.85186767578125, -7.5732421875, -7.29461669921875, -7.0159912109375, -6.73736572265625, -6.458740234375, -6.18011474609375, -5.9014892578125, -5.62286376953125, -5.34423828125, -5.06561279296875, -4.7869873046875, -4.50836181640625, -4.229736328125, -3.95111083984375, -3.6724853515625, -3.39385986328125, -3.115234375, -2.83660888671875, -2.5579833984375, -2.27935791015625, -2.000732421875, -1.72210693359375, -1.4434814453125, -1.16485595703125, -0.88623046875, -0.60760498046875, -0.3289794921875, -0.05035400390625, 0.228271484375, 0.50689697265625, 0.7855224609375, 1.06414794921875, 1.3427734375, 1.62139892578125, 1.9000244140625, 2.17864990234375, 2.457275390625, 2.73590087890625, 3.0145263671875, 3.29315185546875, 3.57177734375, 3.85040283203125, 4.1290283203125, 4.40765380859375, 4.686279296875, 4.96490478515625, 5.2435302734375, 5.52215576171875, 5.80078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 7.0, 7.0, 29.0, 69.0, 173.0, 286.0, 230.0, 123.0, 44.0, 17.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-263.8902282714844, -258.71234130859375, -253.5344696044922, -248.35658264160156, -243.17869567871094, -238.00082397460938, -232.82293701171875, -227.64505004882812, -222.4671630859375, -217.28927612304688, -212.1114044189453, -206.9335174560547, -201.75563049316406, -196.5777587890625, -191.39987182617188, -186.22198486328125, -181.0441131591797, -175.86622619628906, -170.6883544921875, -165.51046752929688, -160.33258056640625, -155.15469360351562, -149.97682189941406, -144.79893493652344, -139.62106323242188, -134.44317626953125, -129.2653045654297, -124.08741760253906, -118.90953063964844, -113.73165130615234, -108.55377197265625, -103.37588500976562, -98.19800567626953, -93.02012634277344, -87.84223937988281, -82.66436004638672, -77.48648071289062, -72.30859375, -67.1307144165039, -61.95283126831055, -56.77494812011719, -51.59706497192383, -46.41918182373047, -41.241302490234375, -36.063419342041016, -30.885536193847656, -25.70765495300293, -20.529773712158203, -15.351890563964844, -10.1740083694458, -4.996126174926758, 0.18175601959228516, 5.359638214111328, 10.537521362304688, 15.715402603149414, 20.89328384399414, 26.0711669921875, 31.24905014038086, 36.42693328857422, 41.60481262207031, 46.78269577026367, 51.96057891845703, 57.138458251953125, 62.316341400146484, 67.49422454833984]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 5.0, 4.0, 8.0, 9.0, 11.0, 16.0, 25.0, 19.0, 21.0, 24.0, 32.0, 28.0, 28.0, 42.0, 39.0, 44.0, 42.0, 42.0, 59.0, 44.0, 49.0, 44.0, 39.0, 37.0, 32.0, 35.0, 27.0, 32.0, 32.0, 20.0, 14.0, 19.0, 10.0, 10.0, 8.0, 6.0, 5.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-70.36729431152344, -68.22250366210938, -66.07771301269531, -63.93292236328125, -61.78813171386719, -59.643341064453125, -57.49855422973633, -55.353763580322266, -53.2089729309082, -51.06418228149414, -48.91939163208008, -46.774600982666016, -44.62981414794922, -42.485023498535156, -40.340232849121094, -38.19544219970703, -36.05065155029297, -33.905860900878906, -31.761070251464844, -29.616281509399414, -27.47149085998535, -25.32670021057129, -23.18191146850586, -21.037120819091797, -18.892330169677734, -16.747539520263672, -14.602749824523926, -12.45796012878418, -10.313169479370117, -8.168378829956055, -6.023589134216309, -3.8787994384765625, -1.7340087890625, 0.4107813835144043, 2.5555715560913086, 4.700361728668213, 6.845151901245117, 8.98994255065918, 11.134732246398926, 13.279521942138672, 15.424312591552734, 17.569103240966797, 19.71389389038086, 21.85868263244629, 24.00347328186035, 26.148263931274414, 28.293052673339844, 30.437843322753906, 32.58263397216797, 34.72742462158203, 36.872215270996094, 39.017005920410156, 41.16179656982422, 43.30658721923828, 45.45137405395508, 47.59616470336914, 49.7409553527832, 51.885746002197266, 54.03053665161133, 56.17532730102539, 58.32011413574219, 60.46490478515625, 62.60969543457031, 64.75448608398438, 66.89927673339844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 12.0, 6.0, 8.0, 13.0, 22.0, 35.0, 40.0, 57.0, 81.0, 129.0, 176.0, 502.0, 7916.0, 4156474.0, 27321.0, 785.0, 243.0, 146.0, 82.0, 59.0, 45.0, 24.0, 24.0, 18.0, 13.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-51.0, -49.607421875, -48.21484375, -46.822265625, -45.4296875, -44.037109375, -42.64453125, -41.251953125, -39.859375, -38.466796875, -37.07421875, -35.681640625, -34.2890625, -32.896484375, -31.50390625, -30.111328125, -28.71875, -27.326171875, -25.93359375, -24.541015625, -23.1484375, -21.755859375, -20.36328125, -18.970703125, -17.578125, -16.185546875, -14.79296875, -13.400390625, -12.0078125, -10.615234375, -9.22265625, -7.830078125, -6.4375, -5.044921875, -3.65234375, -2.259765625, -0.8671875, 0.525390625, 1.91796875, 3.310546875, 4.703125, 6.095703125, 7.48828125, 8.880859375, 10.2734375, 11.666015625, 13.05859375, 14.451171875, 15.84375, 17.236328125, 18.62890625, 20.021484375, 21.4140625, 22.806640625, 24.19921875, 25.591796875, 26.984375, 28.376953125, 29.76953125, 31.162109375, 32.5546875, 33.947265625, 35.33984375, 36.732421875, 38.125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 10.0, 16.0, 21.0, 29.0, 38.0, 49.0, 45.0, 68.0, 62.0, 81.0, 86.0, 82.0, 112.0, 77.0, 53.0, 53.0, 40.0, 30.0, 17.0, 12.0, 7.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.8763427734375, -7.627685546875, -7.3790283203125, -7.13037109375, -6.8817138671875, -6.633056640625, -6.3843994140625, -6.1357421875, -5.8870849609375, -5.638427734375, -5.3897705078125, -5.14111328125, -4.8924560546875, -4.643798828125, -4.3951416015625, -4.146484375, -3.8978271484375, -3.649169921875, -3.4005126953125, -3.15185546875, -2.9031982421875, -2.654541015625, -2.4058837890625, -2.1572265625, -1.9085693359375, -1.659912109375, -1.4112548828125, -1.16259765625, -0.9139404296875, -0.665283203125, -0.4166259765625, -0.16796875, 0.0806884765625, 0.329345703125, 0.5780029296875, 0.82666015625, 1.0753173828125, 1.323974609375, 1.5726318359375, 1.8212890625, 2.0699462890625, 2.318603515625, 2.5672607421875, 2.81591796875, 3.0645751953125, 3.313232421875, 3.5618896484375, 3.810546875, 4.0592041015625, 4.307861328125, 4.5565185546875, 4.80517578125, 5.0538330078125, 5.302490234375, 5.5511474609375, 5.7998046875, 6.0484619140625, 6.297119140625, 6.5457763671875, 6.79443359375, 7.0430908203125, 7.291748046875, 7.5404052734375, 7.7890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 15.0, 25.0, 26.0, 42.0, 86.0, 148.0, 251.0, 481.0, 882.0, 1862.0, 3928.0, 10466.0, 35082.0, 238416.0, 3240534.0, 579594.0, 57287.0, 15000.0, 5387.0, 2332.0, 1093.0, 599.0, 323.0, 169.0, 116.0, 48.0, 30.0, 20.0, 13.0, 5.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.8687744140625, -7.573486328125, -7.2781982421875, -6.98291015625, -6.6876220703125, -6.392333984375, -6.0970458984375, -5.8017578125, -5.5064697265625, -5.211181640625, -4.9158935546875, -4.62060546875, -4.3253173828125, -4.030029296875, -3.7347412109375, -3.439453125, -3.1441650390625, -2.848876953125, -2.5535888671875, -2.25830078125, -1.9630126953125, -1.667724609375, -1.3724365234375, -1.0771484375, -0.7818603515625, -0.486572265625, -0.1912841796875, 0.10400390625, 0.3992919921875, 0.694580078125, 0.9898681640625, 1.28515625, 1.5804443359375, 1.875732421875, 2.1710205078125, 2.46630859375, 2.7615966796875, 3.056884765625, 3.3521728515625, 3.6474609375, 3.9427490234375, 4.238037109375, 4.5333251953125, 4.82861328125, 5.1239013671875, 5.419189453125, 5.7144775390625, 6.009765625, 6.3050537109375, 6.600341796875, 6.8956298828125, 7.19091796875, 7.4862060546875, 7.781494140625, 8.0767822265625, 8.3720703125, 8.6673583984375, 8.962646484375, 9.2579345703125, 9.55322265625, 9.8485107421875, 10.143798828125, 10.4390869140625, 10.734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 7.0, 14.0, 8.0, 10.0, 13.0, 18.0, 28.0, 44.0, 85.0, 168.0, 331.0, 709.0, 1008.0, 782.0, 354.0, 194.0, 99.0, 74.0, 37.0, 31.0, 18.0, 13.0, 10.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-14.0859375, -13.7210693359375, -13.356201171875, -12.9913330078125, -12.62646484375, -12.2615966796875, -11.896728515625, -11.5318603515625, -11.1669921875, -10.8021240234375, -10.437255859375, -10.0723876953125, -9.70751953125, -9.3426513671875, -8.977783203125, -8.6129150390625, -8.248046875, -7.8831787109375, -7.518310546875, -7.1534423828125, -6.78857421875, -6.4237060546875, -6.058837890625, -5.6939697265625, -5.3291015625, -4.9642333984375, -4.599365234375, -4.2344970703125, -3.86962890625, -3.5047607421875, -3.139892578125, -2.7750244140625, -2.41015625, -2.0452880859375, -1.680419921875, -1.3155517578125, -0.95068359375, -0.5858154296875, -0.220947265625, 0.1439208984375, 0.5087890625, 0.8736572265625, 1.238525390625, 1.6033935546875, 1.96826171875, 2.3331298828125, 2.697998046875, 3.0628662109375, 3.427734375, 3.7926025390625, 4.157470703125, 4.5223388671875, 4.88720703125, 5.2520751953125, 5.616943359375, 5.9818115234375, 6.3466796875, 6.7115478515625, 7.076416015625, 7.4412841796875, 7.80615234375, 8.1710205078125, 8.535888671875, 8.9007568359375, 9.265625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 30.0, 58.0, 203.0, 311.0, 212.0, 100.0, 42.0, 16.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.87675476074219, -81.71676635742188, -77.55677795410156, -73.39678955078125, -69.23680877685547, -65.07682037353516, -60.916831970214844, -56.75684356689453, -52.596858978271484, -48.43687057495117, -44.276885986328125, -40.11689758300781, -35.9569091796875, -31.796924591064453, -27.63693618774414, -23.47694969177246, -19.31696319580078, -15.156976699829102, -10.996989250183105, -6.837001800537109, -2.6770153045654297, 1.48297119140625, 5.6429595947265625, 9.802946090698242, 13.962932586669922, 18.1229190826416, 22.28290557861328, 26.442893981933594, 30.602880477905273, 34.76286697387695, 38.922855377197266, 43.08283996582031, 47.242828369140625, 51.40281677246094, 55.562801361083984, 59.7227897644043, 63.882774353027344, 68.04276275634766, 72.20275115966797, 76.36273956298828, 80.52272033691406, 84.68270874023438, 88.84269714355469, 93.002685546875, 97.16266632080078, 101.3226547241211, 105.4826431274414, 109.64263153076172, 113.80261993408203, 117.96260833740234, 122.12259674072266, 126.28257751464844, 130.44256591796875, 134.60255432128906, 138.76254272460938, 142.9225311279297, 147.08251953125, 151.2425079345703, 155.40249633789062, 159.56248474121094, 163.72247314453125, 167.8824462890625, 172.04244995117188, 176.20242309570312, 180.36241149902344]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 10.0, 8.0, 12.0, 15.0, 19.0, 16.0, 18.0, 25.0, 39.0, 41.0, 47.0, 39.0, 55.0, 55.0, 36.0, 59.0, 67.0, 59.0, 54.0, 45.0, 50.0, 31.0, 44.0, 32.0, 29.0, 19.0, 17.0, 14.0, 4.0, 6.0, 11.0, 8.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.28738021850586, -47.83977508544922, -46.39216995239258, -44.94456481933594, -43.4969596862793, -42.049354553222656, -40.60174560546875, -39.154144287109375, -37.70653533935547, -36.25893020629883, -34.81132507324219, -33.36371994018555, -31.916114807128906, -30.468509674072266, -29.020902633666992, -27.57329750061035, -26.125694274902344, -24.678089141845703, -23.230484008789062, -21.782878875732422, -20.33527374267578, -18.88766860961914, -17.440061569213867, -15.992456436157227, -14.544851303100586, -13.097246170043945, -11.649641036987305, -10.202034950256348, -8.754429817199707, -7.306824684143066, -5.859218597412109, -4.411613464355469, -2.9640045166015625, -1.5163991451263428, -0.06879377365112305, 1.3788118362426758, 2.8264169692993164, 4.274022102355957, 5.721628189086914, 7.169233322143555, 8.616838455200195, 10.064443588256836, 11.512048721313477, 12.959654808044434, 14.407259941101074, 15.854865074157715, 17.302471160888672, 18.750076293945312, 20.197681427001953, 21.645286560058594, 23.092891693115234, 24.540496826171875, 25.988101959228516, 27.435707092285156, 28.88331413269043, 30.33091926574707, 31.77852439880371, 33.226131439208984, 34.673736572265625, 36.121341705322266, 37.568946838378906, 39.01655197143555, 40.46415710449219, 41.91176223754883, 43.35936737060547]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 22.0, 22.0, 46.0, 61.0, 108.0, 182.0, 288.0, 494.0, 855.0, 1591.0, 3016.0, 5524.0, 11425.0, 25043.0, 58091.0, 152241.0, 365459.0, 257978.0, 94021.0, 38071.0, 17006.0, 8055.0, 3989.0, 2148.0, 1166.0, 651.0, 388.0, 217.0, 142.0, 88.0, 52.0, 36.0, 15.0, 16.0, 10.0, 4.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.88671875, -5.70135498046875, -5.5159912109375, -5.33062744140625, -5.145263671875, -4.95989990234375, -4.7745361328125, -4.58917236328125, -4.40380859375, -4.21844482421875, -4.0330810546875, -3.84771728515625, -3.662353515625, -3.47698974609375, -3.2916259765625, -3.10626220703125, -2.9208984375, -2.73553466796875, -2.5501708984375, -2.36480712890625, -2.179443359375, -1.99407958984375, -1.8087158203125, -1.62335205078125, -1.43798828125, -1.25262451171875, -1.0672607421875, -0.88189697265625, -0.696533203125, -0.51116943359375, -0.3258056640625, -0.14044189453125, 0.044921875, 0.23028564453125, 0.4156494140625, 0.60101318359375, 0.786376953125, 0.97174072265625, 1.1571044921875, 1.34246826171875, 1.52783203125, 1.71319580078125, 1.8985595703125, 2.08392333984375, 2.269287109375, 2.45465087890625, 2.6400146484375, 2.82537841796875, 3.0107421875, 3.19610595703125, 3.3814697265625, 3.56683349609375, 3.752197265625, 3.93756103515625, 4.1229248046875, 4.30828857421875, 4.49365234375, 4.67901611328125, 4.8643798828125, 5.04974365234375, 5.235107421875, 5.42047119140625, 5.6058349609375, 5.79119873046875, 5.9765625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 6.0, 8.0, 5.0, 16.0, 17.0, 15.0, 20.0, 19.0, 22.0, 26.0, 26.0, 22.0, 48.0, 51.0, 40.0, 45.0, 63.0, 47.0, 51.0, 55.0, 63.0, 45.0, 40.0, 29.0, 28.0, 30.0, 34.0, 29.0, 19.0, 19.0, 15.0, 9.0, 11.0, 10.0, 10.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.706329345703125, -3.55914306640625, -3.411956787109375, -3.2647705078125, -3.117584228515625, -2.97039794921875, -2.823211669921875, -2.676025390625, -2.528839111328125, -2.38165283203125, -2.234466552734375, -2.0872802734375, -1.940093994140625, -1.79290771484375, -1.645721435546875, -1.49853515625, -1.351348876953125, -1.20416259765625, -1.056976318359375, -0.9097900390625, -0.762603759765625, -0.61541748046875, -0.468231201171875, -0.321044921875, -0.173858642578125, -0.02667236328125, 0.120513916015625, 0.2677001953125, 0.414886474609375, 0.56207275390625, 0.709259033203125, 0.8564453125, 1.003631591796875, 1.15081787109375, 1.298004150390625, 1.4451904296875, 1.592376708984375, 1.73956298828125, 1.886749267578125, 2.033935546875, 2.181121826171875, 2.32830810546875, 2.475494384765625, 2.6226806640625, 2.769866943359375, 2.91705322265625, 3.064239501953125, 3.21142578125, 3.358612060546875, 3.50579833984375, 3.652984619140625, 3.8001708984375, 3.947357177734375, 4.09454345703125, 4.241729736328125, 4.388916015625, 4.536102294921875, 4.68328857421875, 4.830474853515625, 4.9776611328125, 5.124847412109375, 5.27203369140625, 5.419219970703125, 5.56640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 6.0, 5.0, 10.0, 6.0, 7.0, 9.0, 26.0, 27.0, 51.0, 76.0, 107.0, 145.0, 287.0, 540.0, 1058.0, 3041.0, 11865.0, 77104.0, 724426.0, 198187.0, 23594.0, 4813.0, 1567.0, 721.0, 337.0, 192.0, 109.0, 68.0, 43.0, 32.0, 30.0, 13.0, 14.0, 6.0, 15.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.546875, -16.0833740234375, -15.619873046875, -15.1563720703125, -14.69287109375, -14.2293701171875, -13.765869140625, -13.3023681640625, -12.8388671875, -12.3753662109375, -11.911865234375, -11.4483642578125, -10.98486328125, -10.5213623046875, -10.057861328125, -9.5943603515625, -9.130859375, -8.6673583984375, -8.203857421875, -7.7403564453125, -7.27685546875, -6.8133544921875, -6.349853515625, -5.8863525390625, -5.4228515625, -4.9593505859375, -4.495849609375, -4.0323486328125, -3.56884765625, -3.1053466796875, -2.641845703125, -2.1783447265625, -1.71484375, -1.2513427734375, -0.787841796875, -0.3243408203125, 0.13916015625, 0.6026611328125, 1.066162109375, 1.5296630859375, 1.9931640625, 2.4566650390625, 2.920166015625, 3.3836669921875, 3.84716796875, 4.3106689453125, 4.774169921875, 5.2376708984375, 5.701171875, 6.1646728515625, 6.628173828125, 7.0916748046875, 7.55517578125, 8.0186767578125, 8.482177734375, 8.9456787109375, 9.4091796875, 9.8726806640625, 10.336181640625, 10.7996826171875, 11.26318359375, 11.7266845703125, 12.190185546875, 12.6536865234375, 13.1171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 7.0, 9.0, 8.0, 17.0, 11.0, 15.0, 17.0, 27.0, 37.0, 32.0, 37.0, 36.0, 59.0, 52.0, 60.0, 58.0, 45.0, 61.0, 56.0, 48.0, 54.0, 47.0, 38.0, 25.0, 23.0, 20.0, 18.0, 16.0, 12.0, 13.0, 5.0, 10.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.078125, -21.457275390625, -20.83642578125, -20.215576171875, -19.5947265625, -18.973876953125, -18.35302734375, -17.732177734375, -17.111328125, -16.490478515625, -15.86962890625, -15.248779296875, -14.6279296875, -14.007080078125, -13.38623046875, -12.765380859375, -12.14453125, -11.523681640625, -10.90283203125, -10.281982421875, -9.6611328125, -9.040283203125, -8.41943359375, -7.798583984375, -7.177734375, -6.556884765625, -5.93603515625, -5.315185546875, -4.6943359375, -4.073486328125, -3.45263671875, -2.831787109375, -2.2109375, -1.590087890625, -0.96923828125, -0.348388671875, 0.2724609375, 0.893310546875, 1.51416015625, 2.135009765625, 2.755859375, 3.376708984375, 3.99755859375, 4.618408203125, 5.2392578125, 5.860107421875, 6.48095703125, 7.101806640625, 7.72265625, 8.343505859375, 8.96435546875, 9.585205078125, 10.2060546875, 10.826904296875, 11.44775390625, 12.068603515625, 12.689453125, 13.310302734375, 13.93115234375, 14.552001953125, 15.1728515625, 15.793701171875, 16.41455078125, 17.035400390625, 17.65625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 3.0, 5.0, 7.0, 7.0, 21.0, 25.0, 49.0, 106.0, 253.0, 756.0, 3149.0, 30383.0, 877432.0, 127014.0, 7278.0, 1318.0, 366.0, 175.0, 83.0, 37.0, 18.0, 16.0, 14.0, 12.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.91796875, -10.5625, -10.20703125, -9.8515625, -9.49609375, -9.140625, -8.78515625, -8.4296875, -8.07421875, -7.71875, -7.36328125, -7.0078125, -6.65234375, -6.296875, -5.94140625, -5.5859375, -5.23046875, -4.875, -4.51953125, -4.1640625, -3.80859375, -3.453125, -3.09765625, -2.7421875, -2.38671875, -2.03125, -1.67578125, -1.3203125, -0.96484375, -0.609375, -0.25390625, 0.1015625, 0.45703125, 0.8125, 1.16796875, 1.5234375, 1.87890625, 2.234375, 2.58984375, 2.9453125, 3.30078125, 3.65625, 4.01171875, 4.3671875, 4.72265625, 5.078125, 5.43359375, 5.7890625, 6.14453125, 6.5, 6.85546875, 7.2109375, 7.56640625, 7.921875, 8.27734375, 8.6328125, 8.98828125, 9.34375, 9.69921875, 10.0546875, 10.41015625, 10.765625, 11.12109375, 11.4765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 9.0, 6.0, 6.0, 15.0, 15.0, 29.0, 37.0, 57.0, 61.0, 94.0, 116.0, 125.0, 118.0, 86.0, 63.0, 35.0, 18.0, 15.0, 21.0, 9.0, 9.0, 8.0, 8.0, 4.0, 6.0, 5.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012149810791015625, -0.0011805295944213867, -0.001146078109741211, -0.0011116266250610352, -0.0010771751403808594, -0.0010427236557006836, -0.0010082721710205078, -0.000973820686340332, -0.0009393692016601562, -0.0009049177169799805, -0.0008704662322998047, -0.0008360147476196289, -0.0008015632629394531, -0.0007671117782592773, -0.0007326602935791016, -0.0006982088088989258, -0.00066375732421875, -0.0006293058395385742, -0.0005948543548583984, -0.0005604028701782227, -0.0005259513854980469, -0.0004914999008178711, -0.0004570484161376953, -0.00042259693145751953, -0.00038814544677734375, -0.00035369396209716797, -0.0003192424774169922, -0.0002847909927368164, -0.0002503395080566406, -0.00021588802337646484, -0.00018143653869628906, -0.00014698505401611328, -0.0001125335693359375, -7.808208465576172e-05, -4.363059997558594e-05, -9.179115295410156e-06, 2.5272369384765625e-05, 5.9723854064941406e-05, 9.417533874511719e-05, 0.00012862682342529297, 0.00016307830810546875, 0.00019752979278564453, 0.0002319812774658203, 0.0002664327621459961, 0.0003008842468261719, 0.00033533573150634766, 0.00036978721618652344, 0.0004042387008666992, 0.000438690185546875, 0.0004731416702270508, 0.0005075931549072266, 0.0005420446395874023, 0.0005764961242675781, 0.0006109476089477539, 0.0006453990936279297, 0.0006798505783081055, 0.0007143020629882812, 0.000748753547668457, 0.0007832050323486328, 0.0008176565170288086, 0.0008521080017089844, 0.0008865594863891602, 0.0009210109710693359, 0.0009554624557495117, 0.0009899139404296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 8.0, 8.0, 17.0, 34.0, 52.0, 92.0, 155.0, 366.0, 777.0, 2161.0, 8029.0, 44676.0, 646346.0, 309173.0, 27889.0, 5784.0, 1685.0, 641.0, 295.0, 137.0, 83.0, 52.0, 25.0, 18.0, 13.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.66510009765625, -5.4278564453125, -5.19061279296875, -4.953369140625, -4.71612548828125, -4.4788818359375, -4.24163818359375, -4.00439453125, -3.76715087890625, -3.5299072265625, -3.29266357421875, -3.055419921875, -2.81817626953125, -2.5809326171875, -2.34368896484375, -2.1064453125, -1.86920166015625, -1.6319580078125, -1.39471435546875, -1.157470703125, -0.92022705078125, -0.6829833984375, -0.44573974609375, -0.20849609375, 0.02874755859375, 0.2659912109375, 0.50323486328125, 0.740478515625, 0.97772216796875, 1.2149658203125, 1.45220947265625, 1.689453125, 1.92669677734375, 2.1639404296875, 2.40118408203125, 2.638427734375, 2.87567138671875, 3.1129150390625, 3.35015869140625, 3.58740234375, 3.82464599609375, 4.0618896484375, 4.29913330078125, 4.536376953125, 4.77362060546875, 5.0108642578125, 5.24810791015625, 5.4853515625, 5.72259521484375, 5.9598388671875, 6.19708251953125, 6.434326171875, 6.67156982421875, 6.9088134765625, 7.14605712890625, 7.38330078125, 7.62054443359375, 7.8577880859375, 8.09503173828125, 8.332275390625, 8.56951904296875, 8.8067626953125, 9.04400634765625, 9.28125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 6.0, 11.0, 6.0, 15.0, 13.0, 19.0, 27.0, 26.0, 37.0, 46.0, 59.0, 86.0, 91.0, 94.0, 73.0, 65.0, 85.0, 50.0, 41.0, 25.0, 18.0, 16.0, 19.0, 12.0, 12.0, 9.0, 9.0, 9.0, 4.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.96343994140625, -4.8057861328125, -4.64813232421875, -4.490478515625, -4.33282470703125, -4.1751708984375, -4.01751708984375, -3.85986328125, -3.70220947265625, -3.5445556640625, -3.38690185546875, -3.229248046875, -3.07159423828125, -2.9139404296875, -2.75628662109375, -2.5986328125, -2.44097900390625, -2.2833251953125, -2.12567138671875, -1.968017578125, -1.81036376953125, -1.6527099609375, -1.49505615234375, -1.33740234375, -1.17974853515625, -1.0220947265625, -0.86444091796875, -0.706787109375, -0.54913330078125, -0.3914794921875, -0.23382568359375, -0.076171875, 0.08148193359375, 0.2391357421875, 0.39678955078125, 0.554443359375, 0.71209716796875, 0.8697509765625, 1.02740478515625, 1.18505859375, 1.34271240234375, 1.5003662109375, 1.65802001953125, 1.815673828125, 1.97332763671875, 2.1309814453125, 2.28863525390625, 2.4462890625, 2.60394287109375, 2.7615966796875, 2.91925048828125, 3.076904296875, 3.23455810546875, 3.3922119140625, 3.54986572265625, 3.70751953125, 3.86517333984375, 4.0228271484375, 4.18048095703125, 4.338134765625, 4.49578857421875, 4.6534423828125, 4.81109619140625, 4.96875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 9.0, 33.0, 92.0, 314.0, 373.0, 127.0, 23.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.34764099121094, -122.90054321289062, -116.45343780517578, -110.00634002685547, -103.55923461914062, -97.11213684082031, -90.6650390625, -84.21794128417969, -77.77083587646484, -71.32373809814453, -64.87663269042969, -58.429534912109375, -51.9824333190918, -45.53533172607422, -39.088233947753906, -32.64113235473633, -26.19403076171875, -19.746929168701172, -13.299829483032227, -6.852729797363281, -0.4056282043457031, 6.041473388671875, 12.488571166992188, 18.935672760009766, 25.382774353027344, 31.829875946044922, 38.2769775390625, 44.72407531738281, 51.17117691040039, 57.61827850341797, 64.06537628173828, 70.51248168945312, 76.9595947265625, 83.40669250488281, 89.85379791259766, 96.30089569091797, 102.74800109863281, 109.19509887695312, 115.64219665527344, 122.08929443359375, 128.53640747070312, 134.98350524902344, 141.43060302734375, 147.87771606445312, 154.32481384277344, 160.77191162109375, 167.21900939941406, 173.66610717773438, 180.1132049560547, 186.560302734375, 193.0074005126953, 199.45449829101562, 205.901611328125, 212.3487091064453, 218.79580688476562, 225.24290466308594, 231.69000244140625, 238.13710021972656, 244.58419799804688, 251.03131103515625, 257.4783935546875, 263.9255065917969, 270.37261962890625, 276.8197021484375, 283.2668151855469]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 10.0, 8.0, 9.0, 23.0, 15.0, 15.0, 23.0, 22.0, 36.0, 28.0, 48.0, 36.0, 50.0, 62.0, 57.0, 57.0, 69.0, 46.0, 52.0, 39.0, 38.0, 35.0, 38.0, 27.0, 18.0, 22.0, 19.0, 15.0, 15.0, 11.0, 13.0, 4.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.213623046875, -72.89950561523438, -70.58538818359375, -68.27127075195312, -65.9571533203125, -63.643035888671875, -61.328914642333984, -59.01479721069336, -56.700679779052734, -54.38656234741211, -52.072444915771484, -49.75832748413086, -47.44420623779297, -45.130088806152344, -42.81597137451172, -40.501853942871094, -38.18773651123047, -35.873619079589844, -33.55950164794922, -31.24538230895996, -28.931264877319336, -26.61714744567871, -24.303028106689453, -21.988910675048828, -19.674793243408203, -17.360675811767578, -15.046557426452637, -12.732439041137695, -10.41832160949707, -8.104204177856445, -5.790085792541504, -3.4759674072265625, -1.1618499755859375, 1.1522679328918457, 3.466385841369629, 5.780503749847412, 8.094621658325195, 10.40873908996582, 12.722857475280762, 15.036975860595703, 17.351093292236328, 19.665210723876953, 21.979328155517578, 24.293447494506836, 26.60756492614746, 28.921682357788086, 31.235801696777344, 33.54991912841797, 35.864036560058594, 38.17815399169922, 40.492271423339844, 42.80638885498047, 45.120506286621094, 47.43462371826172, 49.74874496459961, 52.062862396240234, 54.37697982788086, 56.691097259521484, 59.00521469116211, 61.319332122802734, 63.633453369140625, 65.94757080078125, 68.26168823242188, 70.5758056640625, 72.88992309570312]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 16.0, 9.0, 21.0, 29.0, 35.0, 55.0, 104.0, 155.0, 284.0, 493.0, 889.0, 1682.0, 3440.0, 7669.0, 19620.0, 70516.0, 494427.0, 2579530.0, 864646.0, 106542.0, 25816.0, 9611.0, 4223.0, 1982.0, 1056.0, 608.0, 308.0, 179.0, 113.0, 64.0, 51.0, 33.0, 23.0, 14.0, 14.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-6.98828125, -6.7974853515625, -6.606689453125, -6.4158935546875, -6.22509765625, -6.0343017578125, -5.843505859375, -5.6527099609375, -5.4619140625, -5.2711181640625, -5.080322265625, -4.8895263671875, -4.69873046875, -4.5079345703125, -4.317138671875, -4.1263427734375, -3.935546875, -3.7447509765625, -3.553955078125, -3.3631591796875, -3.17236328125, -2.9815673828125, -2.790771484375, -2.5999755859375, -2.4091796875, -2.2183837890625, -2.027587890625, -1.8367919921875, -1.64599609375, -1.4552001953125, -1.264404296875, -1.0736083984375, -0.8828125, -0.6920166015625, -0.501220703125, -0.3104248046875, -0.11962890625, 0.0711669921875, 0.261962890625, 0.4527587890625, 0.6435546875, 0.8343505859375, 1.025146484375, 1.2159423828125, 1.40673828125, 1.5975341796875, 1.788330078125, 1.9791259765625, 2.169921875, 2.3607177734375, 2.551513671875, 2.7423095703125, 2.93310546875, 3.1239013671875, 3.314697265625, 3.5054931640625, 3.6962890625, 3.8870849609375, 4.077880859375, 4.2686767578125, 4.45947265625, 4.6502685546875, 4.841064453125, 5.0318603515625, 5.22265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 13.0, 14.0, 16.0, 23.0, 27.0, 37.0, 35.0, 27.0, 28.0, 43.0, 45.0, 46.0, 53.0, 34.0, 62.0, 67.0, 42.0, 42.0, 47.0, 37.0, 37.0, 40.0, 23.0, 21.0, 21.0, 18.0, 22.0, 9.0, 8.0, 11.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.539825439453125, -3.40972900390625, -3.279632568359375, -3.1495361328125, -3.019439697265625, -2.88934326171875, -2.759246826171875, -2.629150390625, -2.499053955078125, -2.36895751953125, -2.238861083984375, -2.1087646484375, -1.978668212890625, -1.84857177734375, -1.718475341796875, -1.58837890625, -1.458282470703125, -1.32818603515625, -1.198089599609375, -1.0679931640625, -0.937896728515625, -0.80780029296875, -0.677703857421875, -0.547607421875, -0.417510986328125, -0.28741455078125, -0.157318115234375, -0.0272216796875, 0.102874755859375, 0.23297119140625, 0.363067626953125, 0.4931640625, 0.623260498046875, 0.75335693359375, 0.883453369140625, 1.0135498046875, 1.143646240234375, 1.27374267578125, 1.403839111328125, 1.533935546875, 1.664031982421875, 1.79412841796875, 1.924224853515625, 2.0543212890625, 2.184417724609375, 2.31451416015625, 2.444610595703125, 2.57470703125, 2.704803466796875, 2.83489990234375, 2.964996337890625, 3.0950927734375, 3.225189208984375, 3.35528564453125, 3.485382080078125, 3.615478515625, 3.745574951171875, 3.87567138671875, 4.005767822265625, 4.1358642578125, 4.265960693359375, 4.39605712890625, 4.526153564453125, 4.65625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 15.0, 25.0, 15.0, 29.0, 32.0, 59.0, 87.0, 132.0, 244.0, 517.0, 979.0, 2215.0, 5011.0, 14441.0, 48753.0, 289734.0, 2954984.0, 752150.0, 89316.0, 22695.0, 7467.0, 2818.0, 1163.0, 575.0, 306.0, 175.0, 97.0, 46.0, 46.0, 35.0, 17.0, 20.0, 14.0, 7.0, 7.0, 6.0, 2.0, 2.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40625, -7.138671875, -6.87109375, -6.603515625, -6.3359375, -6.068359375, -5.80078125, -5.533203125, -5.265625, -4.998046875, -4.73046875, -4.462890625, -4.1953125, -3.927734375, -3.66015625, -3.392578125, -3.125, -2.857421875, -2.58984375, -2.322265625, -2.0546875, -1.787109375, -1.51953125, -1.251953125, -0.984375, -0.716796875, -0.44921875, -0.181640625, 0.0859375, 0.353515625, 0.62109375, 0.888671875, 1.15625, 1.423828125, 1.69140625, 1.958984375, 2.2265625, 2.494140625, 2.76171875, 3.029296875, 3.296875, 3.564453125, 3.83203125, 4.099609375, 4.3671875, 4.634765625, 4.90234375, 5.169921875, 5.4375, 5.705078125, 5.97265625, 6.240234375, 6.5078125, 6.775390625, 7.04296875, 7.310546875, 7.578125, 7.845703125, 8.11328125, 8.380859375, 8.6484375, 8.916015625, 9.18359375, 9.451171875, 9.71875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 11.0, 16.0, 25.0, 19.0, 39.0, 40.0, 82.0, 124.0, 230.0, 376.0, 577.0, 722.0, 639.0, 384.0, 247.0, 181.0, 105.0, 70.0, 43.0, 38.0, 21.0, 16.0, 15.0, 6.0, 10.0, 6.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3828125, -10.0443115234375, -9.705810546875, -9.3673095703125, -9.02880859375, -8.6903076171875, -8.351806640625, -8.0133056640625, -7.6748046875, -7.3363037109375, -6.997802734375, -6.6593017578125, -6.32080078125, -5.9822998046875, -5.643798828125, -5.3052978515625, -4.966796875, -4.6282958984375, -4.289794921875, -3.9512939453125, -3.61279296875, -3.2742919921875, -2.935791015625, -2.5972900390625, -2.2587890625, -1.9202880859375, -1.581787109375, -1.2432861328125, -0.90478515625, -0.5662841796875, -0.227783203125, 0.1107177734375, 0.44921875, 0.7877197265625, 1.126220703125, 1.4647216796875, 1.80322265625, 2.1417236328125, 2.480224609375, 2.8187255859375, 3.1572265625, 3.4957275390625, 3.834228515625, 4.1727294921875, 4.51123046875, 4.8497314453125, 5.188232421875, 5.5267333984375, 5.865234375, 6.2037353515625, 6.542236328125, 6.8807373046875, 7.21923828125, 7.5577392578125, 7.896240234375, 8.2347412109375, 8.5732421875, 8.9117431640625, 9.250244140625, 9.5887451171875, 9.92724609375, 10.2657470703125, 10.604248046875, 10.9427490234375, 11.28125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 22.0, 94.0, 279.0, 332.0, 176.0, 54.0, 15.0, 10.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.1763916015625, -186.99813842773438, -180.81988525390625, -174.64163208007812, -168.46337890625, -162.28512573242188, -156.10687255859375, -149.92861938476562, -143.7503662109375, -137.57211303710938, -131.39385986328125, -125.21560668945312, -119.037353515625, -112.85910034179688, -106.68084716796875, -100.50259399414062, -94.32433319091797, -88.14608001708984, -81.96782684326172, -75.7895736694336, -69.61132049560547, -63.433067321777344, -57.25481033325195, -51.07655715942383, -44.8983039855957, -38.72005081176758, -32.54179763793945, -26.363542556762695, -20.18528938293457, -14.007036209106445, -7.8287811279296875, -1.6505279541015625, 4.5277252197265625, 10.705978393554688, 16.884231567382812, 23.06248664855957, 29.240739822387695, 35.41899108886719, 41.59724807739258, 47.7755012512207, 53.95375442504883, 60.13200759887695, 66.31026458740234, 72.48851776123047, 78.6667709350586, 84.84502410888672, 91.02327728271484, 97.20153045654297, 103.3797836303711, 109.55803680419922, 115.73628997802734, 121.91454315185547, 128.09280395507812, 134.27105712890625, 140.44931030273438, 146.6275634765625, 152.80581665039062, 158.98406982421875, 165.16232299804688, 171.340576171875, 177.51882934570312, 183.69708251953125, 189.87533569335938, 196.0535888671875, 202.23184204101562]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 9.0, 9.0, 10.0, 15.0, 16.0, 15.0, 17.0, 31.0, 29.0, 27.0, 40.0, 21.0, 24.0, 38.0, 37.0, 55.0, 53.0, 51.0, 42.0, 40.0, 48.0, 46.0, 35.0, 34.0, 39.0, 25.0, 32.0, 25.0, 28.0, 14.0, 13.0, 14.0, 13.0, 11.0, 8.0, 8.0, 3.0, 5.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.9694709777832, -44.469940185546875, -42.97040939331055, -41.47087860107422, -39.97134780883789, -38.47181701660156, -36.9722900390625, -35.472755432128906, -33.973228454589844, -32.473697662353516, -30.974166870117188, -29.47463607788086, -27.97510528564453, -26.475574493408203, -24.976045608520508, -23.47651481628418, -21.97698211669922, -20.47745132446289, -18.977920532226562, -17.478389739990234, -15.978859901428223, -14.479329109191895, -12.979799270629883, -11.480268478393555, -9.980737686157227, -8.481206893920898, -6.9816765785217285, -5.482146263122559, -3.9826154708862305, -2.4830846786499023, -0.9835548400878906, 0.5159759521484375, 2.0155105590820312, 3.5150411128997803, 5.014571666717529, 6.514101982116699, 8.013632774353027, 9.513163566589355, 11.012693405151367, 12.512224197387695, 14.011754989624023, 15.511285781860352, 17.01081657409668, 18.510345458984375, 20.009876251220703, 21.50940704345703, 23.00893783569336, 24.508468627929688, 26.007999420166016, 27.507530212402344, 29.007061004638672, 30.506591796875, 32.00612258911133, 33.505653381347656, 35.00518035888672, 36.50471496582031, 38.004241943359375, 39.5037727355957, 41.00330352783203, 42.50283432006836, 44.00236511230469, 45.501895904541016, 47.001426696777344, 48.500953674316406, 50.00048828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 11.0, 12.0, 17.0, 20.0, 26.0, 46.0, 72.0, 92.0, 172.0, 243.0, 416.0, 783.0, 1375.0, 2686.0, 5485.0, 11499.0, 24417.0, 53221.0, 115245.0, 240214.0, 294375.0, 159680.0, 73638.0, 34049.0, 15720.0, 7213.0, 3615.0, 1810.0, 972.0, 543.0, 319.0, 202.0, 116.0, 73.0, 63.0, 39.0, 17.0, 19.0, 9.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.36480712890625, -4.2100830078125, -4.05535888671875, -3.900634765625, -3.74591064453125, -3.5911865234375, -3.43646240234375, -3.28173828125, -3.12701416015625, -2.9722900390625, -2.81756591796875, -2.662841796875, -2.50811767578125, -2.3533935546875, -2.19866943359375, -2.0439453125, -1.88922119140625, -1.7344970703125, -1.57977294921875, -1.425048828125, -1.27032470703125, -1.1156005859375, -0.96087646484375, -0.80615234375, -0.65142822265625, -0.4967041015625, -0.34197998046875, -0.187255859375, -0.03253173828125, 0.1221923828125, 0.27691650390625, 0.431640625, 0.58636474609375, 0.7410888671875, 0.89581298828125, 1.050537109375, 1.20526123046875, 1.3599853515625, 1.51470947265625, 1.66943359375, 1.82415771484375, 1.9788818359375, 2.13360595703125, 2.288330078125, 2.44305419921875, 2.5977783203125, 2.75250244140625, 2.9072265625, 3.06195068359375, 3.2166748046875, 3.37139892578125, 3.526123046875, 3.68084716796875, 3.8355712890625, 3.99029541015625, 4.14501953125, 4.29974365234375, 4.4544677734375, 4.60919189453125, 4.763916015625, 4.91864013671875, 5.0733642578125, 5.22808837890625, 5.3828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 4.0, 7.0, 8.0, 6.0, 15.0, 12.0, 14.0, 22.0, 23.0, 33.0, 45.0, 32.0, 39.0, 57.0, 37.0, 36.0, 49.0, 48.0, 47.0, 56.0, 42.0, 42.0, 42.0, 43.0, 36.0, 34.0, 33.0, 20.0, 20.0, 24.0, 13.0, 12.0, 14.0, 12.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.564453125, -3.437103271484375, -3.30975341796875, -3.182403564453125, -3.0550537109375, -2.927703857421875, -2.80035400390625, -2.673004150390625, -2.545654296875, -2.418304443359375, -2.29095458984375, -2.163604736328125, -2.0362548828125, -1.908905029296875, -1.78155517578125, -1.654205322265625, -1.52685546875, -1.399505615234375, -1.27215576171875, -1.144805908203125, -1.0174560546875, -0.890106201171875, -0.76275634765625, -0.635406494140625, -0.508056640625, -0.380706787109375, -0.25335693359375, -0.126007080078125, 0.0013427734375, 0.128692626953125, 0.25604248046875, 0.383392333984375, 0.5107421875, 0.638092041015625, 0.76544189453125, 0.892791748046875, 1.0201416015625, 1.147491455078125, 1.27484130859375, 1.402191162109375, 1.529541015625, 1.656890869140625, 1.78424072265625, 1.911590576171875, 2.0389404296875, 2.166290283203125, 2.29364013671875, 2.420989990234375, 2.54833984375, 2.675689697265625, 2.80303955078125, 2.930389404296875, 3.0577392578125, 3.185089111328125, 3.31243896484375, 3.439788818359375, 3.567138671875, 3.694488525390625, 3.82183837890625, 3.949188232421875, 4.0765380859375, 4.203887939453125, 4.33123779296875, 4.458587646484375, 4.5859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 2.0, 7.0, 6.0, 3.0, 14.0, 20.0, 18.0, 34.0, 43.0, 80.0, 89.0, 143.0, 252.0, 400.0, 621.0, 1206.0, 2482.0, 7750.0, 45632.0, 649921.0, 301866.0, 27685.0, 5735.0, 1992.0, 1014.0, 521.0, 335.0, 218.0, 152.0, 92.0, 70.0, 45.0, 28.0, 18.0, 23.0, 7.0, 6.0, 3.0, 12.0, 8.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-17.234375, -16.7540283203125, -16.273681640625, -15.7933349609375, -15.31298828125, -14.8326416015625, -14.352294921875, -13.8719482421875, -13.3916015625, -12.9112548828125, -12.430908203125, -11.9505615234375, -11.47021484375, -10.9898681640625, -10.509521484375, -10.0291748046875, -9.548828125, -9.0684814453125, -8.588134765625, -8.1077880859375, -7.62744140625, -7.1470947265625, -6.666748046875, -6.1864013671875, -5.7060546875, -5.2257080078125, -4.745361328125, -4.2650146484375, -3.78466796875, -3.3043212890625, -2.823974609375, -2.3436279296875, -1.86328125, -1.3829345703125, -0.902587890625, -0.4222412109375, 0.05810546875, 0.5384521484375, 1.018798828125, 1.4991455078125, 1.9794921875, 2.4598388671875, 2.940185546875, 3.4205322265625, 3.90087890625, 4.3812255859375, 4.861572265625, 5.3419189453125, 5.822265625, 6.3026123046875, 6.782958984375, 7.2633056640625, 7.74365234375, 8.2239990234375, 8.704345703125, 9.1846923828125, 9.6650390625, 10.1453857421875, 10.625732421875, 11.1060791015625, 11.58642578125, 12.0667724609375, 12.547119140625, 13.0274658203125, 13.5078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 3.0, 6.0, 6.0, 7.0, 4.0, 7.0, 17.0, 11.0, 20.0, 11.0, 34.0, 34.0, 36.0, 44.0, 37.0, 33.0, 41.0, 52.0, 54.0, 56.0, 52.0, 41.0, 53.0, 37.0, 44.0, 41.0, 26.0, 37.0, 20.0, 28.0, 21.0, 23.0, 13.0, 7.0, 6.0, 11.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.578125, -16.022216796875, -15.46630859375, -14.910400390625, -14.3544921875, -13.798583984375, -13.24267578125, -12.686767578125, -12.130859375, -11.574951171875, -11.01904296875, -10.463134765625, -9.9072265625, -9.351318359375, -8.79541015625, -8.239501953125, -7.68359375, -7.127685546875, -6.57177734375, -6.015869140625, -5.4599609375, -4.904052734375, -4.34814453125, -3.792236328125, -3.236328125, -2.680419921875, -2.12451171875, -1.568603515625, -1.0126953125, -0.456787109375, 0.09912109375, 0.655029296875, 1.2109375, 1.766845703125, 2.32275390625, 2.878662109375, 3.4345703125, 3.990478515625, 4.54638671875, 5.102294921875, 5.658203125, 6.214111328125, 6.77001953125, 7.325927734375, 7.8818359375, 8.437744140625, 8.99365234375, 9.549560546875, 10.10546875, 10.661376953125, 11.21728515625, 11.773193359375, 12.3291015625, 12.885009765625, 13.44091796875, 13.996826171875, 14.552734375, 15.108642578125, 15.66455078125, 16.220458984375, 16.7763671875, 17.332275390625, 17.88818359375, 18.444091796875, 19.0]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 16.0, 18.0, 27.0, 41.0, 62.0, 113.0, 154.0, 266.0, 425.0, 835.0, 1901.0, 5364.0, 23170.0, 138958.0, 737189.0, 112293.0, 19288.0, 4881.0, 1745.0, 769.0, 426.0, 233.0, 145.0, 79.0, 37.0, 37.0, 29.0, 19.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.8359375, -6.65338134765625, -6.4708251953125, -6.28826904296875, -6.105712890625, -5.92315673828125, -5.7406005859375, -5.55804443359375, -5.37548828125, -5.19293212890625, -5.0103759765625, -4.82781982421875, -4.645263671875, -4.46270751953125, -4.2801513671875, -4.09759521484375, -3.9150390625, -3.73248291015625, -3.5499267578125, -3.36737060546875, -3.184814453125, -3.00225830078125, -2.8197021484375, -2.63714599609375, -2.45458984375, -2.27203369140625, -2.0894775390625, -1.90692138671875, -1.724365234375, -1.54180908203125, -1.3592529296875, -1.17669677734375, -0.994140625, -0.81158447265625, -0.6290283203125, -0.44647216796875, -0.263916015625, -0.08135986328125, 0.1011962890625, 0.28375244140625, 0.46630859375, 0.64886474609375, 0.8314208984375, 1.01397705078125, 1.196533203125, 1.37908935546875, 1.5616455078125, 1.74420166015625, 1.9267578125, 2.10931396484375, 2.2918701171875, 2.47442626953125, 2.656982421875, 2.83953857421875, 3.0220947265625, 3.20465087890625, 3.38720703125, 3.56976318359375, 3.7523193359375, 3.93487548828125, 4.117431640625, 4.29998779296875, 4.4825439453125, 4.66510009765625, 4.84765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 11.0, 12.0, 12.0, 18.0, 14.0, 14.0, 23.0, 29.0, 28.0, 31.0, 39.0, 64.0, 90.0, 116.0, 108.0, 73.0, 47.0, 35.0, 32.0, 34.0, 20.0, 28.0, 17.0, 11.0, 10.0, 11.0, 8.0, 7.0, 5.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0011053085327148438, -0.001072719693183899, -0.001040130853652954, -0.0010075420141220093, -0.0009749531745910645, -0.0009423643350601196, -0.0009097754955291748, -0.00087718665599823, -0.0008445978164672852, -0.0008120089769363403, -0.0007794201374053955, -0.0007468312978744507, -0.0007142424583435059, -0.000681653618812561, -0.0006490647792816162, -0.0006164759397506714, -0.0005838871002197266, -0.0005512982606887817, -0.0005187094211578369, -0.0004861205816268921, -0.00045353174209594727, -0.00042094290256500244, -0.0003883540630340576, -0.0003557652235031128, -0.00032317638397216797, -0.00029058754444122314, -0.0002579987049102783, -0.0002254098653793335, -0.00019282102584838867, -0.00016023218631744385, -0.00012764334678649902, -9.50545072555542e-05, -6.246566772460938e-05, -2.987682819366455e-05, 2.7120113372802734e-06, 3.53008508682251e-05, 6.788969039916992e-05, 0.00010047852993011475, 0.00013306736946105957, 0.0001656562089920044, 0.00019824504852294922, 0.00023083388805389404, 0.00026342272758483887, 0.0002960115671157837, 0.0003286004066467285, 0.00036118924617767334, 0.00039377808570861816, 0.000426366925239563, 0.0004589557647705078, 0.0004915446043014526, 0.0005241334438323975, 0.0005567222833633423, 0.0005893111228942871, 0.0006218999624252319, 0.0006544888019561768, 0.0006870776414871216, 0.0007196664810180664, 0.0007522553205490112, 0.0007848441600799561, 0.0008174329996109009, 0.0008500218391418457, 0.0008826106786727905, 0.0009151995182037354, 0.0009477883577346802, 0.000980377197265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 0.0, 3.0, 5.0, 7.0, 22.0, 29.0, 35.0, 35.0, 65.0, 68.0, 110.0, 133.0, 198.0, 310.0, 527.0, 945.0, 1786.0, 3914.0, 10468.0, 37252.0, 184946.0, 666731.0, 103724.0, 23334.0, 7413.0, 2975.0, 1403.0, 786.0, 438.0, 268.0, 175.0, 122.0, 104.0, 48.0, 46.0, 24.0, 29.0, 22.0, 8.0, 14.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.6171875, -5.44866943359375, -5.2801513671875, -5.11163330078125, -4.943115234375, -4.77459716796875, -4.6060791015625, -4.43756103515625, -4.26904296875, -4.10052490234375, -3.9320068359375, -3.76348876953125, -3.594970703125, -3.42645263671875, -3.2579345703125, -3.08941650390625, -2.9208984375, -2.75238037109375, -2.5838623046875, -2.41534423828125, -2.246826171875, -2.07830810546875, -1.9097900390625, -1.74127197265625, -1.57275390625, -1.40423583984375, -1.2357177734375, -1.06719970703125, -0.898681640625, -0.73016357421875, -0.5616455078125, -0.39312744140625, -0.224609375, -0.05609130859375, 0.1124267578125, 0.28094482421875, 0.449462890625, 0.61798095703125, 0.7864990234375, 0.95501708984375, 1.12353515625, 1.29205322265625, 1.4605712890625, 1.62908935546875, 1.797607421875, 1.96612548828125, 2.1346435546875, 2.30316162109375, 2.4716796875, 2.64019775390625, 2.8087158203125, 2.97723388671875, 3.145751953125, 3.31427001953125, 3.4827880859375, 3.65130615234375, 3.81982421875, 3.98834228515625, 4.1568603515625, 4.32537841796875, 4.493896484375, 4.66241455078125, 4.8309326171875, 4.99945068359375, 5.16796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 7.0, 13.0, 14.0, 11.0, 14.0, 22.0, 21.0, 27.0, 35.0, 30.0, 45.0, 57.0, 78.0, 89.0, 73.0, 87.0, 54.0, 56.0, 47.0, 31.0, 32.0, 26.0, 20.0, 24.0, 12.0, 8.0, 8.0, 11.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.8046875, -4.66387939453125, -4.5230712890625, -4.38226318359375, -4.241455078125, -4.10064697265625, -3.9598388671875, -3.81903076171875, -3.67822265625, -3.53741455078125, -3.3966064453125, -3.25579833984375, -3.114990234375, -2.97418212890625, -2.8333740234375, -2.69256591796875, -2.5517578125, -2.41094970703125, -2.2701416015625, -2.12933349609375, -1.988525390625, -1.84771728515625, -1.7069091796875, -1.56610107421875, -1.42529296875, -1.28448486328125, -1.1436767578125, -1.00286865234375, -0.862060546875, -0.72125244140625, -0.5804443359375, -0.43963623046875, -0.298828125, -0.15802001953125, -0.0172119140625, 0.12359619140625, 0.264404296875, 0.40521240234375, 0.5460205078125, 0.68682861328125, 0.82763671875, 0.96844482421875, 1.1092529296875, 1.25006103515625, 1.390869140625, 1.53167724609375, 1.6724853515625, 1.81329345703125, 1.9541015625, 2.09490966796875, 2.2357177734375, 2.37652587890625, 2.517333984375, 2.65814208984375, 2.7989501953125, 2.93975830078125, 3.08056640625, 3.22137451171875, 3.3621826171875, 3.50299072265625, 3.643798828125, 3.78460693359375, 3.9254150390625, 4.06622314453125, 4.20703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 10.0, 11.0, 27.0, 193.0, 510.0, 200.0, 34.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.8846435546875, -288.7700500488281, -280.6554870605469, -272.5408935546875, -264.42633056640625, -256.3117370605469, -248.1971435546875, -240.0825653076172, -231.96798706054688, -223.85340881347656, -215.73883056640625, -207.62423706054688, -199.50965881347656, -191.39508056640625, -183.28048706054688, -175.16590881347656, -167.05133056640625, -158.93675231933594, -150.82217407226562, -142.70758056640625, -134.59300231933594, -126.47842407226562, -118.36383819580078, -110.24925231933594, -102.13467407226562, -94.02009582519531, -85.90550994873047, -77.79092407226562, -69.67634582519531, -61.561763763427734, -53.447181701660156, -45.33259963989258, -37.217987060546875, -29.103404998779297, -20.98882293701172, -12.87424087524414, -4.7596588134765625, 3.3549232482910156, 11.469505310058594, 19.584087371826172, 27.69866943359375, 35.81325149536133, 43.927833557128906, 52.042415618896484, 60.15699768066406, 68.27157592773438, 76.38616180419922, 84.50074768066406, 92.61532592773438, 100.72990417480469, 108.84449005126953, 116.95907592773438, 125.07365417480469, 133.188232421875, 141.30282592773438, 149.4174041748047, 157.531982421875, 165.6465606689453, 173.76113891601562, 181.875732421875, 189.9903106689453, 198.10488891601562, 206.219482421875, 214.3340606689453, 222.44863891601562]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 16.0, 10.0, 9.0, 16.0, 28.0, 20.0, 30.0, 33.0, 48.0, 46.0, 50.0, 57.0, 90.0, 102.0, 84.0, 60.0, 50.0, 44.0, 33.0, 50.0, 23.0, 32.0, 21.0, 18.0, 7.0, 8.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.2222900390625, -68.44380950927734, -65.66533660888672, -62.88685607910156, -60.10837936401367, -57.32990264892578, -54.55142593383789, -51.77294921875, -48.994468688964844, -46.21599197387695, -43.43751525878906, -40.659034729003906, -37.880558013916016, -35.102081298828125, -32.323604583740234, -29.54512596130371, -26.766651153564453, -23.988174438476562, -21.20969581604004, -18.43121910095215, -15.652741432189941, -12.874263763427734, -10.095787048339844, -7.31730842590332, -4.53883171081543, -1.7603542804718018, 1.0181231498718262, 3.796600341796875, 6.575078010559082, 9.353555679321289, 12.13203239440918, 14.910511016845703, 17.688987731933594, 20.467464447021484, 23.245943069458008, 26.0244197845459, 28.802898406982422, 31.581375122070312, 34.3598518371582, 37.138328552246094, 39.91680908203125, 42.69528579711914, 45.47376251220703, 48.25224304199219, 51.03071975708008, 53.80919647216797, 56.58767318725586, 59.36614990234375, 62.14462661743164, 64.92310333251953, 67.70158386230469, 70.48005676269531, 73.25853729248047, 76.03701782226562, 78.81549072265625, 81.5939712524414, 84.37244415283203, 87.15092468261719, 89.92939758300781, 92.70787811279297, 95.4863510131836, 98.26483154296875, 101.04330444335938, 103.82178497314453, 106.60026550292969]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 15.0, 17.0, 23.0, 35.0, 39.0, 71.0, 124.0, 213.0, 289.0, 631.0, 1159.0, 2235.0, 5046.0, 12384.0, 39241.0, 271947.0, 2616698.0, 1112624.0, 96135.0, 21296.0, 7436.0, 3221.0, 1444.0, 718.0, 425.0, 270.0, 156.0, 112.0, 61.0, 60.0, 35.0, 22.0, 24.0, 12.0, 9.0, 6.0, 7.0, 6.0, 7.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.171875, -5.9495849609375, -5.727294921875, -5.5050048828125, -5.28271484375, -5.0604248046875, -4.838134765625, -4.6158447265625, -4.3935546875, -4.1712646484375, -3.948974609375, -3.7266845703125, -3.50439453125, -3.2821044921875, -3.059814453125, -2.8375244140625, -2.615234375, -2.3929443359375, -2.170654296875, -1.9483642578125, -1.72607421875, -1.5037841796875, -1.281494140625, -1.0592041015625, -0.8369140625, -0.6146240234375, -0.392333984375, -0.1700439453125, 0.05224609375, 0.2745361328125, 0.496826171875, 0.7191162109375, 0.94140625, 1.1636962890625, 1.385986328125, 1.6082763671875, 1.83056640625, 2.0528564453125, 2.275146484375, 2.4974365234375, 2.7197265625, 2.9420166015625, 3.164306640625, 3.3865966796875, 3.60888671875, 3.8311767578125, 4.053466796875, 4.2757568359375, 4.498046875, 4.7203369140625, 4.942626953125, 5.1649169921875, 5.38720703125, 5.6094970703125, 5.831787109375, 6.0540771484375, 6.2763671875, 6.4986572265625, 6.720947265625, 6.9432373046875, 7.16552734375, 7.3878173828125, 7.610107421875, 7.8323974609375, 8.0546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 14.0, 7.0, 12.0, 24.0, 22.0, 36.0, 39.0, 42.0, 71.0, 70.0, 84.0, 71.0, 71.0, 87.0, 76.0, 58.0, 44.0, 39.0, 35.0, 33.0, 22.0, 17.0, 15.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7109375, -3.515869140625, -3.32080078125, -3.125732421875, -2.9306640625, -2.735595703125, -2.54052734375, -2.345458984375, -2.150390625, -1.955322265625, -1.76025390625, -1.565185546875, -1.3701171875, -1.175048828125, -0.97998046875, -0.784912109375, -0.58984375, -0.394775390625, -0.19970703125, -0.004638671875, 0.1904296875, 0.385498046875, 0.58056640625, 0.775634765625, 0.970703125, 1.165771484375, 1.36083984375, 1.555908203125, 1.7509765625, 1.946044921875, 2.14111328125, 2.336181640625, 2.53125, 2.726318359375, 2.92138671875, 3.116455078125, 3.3115234375, 3.506591796875, 3.70166015625, 3.896728515625, 4.091796875, 4.286865234375, 4.48193359375, 4.677001953125, 4.8720703125, 5.067138671875, 5.26220703125, 5.457275390625, 5.65234375, 5.847412109375, 6.04248046875, 6.237548828125, 6.4326171875, 6.627685546875, 6.82275390625, 7.017822265625, 7.212890625, 7.407958984375, 7.60302734375, 7.798095703125, 7.9931640625, 8.188232421875, 8.38330078125, 8.578369140625, 8.7734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 9.0, 10.0, 18.0, 23.0, 43.0, 71.0, 110.0, 152.0, 252.0, 506.0, 1066.0, 2947.0, 11935.0, 96999.0, 3437162.0, 602955.0, 31475.0, 5639.0, 1592.0, 611.0, 301.0, 156.0, 96.0, 61.0, 34.0, 15.0, 15.0, 5.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.390625, -11.9595947265625, -11.528564453125, -11.0975341796875, -10.66650390625, -10.2354736328125, -9.804443359375, -9.3734130859375, -8.9423828125, -8.5113525390625, -8.080322265625, -7.6492919921875, -7.21826171875, -6.7872314453125, -6.356201171875, -5.9251708984375, -5.494140625, -5.0631103515625, -4.632080078125, -4.2010498046875, -3.77001953125, -3.3389892578125, -2.907958984375, -2.4769287109375, -2.0458984375, -1.6148681640625, -1.183837890625, -0.7528076171875, -0.32177734375, 0.1092529296875, 0.540283203125, 0.9713134765625, 1.40234375, 1.8333740234375, 2.264404296875, 2.6954345703125, 3.12646484375, 3.5574951171875, 3.988525390625, 4.4195556640625, 4.8505859375, 5.2816162109375, 5.712646484375, 6.1436767578125, 6.57470703125, 7.0057373046875, 7.436767578125, 7.8677978515625, 8.298828125, 8.7298583984375, 9.160888671875, 9.5919189453125, 10.02294921875, 10.4539794921875, 10.885009765625, 11.3160400390625, 11.7470703125, 12.1781005859375, 12.609130859375, 13.0401611328125, 13.47119140625, 13.9022216796875, 14.333251953125, 14.7642822265625, 15.1953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 11.0, 9.0, 10.0, 15.0, 28.0, 24.0, 64.0, 85.0, 202.0, 362.0, 693.0, 949.0, 725.0, 369.0, 211.0, 136.0, 72.0, 30.0, 28.0, 17.0, 8.0, 6.0, 6.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-17.25, -16.8624267578125, -16.474853515625, -16.0872802734375, -15.69970703125, -15.3121337890625, -14.924560546875, -14.5369873046875, -14.1494140625, -13.7618408203125, -13.374267578125, -12.9866943359375, -12.59912109375, -12.2115478515625, -11.823974609375, -11.4364013671875, -11.048828125, -10.6612548828125, -10.273681640625, -9.8861083984375, -9.49853515625, -9.1109619140625, -8.723388671875, -8.3358154296875, -7.9482421875, -7.5606689453125, -7.173095703125, -6.7855224609375, -6.39794921875, -6.0103759765625, -5.622802734375, -5.2352294921875, -4.84765625, -4.4600830078125, -4.072509765625, -3.6849365234375, -3.29736328125, -2.9097900390625, -2.522216796875, -2.1346435546875, -1.7470703125, -1.3594970703125, -0.971923828125, -0.5843505859375, -0.19677734375, 0.1907958984375, 0.578369140625, 0.9659423828125, 1.353515625, 1.7410888671875, 2.128662109375, 2.5162353515625, 2.90380859375, 3.2913818359375, 3.678955078125, 4.0665283203125, 4.4541015625, 4.8416748046875, 5.229248046875, 5.6168212890625, 6.00439453125, 6.3919677734375, 6.779541015625, 7.1671142578125, 7.5546875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 20.0, 36.0, 75.0, 140.0, 205.0, 195.0, 150.0, 77.0, 44.0, 21.0, 6.0, 4.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-131.5286102294922, -127.94721984863281, -124.3658218383789, -120.78443145751953, -117.20304107666016, -113.62164306640625, -110.04025268554688, -106.4588623046875, -102.8774642944336, -99.29607391357422, -95.71467590332031, -92.13328552246094, -88.55189514160156, -84.97049713134766, -81.38910675048828, -77.80770874023438, -74.226318359375, -70.64492797851562, -67.06352996826172, -63.482139587402344, -59.9007453918457, -56.31935119628906, -52.73796081542969, -49.15656661987305, -45.57518005371094, -41.9937858581543, -38.41239547729492, -34.83100128173828, -31.24960708618164, -27.668214797973633, -24.086822509765625, -20.505428314208984, -16.924034118652344, -13.34264087677002, -9.761247634887695, -6.1798553466796875, -2.5984621047973633, 0.9829311370849609, 4.564323425292969, 8.14571762084961, 11.727109909057617, 15.308503150939941, 18.889896392822266, 22.471288681030273, 26.05268096923828, 29.634075164794922, 33.21546936035156, 36.79685974121094, 40.37825393676758, 43.95964813232422, 47.541038513183594, 51.122432708740234, 54.703826904296875, 58.28521728515625, 61.86661148071289, 65.44800567626953, 69.0293960571289, 72.61078643798828, 76.19218444824219, 79.77357482910156, 83.35496520996094, 86.93636322021484, 90.51775360107422, 94.09915161132812, 97.6805419921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 12.0, 15.0, 19.0, 21.0, 37.0, 49.0, 81.0, 71.0, 82.0, 76.0, 72.0, 71.0, 69.0, 81.0, 66.0, 51.0, 34.0, 32.0, 15.0, 14.0, 18.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.54129028320312, -91.36346435546875, -89.1856460571289, -87.00782012939453, -84.83000183105469, -82.65217590332031, -80.47435760498047, -78.2965316772461, -76.11871337890625, -73.94088745117188, -71.76306915283203, -69.58524322509766, -67.40742492675781, -65.22959899902344, -63.051780700683594, -60.87395477294922, -58.69613265991211, -56.518310546875, -54.34048843383789, -52.16266632080078, -49.98484420776367, -47.80702209472656, -45.62919616699219, -43.451377868652344, -41.27355194091797, -39.09572982788086, -36.91790771484375, -34.74008560180664, -32.56226348876953, -30.384441375732422, -28.20661735534668, -26.02879524230957, -23.850975036621094, -21.673152923583984, -19.495330810546875, -17.317508697509766, -15.13968563079834, -12.96186351776123, -10.784040451049805, -8.606218338012695, -6.428396224975586, -4.250574111938477, -2.072751522064209, 0.1050710678100586, 2.282893180847168, 4.460715293884277, 6.638538360595703, 8.816360473632812, 10.994182586669922, 13.172004699707031, 15.34982681274414, 17.52764892578125, 19.70547103881836, 21.88329315185547, 24.06111717224121, 26.23893928527832, 28.41676139831543, 30.59458351135254, 32.77240753173828, 34.95022964477539, 37.1280517578125, 39.30587387084961, 41.48369598388672, 43.66151809692383, 45.83934020996094]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 12.0, 15.0, 17.0, 22.0, 21.0, 57.0, 87.0, 142.0, 293.0, 503.0, 1203.0, 2567.0, 6556.0, 19558.0, 66666.0, 251319.0, 467590.0, 164503.0, 44865.0, 13971.0, 4909.0, 1870.0, 849.0, 389.0, 223.0, 126.0, 69.0, 42.0, 39.0, 25.0, 10.0, 14.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1171875, -8.84375, -8.5703125, -8.296875, -8.0234375, -7.75, -7.4765625, -7.203125, -6.9296875, -6.65625, -6.3828125, -6.109375, -5.8359375, -5.5625, -5.2890625, -5.015625, -4.7421875, -4.46875, -4.1953125, -3.921875, -3.6484375, -3.375, -3.1015625, -2.828125, -2.5546875, -2.28125, -2.0078125, -1.734375, -1.4609375, -1.1875, -0.9140625, -0.640625, -0.3671875, -0.09375, 0.1796875, 0.453125, 0.7265625, 1.0, 1.2734375, 1.546875, 1.8203125, 2.09375, 2.3671875, 2.640625, 2.9140625, 3.1875, 3.4609375, 3.734375, 4.0078125, 4.28125, 4.5546875, 4.828125, 5.1015625, 5.375, 5.6484375, 5.921875, 6.1953125, 6.46875, 6.7421875, 7.015625, 7.2890625, 7.5625, 7.8359375, 8.109375, 8.3828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 10.0, 14.0, 12.0, 11.0, 18.0, 17.0, 26.0, 34.0, 24.0, 27.0, 46.0, 48.0, 34.0, 63.0, 51.0, 48.0, 42.0, 52.0, 44.0, 50.0, 59.0, 51.0, 32.0, 33.0, 35.0, 22.0, 21.0, 14.0, 14.0, 9.0, 13.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.96929931640625, -3.8370361328125, -3.70477294921875, -3.572509765625, -3.44024658203125, -3.3079833984375, -3.17572021484375, -3.04345703125, -2.91119384765625, -2.7789306640625, -2.64666748046875, -2.514404296875, -2.38214111328125, -2.2498779296875, -2.11761474609375, -1.9853515625, -1.85308837890625, -1.7208251953125, -1.58856201171875, -1.456298828125, -1.32403564453125, -1.1917724609375, -1.05950927734375, -0.92724609375, -0.79498291015625, -0.6627197265625, -0.53045654296875, -0.398193359375, -0.26593017578125, -0.1336669921875, -0.00140380859375, 0.130859375, 0.26312255859375, 0.3953857421875, 0.52764892578125, 0.659912109375, 0.79217529296875, 0.9244384765625, 1.05670166015625, 1.18896484375, 1.32122802734375, 1.4534912109375, 1.58575439453125, 1.718017578125, 1.85028076171875, 1.9825439453125, 2.11480712890625, 2.2470703125, 2.37933349609375, 2.5115966796875, 2.64385986328125, 2.776123046875, 2.90838623046875, 3.0406494140625, 3.17291259765625, 3.30517578125, 3.43743896484375, 3.5697021484375, 3.70196533203125, 3.834228515625, 3.96649169921875, 4.0987548828125, 4.23101806640625, 4.36328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 8.0, 14.0, 19.0, 17.0, 31.0, 43.0, 82.0, 102.0, 171.0, 273.0, 576.0, 1107.0, 3429.0, 17172.0, 259679.0, 724554.0, 33278.0, 4953.0, 1533.0, 625.0, 324.0, 178.0, 127.0, 89.0, 46.0, 33.0, 23.0, 20.0, 10.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.9375, -19.25341796875, -18.5693359375, -17.88525390625, -17.201171875, -16.51708984375, -15.8330078125, -15.14892578125, -14.46484375, -13.78076171875, -13.0966796875, -12.41259765625, -11.728515625, -11.04443359375, -10.3603515625, -9.67626953125, -8.9921875, -8.30810546875, -7.6240234375, -6.93994140625, -6.255859375, -5.57177734375, -4.8876953125, -4.20361328125, -3.51953125, -2.83544921875, -2.1513671875, -1.46728515625, -0.783203125, -0.09912109375, 0.5849609375, 1.26904296875, 1.953125, 2.63720703125, 3.3212890625, 4.00537109375, 4.689453125, 5.37353515625, 6.0576171875, 6.74169921875, 7.42578125, 8.10986328125, 8.7939453125, 9.47802734375, 10.162109375, 10.84619140625, 11.5302734375, 12.21435546875, 12.8984375, 13.58251953125, 14.2666015625, 14.95068359375, 15.634765625, 16.31884765625, 17.0029296875, 17.68701171875, 18.37109375, 19.05517578125, 19.7392578125, 20.42333984375, 21.107421875, 21.79150390625, 22.4755859375, 23.15966796875, 23.84375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 6.0, 8.0, 9.0, 10.0, 25.0, 10.0, 20.0, 19.0, 30.0, 23.0, 37.0, 32.0, 40.0, 16.0, 49.0, 41.0, 48.0, 39.0, 53.0, 40.0, 64.0, 37.0, 46.0, 45.0, 30.0, 27.0, 29.0, 19.0, 24.0, 21.0, 13.0, 14.0, 14.0, 12.0, 7.0, 4.0, 8.0, 4.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8515625, -13.3984375, -12.9453125, -12.4921875, -12.0390625, -11.5859375, -11.1328125, -10.6796875, -10.2265625, -9.7734375, -9.3203125, -8.8671875, -8.4140625, -7.9609375, -7.5078125, -7.0546875, -6.6015625, -6.1484375, -5.6953125, -5.2421875, -4.7890625, -4.3359375, -3.8828125, -3.4296875, -2.9765625, -2.5234375, -2.0703125, -1.6171875, -1.1640625, -0.7109375, -0.2578125, 0.1953125, 0.6484375, 1.1015625, 1.5546875, 2.0078125, 2.4609375, 2.9140625, 3.3671875, 3.8203125, 4.2734375, 4.7265625, 5.1796875, 5.6328125, 6.0859375, 6.5390625, 6.9921875, 7.4453125, 7.8984375, 8.3515625, 8.8046875, 9.2578125, 9.7109375, 10.1640625, 10.6171875, 11.0703125, 11.5234375, 11.9765625, 12.4296875, 12.8828125, 13.3359375, 13.7890625, 14.2421875, 14.6953125, 15.1484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 6.0, 8.0, 11.0, 12.0, 13.0, 20.0, 39.0, 41.0, 72.0, 81.0, 135.0, 193.0, 358.0, 590.0, 1106.0, 2416.0, 6742.0, 23272.0, 106854.0, 725231.0, 138921.0, 28648.0, 7937.0, 2857.0, 1217.0, 639.0, 383.0, 209.0, 178.0, 103.0, 70.0, 58.0, 34.0, 19.0, 16.0, 15.0, 16.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-7.33984375, -7.114501953125, -6.88916015625, -6.663818359375, -6.4384765625, -6.213134765625, -5.98779296875, -5.762451171875, -5.537109375, -5.311767578125, -5.08642578125, -4.861083984375, -4.6357421875, -4.410400390625, -4.18505859375, -3.959716796875, -3.734375, -3.509033203125, -3.28369140625, -3.058349609375, -2.8330078125, -2.607666015625, -2.38232421875, -2.156982421875, -1.931640625, -1.706298828125, -1.48095703125, -1.255615234375, -1.0302734375, -0.804931640625, -0.57958984375, -0.354248046875, -0.12890625, 0.096435546875, 0.32177734375, 0.547119140625, 0.7724609375, 0.997802734375, 1.22314453125, 1.448486328125, 1.673828125, 1.899169921875, 2.12451171875, 2.349853515625, 2.5751953125, 2.800537109375, 3.02587890625, 3.251220703125, 3.4765625, 3.701904296875, 3.92724609375, 4.152587890625, 4.3779296875, 4.603271484375, 4.82861328125, 5.053955078125, 5.279296875, 5.504638671875, 5.72998046875, 5.955322265625, 6.1806640625, 6.406005859375, 6.63134765625, 6.856689453125, 7.08203125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 1.0, 5.0, 6.0, 5.0, 7.0, 15.0, 18.0, 9.0, 16.0, 23.0, 36.0, 39.0, 57.0, 96.0, 168.0, 152.0, 106.0, 51.0, 50.0, 36.0, 21.0, 17.0, 11.0, 14.0, 8.0, 14.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018329620361328125, -0.0017670989036560059, -0.0017012357711791992, -0.0016353726387023926, -0.001569509506225586, -0.0015036463737487793, -0.0014377832412719727, -0.001371920108795166, -0.0013060569763183594, -0.0012401938438415527, -0.001174330711364746, -0.0011084675788879395, -0.0010426044464111328, -0.0009767413139343262, -0.0009108781814575195, -0.0008450150489807129, -0.0007791519165039062, -0.0007132887840270996, -0.000647425651550293, -0.0005815625190734863, -0.0005156993865966797, -0.00044983625411987305, -0.0003839731216430664, -0.00031810998916625977, -0.0002522468566894531, -0.00018638372421264648, -0.00012052059173583984, -5.46574592590332e-05, 1.1205673217773438e-05, 7.706880569458008e-05, 0.00014293193817138672, 0.00020879507064819336, 0.000274658203125, 0.00034052133560180664, 0.0004063844680786133, 0.0004722476005554199, 0.0005381107330322266, 0.0006039738655090332, 0.0006698369979858398, 0.0007357001304626465, 0.0008015632629394531, 0.0008674263954162598, 0.0009332895278930664, 0.000999152660369873, 0.0010650157928466797, 0.0011308789253234863, 0.001196742057800293, 0.0012626051902770996, 0.0013284683227539062, 0.0013943314552307129, 0.0014601945877075195, 0.0015260577201843262, 0.0015919208526611328, 0.0016577839851379395, 0.001723647117614746, 0.0017895102500915527, 0.0018553733825683594, 0.001921236515045166, 0.0019870996475219727, 0.0020529627799987793, 0.002118825912475586, 0.0021846890449523926, 0.0022505521774291992, 0.002316415309906006, 0.0023822784423828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 4.0, 13.0, 20.0, 28.0, 47.0, 63.0, 92.0, 146.0, 262.0, 514.0, 1073.0, 2538.0, 8136.0, 39307.0, 523327.0, 421825.0, 38345.0, 8012.0, 2566.0, 1041.0, 526.0, 256.0, 136.0, 95.0, 71.0, 32.0, 21.0, 21.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.984375, -9.6817626953125, -9.379150390625, -9.0765380859375, -8.77392578125, -8.4713134765625, -8.168701171875, -7.8660888671875, -7.5634765625, -7.2608642578125, -6.958251953125, -6.6556396484375, -6.35302734375, -6.0504150390625, -5.747802734375, -5.4451904296875, -5.142578125, -4.8399658203125, -4.537353515625, -4.2347412109375, -3.93212890625, -3.6295166015625, -3.326904296875, -3.0242919921875, -2.7216796875, -2.4190673828125, -2.116455078125, -1.8138427734375, -1.51123046875, -1.2086181640625, -0.906005859375, -0.6033935546875, -0.30078125, 0.0018310546875, 0.304443359375, 0.6070556640625, 0.90966796875, 1.2122802734375, 1.514892578125, 1.8175048828125, 2.1201171875, 2.4227294921875, 2.725341796875, 3.0279541015625, 3.33056640625, 3.6331787109375, 3.935791015625, 4.2384033203125, 4.541015625, 4.8436279296875, 5.146240234375, 5.4488525390625, 5.75146484375, 6.0540771484375, 6.356689453125, 6.6593017578125, 6.9619140625, 7.2645263671875, 7.567138671875, 7.8697509765625, 8.17236328125, 8.4749755859375, 8.777587890625, 9.0802001953125, 9.3828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 5.0, 8.0, 6.0, 8.0, 5.0, 13.0, 13.0, 17.0, 22.0, 25.0, 35.0, 42.0, 56.0, 75.0, 111.0, 131.0, 101.0, 82.0, 61.0, 35.0, 26.0, 27.0, 18.0, 8.0, 11.0, 4.0, 10.0, 10.0, 8.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0, -5.8016357421875, -5.603271484375, -5.4049072265625, -5.20654296875, -5.0081787109375, -4.809814453125, -4.6114501953125, -4.4130859375, -4.2147216796875, -4.016357421875, -3.8179931640625, -3.61962890625, -3.4212646484375, -3.222900390625, -3.0245361328125, -2.826171875, -2.6278076171875, -2.429443359375, -2.2310791015625, -2.03271484375, -1.8343505859375, -1.635986328125, -1.4376220703125, -1.2392578125, -1.0408935546875, -0.842529296875, -0.6441650390625, -0.44580078125, -0.2474365234375, -0.049072265625, 0.1492919921875, 0.34765625, 0.5460205078125, 0.744384765625, 0.9427490234375, 1.14111328125, 1.3394775390625, 1.537841796875, 1.7362060546875, 1.9345703125, 2.1329345703125, 2.331298828125, 2.5296630859375, 2.72802734375, 2.9263916015625, 3.124755859375, 3.3231201171875, 3.521484375, 3.7198486328125, 3.918212890625, 4.1165771484375, 4.31494140625, 4.5133056640625, 4.711669921875, 4.9100341796875, 5.1083984375, 5.3067626953125, 5.505126953125, 5.7034912109375, 5.90185546875, 6.1002197265625, 6.298583984375, 6.4969482421875, 6.6953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 18.0, 53.0, 181.0, 407.0, 193.0, 78.0, 31.0, 19.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.91183471679688, -199.8923797607422, -192.87294006347656, -185.85348510742188, -178.83404541015625, -171.81459045410156, -164.79513549804688, -157.77569580078125, -150.75625610351562, -143.73680114746094, -136.7173614501953, -129.69790649414062, -122.678466796875, -115.65901184082031, -108.63956451416016, -101.6201171875, -94.60066223144531, -87.58121490478516, -80.561767578125, -73.54231262207031, -66.52287292480469, -59.503421783447266, -52.483970642089844, -45.46452331542969, -38.44507598876953, -31.425628662109375, -24.406179428100586, -17.386730194091797, -10.36728286743164, -3.3478355407714844, 3.6716156005859375, 10.691062927246094, 17.710525512695312, 24.72997283935547, 31.749422073364258, 38.76887130737305, 45.7883186340332, 52.80776596069336, 59.82721710205078, 66.84666442871094, 73.8661117553711, 80.88555908203125, 87.9050064086914, 94.92445373535156, 101.94390869140625, 108.96334838867188, 115.98280334472656, 123.00225067138672, 130.02169799804688, 137.04115295410156, 144.0605926513672, 151.08004760742188, 158.0994873046875, 165.1189422607422, 172.13839721679688, 179.1578369140625, 186.17727661132812, 193.1967315673828, 200.21617126464844, 207.23562622070312, 214.25506591796875, 221.27452087402344, 228.29397583007812, 235.31341552734375, 242.33287048339844]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 7.0, 7.0, 11.0, 8.0, 17.0, 11.0, 19.0, 19.0, 25.0, 21.0, 17.0, 25.0, 23.0, 29.0, 35.0, 41.0, 27.0, 57.0, 56.0, 89.0, 55.0, 50.0, 34.0, 32.0, 30.0, 24.0, 36.0, 30.0, 17.0, 16.0, 17.0, 15.0, 22.0, 16.0, 10.0, 9.0, 11.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.49586868286133, -51.54290771484375, -49.58994674682617, -47.636985778808594, -45.684024810791016, -43.73106384277344, -41.778106689453125, -39.82514190673828, -37.87218475341797, -35.91922378540039, -33.96626281738281, -32.013301849365234, -30.060340881347656, -28.107379913330078, -26.154420852661133, -24.201459884643555, -22.248497009277344, -20.295536041259766, -18.342575073242188, -16.38961410522461, -14.436654090881348, -12.48369312286377, -10.530733108520508, -8.57777214050293, -6.624811172485352, -4.671850204467773, -2.7188897132873535, -0.7659292221069336, 1.1870317459106445, 3.1399927139282227, 5.092952728271484, 7.0459136962890625, 8.998870849609375, 10.951831817626953, 12.904792785644531, 14.857752799987793, 16.810714721679688, 18.763675689697266, 20.71663475036621, 22.66959571838379, 24.622556686401367, 26.575517654418945, 28.528478622436523, 30.48143768310547, 32.43439865112305, 34.387359619140625, 36.3403205871582, 38.29328155517578, 40.24624252319336, 42.19920349121094, 44.152164459228516, 46.105125427246094, 48.05808639526367, 50.01104736328125, 51.96400451660156, 53.916969299316406, 55.86992645263672, 57.8228874206543, 59.775848388671875, 61.72880935668945, 63.68177032470703, 65.63472747802734, 67.58769226074219, 69.5406494140625, 71.49361419677734]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 5.0, 10.0, 17.0, 26.0, 31.0, 43.0, 76.0, 100.0, 159.0, 282.0, 616.0, 1257.0, 3316.0, 11619.0, 85372.0, 2980998.0, 1062461.0, 36733.0, 6848.0, 2244.0, 932.0, 454.0, 241.0, 139.0, 94.0, 53.0, 34.0, 32.0, 23.0, 15.0, 16.0, 9.0, 3.0, 1.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.28662109375, -9.9169921875, -9.54736328125, -9.177734375, -8.80810546875, -8.4384765625, -8.06884765625, -7.69921875, -7.32958984375, -6.9599609375, -6.59033203125, -6.220703125, -5.85107421875, -5.4814453125, -5.11181640625, -4.7421875, -4.37255859375, -4.0029296875, -3.63330078125, -3.263671875, -2.89404296875, -2.5244140625, -2.15478515625, -1.78515625, -1.41552734375, -1.0458984375, -0.67626953125, -0.306640625, 0.06298828125, 0.4326171875, 0.80224609375, 1.171875, 1.54150390625, 1.9111328125, 2.28076171875, 2.650390625, 3.02001953125, 3.3896484375, 3.75927734375, 4.12890625, 4.49853515625, 4.8681640625, 5.23779296875, 5.607421875, 5.97705078125, 6.3466796875, 6.71630859375, 7.0859375, 7.45556640625, 7.8251953125, 8.19482421875, 8.564453125, 8.93408203125, 9.3037109375, 9.67333984375, 10.04296875, 10.41259765625, 10.7822265625, 11.15185546875, 11.521484375, 11.89111328125, 12.2607421875, 12.63037109375, 13.0]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 9.0, 10.0, 19.0, 16.0, 20.0, 27.0, 41.0, 28.0, 46.0, 41.0, 54.0, 44.0, 50.0, 51.0, 44.0, 57.0, 55.0, 46.0, 52.0, 37.0, 37.0, 41.0, 23.0, 33.0, 27.0, 19.0, 11.0, 13.0, 5.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.0718994140625, -3.932861328125, -3.7938232421875, -3.65478515625, -3.5157470703125, -3.376708984375, -3.2376708984375, -3.0986328125, -2.9595947265625, -2.820556640625, -2.6815185546875, -2.54248046875, -2.4034423828125, -2.264404296875, -2.1253662109375, -1.986328125, -1.8472900390625, -1.708251953125, -1.5692138671875, -1.43017578125, -1.2911376953125, -1.152099609375, -1.0130615234375, -0.8740234375, -0.7349853515625, -0.595947265625, -0.4569091796875, -0.31787109375, -0.1788330078125, -0.039794921875, 0.0992431640625, 0.23828125, 0.3773193359375, 0.516357421875, 0.6553955078125, 0.79443359375, 0.9334716796875, 1.072509765625, 1.2115478515625, 1.3505859375, 1.4896240234375, 1.628662109375, 1.7677001953125, 1.90673828125, 2.0457763671875, 2.184814453125, 2.3238525390625, 2.462890625, 2.6019287109375, 2.740966796875, 2.8800048828125, 3.01904296875, 3.1580810546875, 3.297119140625, 3.4361572265625, 3.5751953125, 3.7142333984375, 3.853271484375, 3.9923095703125, 4.13134765625, 4.2703857421875, 4.409423828125, 4.5484619140625, 4.6875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 12.0, 9.0, 18.0, 28.0, 54.0, 84.0, 118.0, 223.0, 420.0, 748.0, 1633.0, 5670.0, 75600.0, 4028576.0, 72808.0, 5540.0, 1471.0, 591.0, 291.0, 155.0, 97.0, 43.0, 28.0, 27.0, 10.0, 13.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -27.09716796875, -26.2880859375, -25.47900390625, -24.669921875, -23.86083984375, -23.0517578125, -22.24267578125, -21.43359375, -20.62451171875, -19.8154296875, -19.00634765625, -18.197265625, -17.38818359375, -16.5791015625, -15.77001953125, -14.9609375, -14.15185546875, -13.3427734375, -12.53369140625, -11.724609375, -10.91552734375, -10.1064453125, -9.29736328125, -8.48828125, -7.67919921875, -6.8701171875, -6.06103515625, -5.251953125, -4.44287109375, -3.6337890625, -2.82470703125, -2.015625, -1.20654296875, -0.3974609375, 0.41162109375, 1.220703125, 2.02978515625, 2.8388671875, 3.64794921875, 4.45703125, 5.26611328125, 6.0751953125, 6.88427734375, 7.693359375, 8.50244140625, 9.3115234375, 10.12060546875, 10.9296875, 11.73876953125, 12.5478515625, 13.35693359375, 14.166015625, 14.97509765625, 15.7841796875, 16.59326171875, 17.40234375, 18.21142578125, 19.0205078125, 19.82958984375, 20.638671875, 21.44775390625, 22.2568359375, 23.06591796875, 23.875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 10.0, 16.0, 27.0, 43.0, 137.0, 332.0, 1022.0, 1432.0, 650.0, 224.0, 69.0, 46.0, 22.0, 22.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.15625, -24.51611328125, -23.8759765625, -23.23583984375, -22.595703125, -21.95556640625, -21.3154296875, -20.67529296875, -20.03515625, -19.39501953125, -18.7548828125, -18.11474609375, -17.474609375, -16.83447265625, -16.1943359375, -15.55419921875, -14.9140625, -14.27392578125, -13.6337890625, -12.99365234375, -12.353515625, -11.71337890625, -11.0732421875, -10.43310546875, -9.79296875, -9.15283203125, -8.5126953125, -7.87255859375, -7.232421875, -6.59228515625, -5.9521484375, -5.31201171875, -4.671875, -4.03173828125, -3.3916015625, -2.75146484375, -2.111328125, -1.47119140625, -0.8310546875, -0.19091796875, 0.44921875, 1.08935546875, 1.7294921875, 2.36962890625, 3.009765625, 3.64990234375, 4.2900390625, 4.93017578125, 5.5703125, 6.21044921875, 6.8505859375, 7.49072265625, 8.130859375, 8.77099609375, 9.4111328125, 10.05126953125, 10.69140625, 11.33154296875, 11.9716796875, 12.61181640625, 13.251953125, 13.89208984375, 14.5322265625, 15.17236328125, 15.8125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 34.0, 94.0, 349.0, 345.0, 113.0, 37.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.16969299316406, -132.783203125, -125.3967056274414, -118.01021575927734, -110.62371826171875, -103.23722839355469, -95.85073852539062, -88.46424865722656, -81.07775115966797, -73.6912612915039, -66.30476379394531, -58.91827392578125, -51.53178024291992, -44.145286560058594, -36.75879669189453, -29.372303009033203, -21.985809326171875, -14.599316596984863, -7.212823867797852, 0.17366790771484375, 7.560161590576172, 14.9466552734375, 22.333145141601562, 29.71963882446289, 37.10613250732422, 44.49262619018555, 51.879119873046875, 59.26560974121094, 66.652099609375, 74.0385971069336, 81.42508697509766, 88.81158447265625, 96.19808959960938, 103.58457946777344, 110.97107696533203, 118.3575668334961, 125.74406433105469, 133.13055419921875, 140.5170440673828, 147.90353393554688, 155.2900390625, 162.67652893066406, 170.06301879882812, 177.44952392578125, 184.8360137939453, 192.22250366210938, 199.60899353027344, 206.9954833984375, 214.38197326660156, 221.76846313476562, 229.1549530029297, 236.54144287109375, 243.92794799804688, 251.31443786621094, 258.700927734375, 266.0874328613281, 273.4739074707031, 280.86041259765625, 288.24688720703125, 295.6333923339844, 303.0198669433594, 310.4063720703125, 317.7928466796875, 325.1793518066406, 332.56585693359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 22.0, 28.0, 36.0, 64.0, 85.0, 134.0, 156.0, 132.0, 100.0, 81.0, 60.0, 39.0, 27.0, 12.0, 8.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.11483764648438, -122.36213684082031, -118.60943603515625, -114.85672760009766, -111.1040267944336, -107.35132598876953, -103.59862518310547, -99.84591674804688, -96.09321594238281, -92.34051513671875, -88.58781433105469, -84.8351058959961, -81.08240509033203, -77.32970428466797, -73.5770034790039, -69.82429504394531, -66.07159423828125, -62.31889343261719, -58.56618881225586, -54.8134880065918, -51.06078338623047, -47.308082580566406, -43.555381774902344, -39.802677154541016, -36.04998016357422, -32.297279357910156, -28.544574737548828, -24.791873931884766, -21.039169311523438, -17.286468505859375, -13.53376579284668, -9.781063079833984, -6.028358459472656, -2.27565598487854, 1.4770464897155762, 5.229748725891113, 8.982451438903809, 12.735153198242188, 16.487855911254883, 20.240558624267578, 23.993261337280273, 27.74596405029297, 31.498666763305664, 35.25136947631836, 39.00407028198242, 42.75677490234375, 46.50947570800781, 50.262176513671875, 54.0148811340332, 57.767581939697266, 61.520286560058594, 65.27298736572266, 69.02568817138672, 72.77839660644531, 76.53109741210938, 80.28379821777344, 84.0364990234375, 87.78919982910156, 91.54190063476562, 95.29460906982422, 99.04730987548828, 102.80001068115234, 106.5527114868164, 110.305419921875, 114.05812072753906]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 8.0, 4.0, 4.0, 17.0, 17.0, 27.0, 30.0, 40.0, 74.0, 116.0, 268.0, 479.0, 1116.0, 3078.0, 9866.0, 39643.0, 200317.0, 549616.0, 191064.0, 37857.0, 9599.0, 3081.0, 1184.0, 461.0, 227.0, 132.0, 71.0, 52.0, 31.0, 23.0, 13.0, 14.0, 9.0, 8.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.1627197265625, -8.841064453125, -8.5194091796875, -8.19775390625, -7.8760986328125, -7.554443359375, -7.2327880859375, -6.9111328125, -6.5894775390625, -6.267822265625, -5.9461669921875, -5.62451171875, -5.3028564453125, -4.981201171875, -4.6595458984375, -4.337890625, -4.0162353515625, -3.694580078125, -3.3729248046875, -3.05126953125, -2.7296142578125, -2.407958984375, -2.0863037109375, -1.7646484375, -1.4429931640625, -1.121337890625, -0.7996826171875, -0.47802734375, -0.1563720703125, 0.165283203125, 0.4869384765625, 0.80859375, 1.1302490234375, 1.451904296875, 1.7735595703125, 2.09521484375, 2.4168701171875, 2.738525390625, 3.0601806640625, 3.3818359375, 3.7034912109375, 4.025146484375, 4.3468017578125, 4.66845703125, 4.9901123046875, 5.311767578125, 5.6334228515625, 5.955078125, 6.2767333984375, 6.598388671875, 6.9200439453125, 7.24169921875, 7.5633544921875, 7.885009765625, 8.2066650390625, 8.5283203125, 8.8499755859375, 9.171630859375, 9.4932861328125, 9.81494140625, 10.1365966796875, 10.458251953125, 10.7799072265625, 11.1015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 18.0, 22.0, 21.0, 24.0, 39.0, 52.0, 63.0, 49.0, 80.0, 64.0, 82.0, 83.0, 79.0, 80.0, 55.0, 57.0, 33.0, 28.0, 24.0, 14.0, 13.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.765625, -7.54058837890625, -7.3155517578125, -7.09051513671875, -6.865478515625, -6.64044189453125, -6.4154052734375, -6.19036865234375, -5.96533203125, -5.74029541015625, -5.5152587890625, -5.29022216796875, -5.065185546875, -4.84014892578125, -4.6151123046875, -4.39007568359375, -4.1650390625, -3.94000244140625, -3.7149658203125, -3.48992919921875, -3.264892578125, -3.03985595703125, -2.8148193359375, -2.58978271484375, -2.36474609375, -2.13970947265625, -1.9146728515625, -1.68963623046875, -1.464599609375, -1.23956298828125, -1.0145263671875, -0.78948974609375, -0.564453125, -0.33941650390625, -0.1143798828125, 0.11065673828125, 0.335693359375, 0.56072998046875, 0.7857666015625, 1.01080322265625, 1.23583984375, 1.46087646484375, 1.6859130859375, 1.91094970703125, 2.135986328125, 2.36102294921875, 2.5860595703125, 2.81109619140625, 3.0361328125, 3.26116943359375, 3.4862060546875, 3.71124267578125, 3.936279296875, 4.16131591796875, 4.3863525390625, 4.61138916015625, 4.83642578125, 5.06146240234375, 5.2864990234375, 5.51153564453125, 5.736572265625, 5.96160888671875, 6.1866455078125, 6.41168212890625, 6.63671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 5.0, 6.0, 10.0, 14.0, 20.0, 31.0, 28.0, 49.0, 56.0, 64.0, 131.0, 173.0, 312.0, 706.0, 2141.0, 8751.0, 52893.0, 532824.0, 389990.0, 48339.0, 8315.0, 2042.0, 704.0, 351.0, 192.0, 115.0, 74.0, 56.0, 38.0, 32.0, 19.0, 20.0, 12.0, 9.0, 8.0, 5.0, 3.0, 0.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.942626953125, -11.55712890625, -11.171630859375, -10.7861328125, -10.400634765625, -10.01513671875, -9.629638671875, -9.244140625, -8.858642578125, -8.47314453125, -8.087646484375, -7.7021484375, -7.316650390625, -6.93115234375, -6.545654296875, -6.16015625, -5.774658203125, -5.38916015625, -5.003662109375, -4.6181640625, -4.232666015625, -3.84716796875, -3.461669921875, -3.076171875, -2.690673828125, -2.30517578125, -1.919677734375, -1.5341796875, -1.148681640625, -0.76318359375, -0.377685546875, 0.0078125, 0.393310546875, 0.77880859375, 1.164306640625, 1.5498046875, 1.935302734375, 2.32080078125, 2.706298828125, 3.091796875, 3.477294921875, 3.86279296875, 4.248291015625, 4.6337890625, 5.019287109375, 5.40478515625, 5.790283203125, 6.17578125, 6.561279296875, 6.94677734375, 7.332275390625, 7.7177734375, 8.103271484375, 8.48876953125, 8.874267578125, 9.259765625, 9.645263671875, 10.03076171875, 10.416259765625, 10.8017578125, 11.187255859375, 11.57275390625, 11.958251953125, 12.34375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 11.0, 16.0, 17.0, 11.0, 22.0, 17.0, 29.0, 41.0, 28.0, 47.0, 56.0, 48.0, 60.0, 64.0, 69.0, 49.0, 59.0, 35.0, 44.0, 40.0, 44.0, 43.0, 24.0, 24.0, 17.0, 24.0, 11.0, 18.0, 10.0, 5.0, 4.0, 6.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8671875, -14.2974853515625, -13.727783203125, -13.1580810546875, -12.58837890625, -12.0186767578125, -11.448974609375, -10.8792724609375, -10.3095703125, -9.7398681640625, -9.170166015625, -8.6004638671875, -8.03076171875, -7.4610595703125, -6.891357421875, -6.3216552734375, -5.751953125, -5.1822509765625, -4.612548828125, -4.0428466796875, -3.47314453125, -2.9034423828125, -2.333740234375, -1.7640380859375, -1.1943359375, -0.6246337890625, -0.054931640625, 0.5147705078125, 1.08447265625, 1.6541748046875, 2.223876953125, 2.7935791015625, 3.36328125, 3.9329833984375, 4.502685546875, 5.0723876953125, 5.64208984375, 6.2117919921875, 6.781494140625, 7.3511962890625, 7.9208984375, 8.4906005859375, 9.060302734375, 9.6300048828125, 10.19970703125, 10.7694091796875, 11.339111328125, 11.9088134765625, 12.478515625, 13.0482177734375, 13.617919921875, 14.1876220703125, 14.75732421875, 15.3270263671875, 15.896728515625, 16.4664306640625, 17.0361328125, 17.6058349609375, 18.175537109375, 18.7452392578125, 19.31494140625, 19.8846435546875, 20.454345703125, 21.0240478515625, 21.59375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 7.0, 11.0, 22.0, 23.0, 33.0, 66.0, 114.0, 190.0, 314.0, 621.0, 1198.0, 2557.0, 6322.0, 19009.0, 74269.0, 512086.0, 334012.0, 68863.0, 17731.0, 6056.0, 2510.0, 1168.0, 601.0, 316.0, 161.0, 102.0, 82.0, 29.0, 28.0, 17.0, 8.0, 9.0, 10.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875, -3.077484130859375, -2.96746826171875, -2.857452392578125, -2.7474365234375, -2.637420654296875, -2.52740478515625, -2.417388916015625, -2.307373046875, -2.197357177734375, -2.08734130859375, -1.977325439453125, -1.8673095703125, -1.757293701171875, -1.64727783203125, -1.537261962890625, -1.42724609375, -1.317230224609375, -1.20721435546875, -1.097198486328125, -0.9871826171875, -0.877166748046875, -0.76715087890625, -0.657135009765625, -0.547119140625, -0.437103271484375, -0.32708740234375, -0.217071533203125, -0.1070556640625, 0.002960205078125, 0.11297607421875, 0.222991943359375, 0.3330078125, 0.443023681640625, 0.55303955078125, 0.663055419921875, 0.7730712890625, 0.883087158203125, 0.99310302734375, 1.103118896484375, 1.213134765625, 1.323150634765625, 1.43316650390625, 1.543182373046875, 1.6531982421875, 1.763214111328125, 1.87322998046875, 1.983245849609375, 2.09326171875, 2.203277587890625, 2.31329345703125, 2.423309326171875, 2.5333251953125, 2.643341064453125, 2.75335693359375, 2.863372802734375, 2.973388671875, 3.083404541015625, 3.19342041015625, 3.303436279296875, 3.4134521484375, 3.523468017578125, 3.63348388671875, 3.743499755859375, 3.853515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 6.0, 12.0, 29.0, 26.0, 48.0, 58.0, 78.0, 117.0, 110.0, 103.0, 104.0, 82.0, 55.0, 42.0, 31.0, 19.0, 14.0, 10.0, 13.0, 5.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012664794921875, -0.0012311935424804688, -0.0011959075927734375, -0.0011606216430664062, -0.001125335693359375, -0.0010900497436523438, -0.0010547637939453125, -0.0010194778442382812, -0.00098419189453125, -0.0009489059448242188, -0.0009136199951171875, -0.0008783340454101562, -0.000843048095703125, -0.0008077621459960938, -0.0007724761962890625, -0.0007371902465820312, -0.000701904296875, -0.0006666183471679688, -0.0006313323974609375, -0.0005960464477539062, -0.000560760498046875, -0.0005254745483398438, -0.0004901885986328125, -0.00045490264892578125, -0.00041961669921875, -0.00038433074951171875, -0.0003490447998046875, -0.00031375885009765625, -0.000278472900390625, -0.00024318695068359375, -0.0002079010009765625, -0.00017261505126953125, -0.0001373291015625, -0.00010204315185546875, -6.67572021484375e-05, -3.147125244140625e-05, 3.814697265625e-06, 3.910064697265625e-05, 7.43865966796875e-05, 0.00010967254638671875, 0.00014495849609375, 0.00018024444580078125, 0.0002155303955078125, 0.00025081634521484375, 0.000286102294921875, 0.00032138824462890625, 0.0003566741943359375, 0.00039196014404296875, 0.00042724609375, 0.00046253204345703125, 0.0004978179931640625, 0.0005331039428710938, 0.000568389892578125, 0.0006036758422851562, 0.0006389617919921875, 0.0006742477416992188, 0.00070953369140625, 0.0007448196411132812, 0.0007801055908203125, 0.0008153915405273438, 0.000850677490234375, 0.0008859634399414062, 0.0009212493896484375, 0.0009565353393554688, 0.0009918212890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 13.0, 22.0, 24.0, 43.0, 44.0, 92.0, 153.0, 290.0, 552.0, 1234.0, 2568.0, 6464.0, 18455.0, 64486.0, 268754.0, 546672.0, 97176.0, 26126.0, 8826.0, 3595.0, 1476.0, 652.0, 340.0, 195.0, 92.0, 64.0, 33.0, 25.0, 20.0, 16.0, 14.0, 9.0, 4.0, 7.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0078125, -3.896942138671875, -3.78607177734375, -3.675201416015625, -3.5643310546875, -3.453460693359375, -3.34259033203125, -3.231719970703125, -3.120849609375, -3.009979248046875, -2.89910888671875, -2.788238525390625, -2.6773681640625, -2.566497802734375, -2.45562744140625, -2.344757080078125, -2.23388671875, -2.123016357421875, -2.01214599609375, -1.901275634765625, -1.7904052734375, -1.679534912109375, -1.56866455078125, -1.457794189453125, -1.346923828125, -1.236053466796875, -1.12518310546875, -1.014312744140625, -0.9034423828125, -0.792572021484375, -0.68170166015625, -0.570831298828125, -0.4599609375, -0.349090576171875, -0.23822021484375, -0.127349853515625, -0.0164794921875, 0.094390869140625, 0.20526123046875, 0.316131591796875, 0.427001953125, 0.537872314453125, 0.64874267578125, 0.759613037109375, 0.8704833984375, 0.981353759765625, 1.09222412109375, 1.203094482421875, 1.31396484375, 1.424835205078125, 1.53570556640625, 1.646575927734375, 1.7574462890625, 1.868316650390625, 1.97918701171875, 2.090057373046875, 2.200927734375, 2.311798095703125, 2.42266845703125, 2.533538818359375, 2.6444091796875, 2.755279541015625, 2.86614990234375, 2.977020263671875, 3.087890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 12.0, 11.0, 16.0, 17.0, 13.0, 17.0, 37.0, 50.0, 58.0, 67.0, 62.0, 88.0, 62.0, 70.0, 61.0, 69.0, 51.0, 51.0, 26.0, 27.0, 25.0, 23.0, 18.0, 12.0, 12.0, 5.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.640625, -3.54388427734375, -3.4471435546875, -3.35040283203125, -3.253662109375, -3.15692138671875, -3.0601806640625, -2.96343994140625, -2.86669921875, -2.76995849609375, -2.6732177734375, -2.57647705078125, -2.479736328125, -2.38299560546875, -2.2862548828125, -2.18951416015625, -2.0927734375, -1.99603271484375, -1.8992919921875, -1.80255126953125, -1.705810546875, -1.60906982421875, -1.5123291015625, -1.41558837890625, -1.31884765625, -1.22210693359375, -1.1253662109375, -1.02862548828125, -0.931884765625, -0.83514404296875, -0.7384033203125, -0.64166259765625, -0.544921875, -0.44818115234375, -0.3514404296875, -0.25469970703125, -0.157958984375, -0.06121826171875, 0.0355224609375, 0.13226318359375, 0.22900390625, 0.32574462890625, 0.4224853515625, 0.51922607421875, 0.615966796875, 0.71270751953125, 0.8094482421875, 0.90618896484375, 1.0029296875, 1.09967041015625, 1.1964111328125, 1.29315185546875, 1.389892578125, 1.48663330078125, 1.5833740234375, 1.68011474609375, 1.77685546875, 1.87359619140625, 1.9703369140625, 2.06707763671875, 2.163818359375, 2.26055908203125, 2.3572998046875, 2.45404052734375, 2.55078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 23.0, 35.0, 64.0, 99.0, 213.0, 234.0, 148.0, 78.0, 39.0, 15.0, 11.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.12248992919922, -60.266807556152344, -57.41112518310547, -54.555442810058594, -51.69976043701172, -48.844078063964844, -45.98839569091797, -43.132713317871094, -40.27703094482422, -37.421348571777344, -34.56566619873047, -31.709983825683594, -28.85430145263672, -25.998619079589844, -23.14293670654297, -20.287254333496094, -17.43157196044922, -14.575889587402344, -11.720207214355469, -8.864524841308594, -6.008842468261719, -3.1531600952148438, -0.29747772216796875, 2.5582046508789062, 5.413887023925781, 8.269569396972656, 11.125251770019531, 13.980934143066406, 16.83661651611328, 19.692298889160156, 22.54798126220703, 25.403663635253906, 28.25933837890625, 31.115020751953125, 33.970703125, 36.826385498046875, 39.68206787109375, 42.537750244140625, 45.3934326171875, 48.249114990234375, 51.10479736328125, 53.960479736328125, 56.816162109375, 59.671844482421875, 62.52752685546875, 65.38320922851562, 68.2388916015625, 71.09457397460938, 73.95025634765625, 76.80593872070312, 79.66162109375, 82.51730346679688, 85.37298583984375, 88.22866821289062, 91.0843505859375, 93.94003295898438, 96.79571533203125, 99.65139770507812, 102.507080078125, 105.36276245117188, 108.21844482421875, 111.07412719726562, 113.9298095703125, 116.78549194335938, 119.64117431640625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 6.0, 5.0, 9.0, 7.0, 11.0, 18.0, 17.0, 18.0, 16.0, 20.0, 27.0, 31.0, 39.0, 37.0, 51.0, 65.0, 72.0, 83.0, 74.0, 48.0, 47.0, 39.0, 35.0, 31.0, 19.0, 25.0, 19.0, 21.0, 15.0, 15.0, 8.0, 12.0, 6.0, 15.0, 8.0, 5.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.111228942871094, -57.178802490234375, -55.24637222290039, -53.31394577026367, -51.38151550292969, -49.44908905029297, -47.51666259765625, -45.584232330322266, -43.65180587768555, -41.71937942504883, -39.786949157714844, -37.854522705078125, -35.92209243774414, -33.98966598510742, -32.05723571777344, -30.12480926513672, -28.192380905151367, -26.259952545166016, -24.327524185180664, -22.395095825195312, -20.462669372558594, -18.530241012573242, -16.59781265258789, -14.665385246276855, -12.732956886291504, -10.800528526306152, -8.868101119995117, -6.935672760009766, -5.003244876861572, -3.070816993713379, -1.1383886337280273, 0.7940387725830078, 2.7264671325683594, 4.658895015716553, 6.591322898864746, 8.523751258850098, 10.456178665161133, 12.388607025146484, 14.321035385131836, 16.253463745117188, 18.185890197753906, 20.118318557739258, 22.05074691772461, 23.983173370361328, 25.91560173034668, 27.84803009033203, 29.780458450317383, 31.712886810302734, 33.64531707763672, 35.57774353027344, 37.51017379760742, 39.44260025024414, 41.375030517578125, 43.307456970214844, 45.23988342285156, 47.17231369018555, 49.104740142822266, 51.037166595458984, 52.96959686279297, 54.90202331542969, 56.83445358276367, 58.76688003540039, 60.699310302734375, 62.631736755371094, 64.56416320800781]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 10.0, 16.0, 27.0, 35.0, 49.0, 102.0, 171.0, 349.0, 733.0, 1785.0, 5224.0, 21369.0, 263109.0, 3478944.0, 389039.0, 24667.0, 5404.0, 1759.0, 703.0, 317.0, 184.0, 99.0, 68.0, 43.0, 25.0, 16.0, 11.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.484375, -12.123046875, -11.76171875, -11.400390625, -11.0390625, -10.677734375, -10.31640625, -9.955078125, -9.59375, -9.232421875, -8.87109375, -8.509765625, -8.1484375, -7.787109375, -7.42578125, -7.064453125, -6.703125, -6.341796875, -5.98046875, -5.619140625, -5.2578125, -4.896484375, -4.53515625, -4.173828125, -3.8125, -3.451171875, -3.08984375, -2.728515625, -2.3671875, -2.005859375, -1.64453125, -1.283203125, -0.921875, -0.560546875, -0.19921875, 0.162109375, 0.5234375, 0.884765625, 1.24609375, 1.607421875, 1.96875, 2.330078125, 2.69140625, 3.052734375, 3.4140625, 3.775390625, 4.13671875, 4.498046875, 4.859375, 5.220703125, 5.58203125, 5.943359375, 6.3046875, 6.666015625, 7.02734375, 7.388671875, 7.75, 8.111328125, 8.47265625, 8.833984375, 9.1953125, 9.556640625, 9.91796875, 10.279296875, 10.640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 11.0, 14.0, 15.0, 30.0, 29.0, 26.0, 46.0, 40.0, 38.0, 39.0, 53.0, 42.0, 60.0, 63.0, 55.0, 46.0, 40.0, 62.0, 35.0, 60.0, 27.0, 38.0, 26.0, 23.0, 18.0, 12.0, 13.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.595703125, -3.443511962890625, -3.29132080078125, -3.139129638671875, -2.9869384765625, -2.834747314453125, -2.68255615234375, -2.530364990234375, -2.378173828125, -2.225982666015625, -2.07379150390625, -1.921600341796875, -1.7694091796875, -1.617218017578125, -1.46502685546875, -1.312835693359375, -1.16064453125, -1.008453369140625, -0.85626220703125, -0.704071044921875, -0.5518798828125, -0.399688720703125, -0.24749755859375, -0.095306396484375, 0.056884765625, 0.209075927734375, 0.36126708984375, 0.513458251953125, 0.6656494140625, 0.817840576171875, 0.97003173828125, 1.122222900390625, 1.2744140625, 1.426605224609375, 1.57879638671875, 1.730987548828125, 1.8831787109375, 2.035369873046875, 2.18756103515625, 2.339752197265625, 2.491943359375, 2.644134521484375, 2.79632568359375, 2.948516845703125, 3.1007080078125, 3.252899169921875, 3.40509033203125, 3.557281494140625, 3.70947265625, 3.861663818359375, 4.01385498046875, 4.166046142578125, 4.3182373046875, 4.470428466796875, 4.62261962890625, 4.774810791015625, 4.927001953125, 5.079193115234375, 5.23138427734375, 5.383575439453125, 5.5357666015625, 5.687957763671875, 5.84014892578125, 5.992340087890625, 6.14453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 15.0, 19.0, 41.0, 68.0, 176.0, 470.0, 2039.0, 31543.0, 4088515.0, 67474.0, 2952.0, 575.0, 182.0, 88.0, 51.0, 27.0, 20.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.46875, -32.4091796875, -31.349609375, -30.2900390625, -29.23046875, -28.1708984375, -27.111328125, -26.0517578125, -24.9921875, -23.9326171875, -22.873046875, -21.8134765625, -20.75390625, -19.6943359375, -18.634765625, -17.5751953125, -16.515625, -15.4560546875, -14.396484375, -13.3369140625, -12.27734375, -11.2177734375, -10.158203125, -9.0986328125, -8.0390625, -6.9794921875, -5.919921875, -4.8603515625, -3.80078125, -2.7412109375, -1.681640625, -0.6220703125, 0.4375, 1.4970703125, 2.556640625, 3.6162109375, 4.67578125, 5.7353515625, 6.794921875, 7.8544921875, 8.9140625, 9.9736328125, 11.033203125, 12.0927734375, 13.15234375, 14.2119140625, 15.271484375, 16.3310546875, 17.390625, 18.4501953125, 19.509765625, 20.5693359375, 21.62890625, 22.6884765625, 23.748046875, 24.8076171875, 25.8671875, 26.9267578125, 27.986328125, 29.0458984375, 30.10546875, 31.1650390625, 32.224609375, 33.2841796875, 34.34375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 12.0, 10.0, 15.0, 26.0, 38.0, 52.0, 76.0, 159.0, 316.0, 581.0, 841.0, 771.0, 530.0, 250.0, 146.0, 73.0, 59.0, 34.0, 13.0, 12.0, 9.0, 12.0, 9.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.2371826171875, -8.864990234375, -8.4927978515625, -8.12060546875, -7.7484130859375, -7.376220703125, -7.0040283203125, -6.6318359375, -6.2596435546875, -5.887451171875, -5.5152587890625, -5.14306640625, -4.7708740234375, -4.398681640625, -4.0264892578125, -3.654296875, -3.2821044921875, -2.909912109375, -2.5377197265625, -2.16552734375, -1.7933349609375, -1.421142578125, -1.0489501953125, -0.6767578125, -0.3045654296875, 0.067626953125, 0.4398193359375, 0.81201171875, 1.1842041015625, 1.556396484375, 1.9285888671875, 2.30078125, 2.6729736328125, 3.045166015625, 3.4173583984375, 3.78955078125, 4.1617431640625, 4.533935546875, 4.9061279296875, 5.2783203125, 5.6505126953125, 6.022705078125, 6.3948974609375, 6.76708984375, 7.1392822265625, 7.511474609375, 7.8836669921875, 8.255859375, 8.6280517578125, 9.000244140625, 9.3724365234375, 9.74462890625, 10.1168212890625, 10.489013671875, 10.8612060546875, 11.2333984375, 11.6055908203125, 11.977783203125, 12.3499755859375, 12.72216796875, 13.0943603515625, 13.466552734375, 13.8387451171875, 14.2109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 11.0, 32.0, 47.0, 110.0, 211.0, 231.0, 165.0, 91.0, 44.0, 20.0, 15.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-178.6913604736328, -174.558837890625, -170.42630004882812, -166.2937774658203, -162.1612548828125, -158.02871704101562, -153.8961944580078, -149.763671875, -145.63113403320312, -141.4986114501953, -137.36607360839844, -133.23355102539062, -129.1010284423828, -124.96849822998047, -120.83596801757812, -116.70344543457031, -112.5709228515625, -108.43839263916016, -104.30587005615234, -100.17333984375, -96.04081726074219, -91.90828704833984, -87.7757568359375, -83.64323425292969, -79.51070404052734, -75.378173828125, -71.24565124511719, -67.11312103271484, -62.980594635009766, -58.84806823730469, -54.715538024902344, -50.583011627197266, -46.45048522949219, -42.31795883178711, -38.18543243408203, -34.05290222167969, -29.92037582397461, -25.78784942626953, -21.65532112121582, -17.52279281616211, -13.390266418457031, -9.257739067077637, -5.125211715698242, -0.9926843643188477, 3.139842987060547, 7.272369384765625, 11.404897689819336, 15.537425994873047, 19.669952392578125, 23.802478790283203, 27.935007095336914, 32.067535400390625, 36.2000617980957, 40.33258819580078, 44.465118408203125, 48.5976448059082, 52.73017120361328, 56.86269760131836, 60.99522399902344, 65.12775421142578, 69.26028442382812, 73.39280700683594, 77.52533721923828, 81.65786743164062, 85.79039001464844]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 10.0, 12.0, 11.0, 26.0, 18.0, 18.0, 31.0, 25.0, 34.0, 42.0, 48.0, 44.0, 48.0, 58.0, 59.0, 58.0, 37.0, 50.0, 55.0, 49.0, 34.0, 35.0, 36.0, 27.0, 30.0, 26.0, 17.0, 8.0, 6.0, 9.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.94472885131836, -46.5534553527832, -45.16218566894531, -43.770912170410156, -42.379642486572266, -40.98836898803711, -39.59709930419922, -38.20582580566406, -36.81455612182617, -35.423282623291016, -34.032012939453125, -32.64073944091797, -31.249469757080078, -29.858198165893555, -28.46692657470703, -27.075653076171875, -25.68438148498535, -24.293109893798828, -22.901838302612305, -21.51056671142578, -20.119295120239258, -18.728023529052734, -17.336750030517578, -15.945479393005371, -14.554207801818848, -13.162936210632324, -11.7716646194458, -10.380392074584961, -8.989120483398438, -7.597849369049072, -6.206577301025391, -4.815305709838867, -3.4240341186523438, -2.0327625274658203, -0.6414906978607178, 0.7497811317443848, 2.141052722930908, 3.5323243141174316, 4.923596382141113, 6.314867973327637, 7.70613956451416, 9.097411155700684, 10.488682746887207, 11.879955291748047, 13.27122688293457, 14.662498474121094, 16.053770065307617, 17.44504165649414, 18.836313247680664, 20.227584838867188, 21.61885643005371, 23.010128021240234, 24.401399612426758, 25.79267120361328, 27.183944702148438, 28.575214385986328, 29.966487884521484, 31.357759475708008, 32.74903106689453, 34.14030456542969, 35.53157424926758, 36.922847747802734, 38.314117431640625, 39.70539093017578, 41.09666061401367]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 4.0, 11.0, 17.0, 21.0, 27.0, 49.0, 71.0, 131.0, 228.0, 427.0, 858.0, 1868.0, 4477.0, 12150.0, 39552.0, 160371.0, 532359.0, 219814.0, 50894.0, 15423.0, 5439.0, 2205.0, 998.0, 482.0, 252.0, 163.0, 88.0, 58.0, 30.0, 17.0, 21.0, 6.0, 10.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.3885498046875, -7.120849609375, -6.8531494140625, -6.58544921875, -6.3177490234375, -6.050048828125, -5.7823486328125, -5.5146484375, -5.2469482421875, -4.979248046875, -4.7115478515625, -4.44384765625, -4.1761474609375, -3.908447265625, -3.6407470703125, -3.373046875, -3.1053466796875, -2.837646484375, -2.5699462890625, -2.30224609375, -2.0345458984375, -1.766845703125, -1.4991455078125, -1.2314453125, -0.9637451171875, -0.696044921875, -0.4283447265625, -0.16064453125, 0.1070556640625, 0.374755859375, 0.6424560546875, 0.91015625, 1.1778564453125, 1.445556640625, 1.7132568359375, 1.98095703125, 2.2486572265625, 2.516357421875, 2.7840576171875, 3.0517578125, 3.3194580078125, 3.587158203125, 3.8548583984375, 4.12255859375, 4.3902587890625, 4.657958984375, 4.9256591796875, 5.193359375, 5.4610595703125, 5.728759765625, 5.9964599609375, 6.26416015625, 6.5318603515625, 6.799560546875, 7.0672607421875, 7.3349609375, 7.6026611328125, 7.870361328125, 8.1380615234375, 8.40576171875, 8.6734619140625, 8.941162109375, 9.2088623046875, 9.4765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 5.0, 12.0, 18.0, 32.0, 14.0, 22.0, 29.0, 27.0, 42.0, 49.0, 31.0, 50.0, 55.0, 57.0, 43.0, 60.0, 43.0, 49.0, 46.0, 48.0, 36.0, 45.0, 20.0, 30.0, 19.0, 21.0, 19.0, 22.0, 15.0, 6.0, 9.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8671875, -4.71954345703125, -4.5718994140625, -4.42425537109375, -4.276611328125, -4.12896728515625, -3.9813232421875, -3.83367919921875, -3.68603515625, -3.53839111328125, -3.3907470703125, -3.24310302734375, -3.095458984375, -2.94781494140625, -2.8001708984375, -2.65252685546875, -2.5048828125, -2.35723876953125, -2.2095947265625, -2.06195068359375, -1.914306640625, -1.76666259765625, -1.6190185546875, -1.47137451171875, -1.32373046875, -1.17608642578125, -1.0284423828125, -0.88079833984375, -0.733154296875, -0.58551025390625, -0.4378662109375, -0.29022216796875, -0.142578125, 0.00506591796875, 0.1527099609375, 0.30035400390625, 0.447998046875, 0.59564208984375, 0.7432861328125, 0.89093017578125, 1.03857421875, 1.18621826171875, 1.3338623046875, 1.48150634765625, 1.629150390625, 1.77679443359375, 1.9244384765625, 2.07208251953125, 2.2197265625, 2.36737060546875, 2.5150146484375, 2.66265869140625, 2.810302734375, 2.95794677734375, 3.1055908203125, 3.25323486328125, 3.40087890625, 3.54852294921875, 3.6961669921875, 3.84381103515625, 3.991455078125, 4.13909912109375, 4.2867431640625, 4.43438720703125, 4.58203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 8.0, 5.0, 9.0, 12.0, 27.0, 22.0, 44.0, 39.0, 56.0, 75.0, 144.0, 205.0, 366.0, 638.0, 1092.0, 2668.0, 8387.0, 44567.0, 620313.0, 322978.0, 34926.0, 7133.0, 2395.0, 1024.0, 491.0, 300.0, 196.0, 138.0, 87.0, 54.0, 41.0, 32.0, 26.0, 11.0, 10.0, 5.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.8515625, -10.463134765625, -10.07470703125, -9.686279296875, -9.2978515625, -8.909423828125, -8.52099609375, -8.132568359375, -7.744140625, -7.355712890625, -6.96728515625, -6.578857421875, -6.1904296875, -5.802001953125, -5.41357421875, -5.025146484375, -4.63671875, -4.248291015625, -3.85986328125, -3.471435546875, -3.0830078125, -2.694580078125, -2.30615234375, -1.917724609375, -1.529296875, -1.140869140625, -0.75244140625, -0.364013671875, 0.0244140625, 0.412841796875, 0.80126953125, 1.189697265625, 1.578125, 1.966552734375, 2.35498046875, 2.743408203125, 3.1318359375, 3.520263671875, 3.90869140625, 4.297119140625, 4.685546875, 5.073974609375, 5.46240234375, 5.850830078125, 6.2392578125, 6.627685546875, 7.01611328125, 7.404541015625, 7.79296875, 8.181396484375, 8.56982421875, 8.958251953125, 9.3466796875, 9.735107421875, 10.12353515625, 10.511962890625, 10.900390625, 11.288818359375, 11.67724609375, 12.065673828125, 12.4541015625, 12.842529296875, 13.23095703125, 13.619384765625, 14.0078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 17.0, 15.0, 14.0, 14.0, 29.0, 35.0, 31.0, 28.0, 47.0, 43.0, 56.0, 61.0, 67.0, 49.0, 57.0, 44.0, 48.0, 48.0, 34.0, 36.0, 33.0, 30.0, 22.0, 31.0, 14.0, 19.0, 11.0, 11.0, 6.0, 3.0, 4.0, 1.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-21.5, -20.9466552734375, -20.393310546875, -19.8399658203125, -19.28662109375, -18.7332763671875, -18.179931640625, -17.6265869140625, -17.0732421875, -16.5198974609375, -15.966552734375, -15.4132080078125, -14.85986328125, -14.3065185546875, -13.753173828125, -13.1998291015625, -12.646484375, -12.0931396484375, -11.539794921875, -10.9864501953125, -10.43310546875, -9.8797607421875, -9.326416015625, -8.7730712890625, -8.2197265625, -7.6663818359375, -7.113037109375, -6.5596923828125, -6.00634765625, -5.4530029296875, -4.899658203125, -4.3463134765625, -3.79296875, -3.2396240234375, -2.686279296875, -2.1329345703125, -1.57958984375, -1.0262451171875, -0.472900390625, 0.0804443359375, 0.6337890625, 1.1871337890625, 1.740478515625, 2.2938232421875, 2.84716796875, 3.4005126953125, 3.953857421875, 4.5072021484375, 5.060546875, 5.6138916015625, 6.167236328125, 6.7205810546875, 7.27392578125, 7.8272705078125, 8.380615234375, 8.9339599609375, 9.4873046875, 10.0406494140625, 10.593994140625, 11.1473388671875, 11.70068359375, 12.2540283203125, 12.807373046875, 13.3607177734375, 13.9140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 4.0, 7.0, 3.0, 5.0, 13.0, 17.0, 28.0, 27.0, 40.0, 52.0, 100.0, 154.0, 270.0, 468.0, 810.0, 1656.0, 3153.0, 7342.0, 18179.0, 54425.0, 276918.0, 580713.0, 66832.0, 21279.0, 8349.0, 3807.0, 1683.0, 948.0, 455.0, 293.0, 164.0, 90.0, 64.0, 45.0, 37.0, 30.0, 25.0, 17.0, 8.0, 11.0, 8.0, 4.0, 6.0, 2.0, 1.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.282440185546875, -3.18011474609375, -3.077789306640625, -2.9754638671875, -2.873138427734375, -2.77081298828125, -2.668487548828125, -2.566162109375, -2.463836669921875, -2.36151123046875, -2.259185791015625, -2.1568603515625, -2.054534912109375, -1.95220947265625, -1.849884033203125, -1.74755859375, -1.645233154296875, -1.54290771484375, -1.440582275390625, -1.3382568359375, -1.235931396484375, -1.13360595703125, -1.031280517578125, -0.928955078125, -0.826629638671875, -0.72430419921875, -0.621978759765625, -0.5196533203125, -0.417327880859375, -0.31500244140625, -0.212677001953125, -0.1103515625, -0.008026123046875, 0.09429931640625, 0.196624755859375, 0.2989501953125, 0.401275634765625, 0.50360107421875, 0.605926513671875, 0.708251953125, 0.810577392578125, 0.91290283203125, 1.015228271484375, 1.1175537109375, 1.219879150390625, 1.32220458984375, 1.424530029296875, 1.52685546875, 1.629180908203125, 1.73150634765625, 1.833831787109375, 1.9361572265625, 2.038482666015625, 2.14080810546875, 2.243133544921875, 2.345458984375, 2.447784423828125, 2.55010986328125, 2.652435302734375, 2.7547607421875, 2.857086181640625, 2.95941162109375, 3.061737060546875, 3.1640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 10.0, 4.0, 7.0, 8.0, 18.0, 15.0, 18.0, 38.0, 41.0, 66.0, 96.0, 117.0, 116.0, 90.0, 66.0, 59.0, 40.0, 33.0, 31.0, 15.0, 17.0, 12.0, 10.0, 6.0, 11.0, 4.0, 8.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0009512901306152344, -0.0009226873517036438, -0.0008940845727920532, -0.0008654817938804626, -0.0008368790149688721, -0.0008082762360572815, -0.0007796734571456909, -0.0007510706782341003, -0.0007224678993225098, -0.0006938651204109192, -0.0006652623414993286, -0.000636659562587738, -0.0006080567836761475, -0.0005794540047645569, -0.0005508512258529663, -0.0005222484469413757, -0.0004936456680297852, -0.0004650428891181946, -0.000436440110206604, -0.00040783733129501343, -0.00037923455238342285, -0.0003506317734718323, -0.0003220289945602417, -0.0002934262156486511, -0.00026482343673706055, -0.00023622065782546997, -0.0002076178789138794, -0.00017901510000228882, -0.00015041232109069824, -0.00012180954217910767, -9.320676326751709e-05, -6.460398435592651e-05, -3.600120544433594e-05, -7.398426532745361e-06, 2.1204352378845215e-05, 4.980713129043579e-05, 7.840991020202637e-05, 0.00010701268911361694, 0.00013561546802520752, 0.0001642182469367981, 0.00019282102584838867, 0.00022142380475997925, 0.0002500265836715698, 0.0002786293625831604, 0.000307232141494751, 0.00033583492040634155, 0.00036443769931793213, 0.0003930404782295227, 0.0004216432571411133, 0.00045024603605270386, 0.00047884881496429443, 0.000507451593875885, 0.0005360543727874756, 0.0005646571516990662, 0.0005932599306106567, 0.0006218627095222473, 0.0006504654884338379, 0.0006790682673454285, 0.000707671046257019, 0.0007362738251686096, 0.0007648766040802002, 0.0007934793829917908, 0.0008220821619033813, 0.0008506849408149719, 0.0008792877197265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 7.0, 6.0, 21.0, 12.0, 25.0, 39.0, 68.0, 122.0, 186.0, 436.0, 856.0, 2082.0, 6174.0, 23047.0, 133069.0, 770712.0, 86435.0, 17031.0, 4988.0, 1742.0, 717.0, 329.0, 184.0, 93.0, 70.0, 39.0, 28.0, 14.0, 6.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.490631103515625, -3.33477783203125, -3.178924560546875, -3.0230712890625, -2.867218017578125, -2.71136474609375, -2.555511474609375, -2.399658203125, -2.243804931640625, -2.08795166015625, -1.932098388671875, -1.7762451171875, -1.620391845703125, -1.46453857421875, -1.308685302734375, -1.15283203125, -0.996978759765625, -0.84112548828125, -0.685272216796875, -0.5294189453125, -0.373565673828125, -0.21771240234375, -0.061859130859375, 0.093994140625, 0.249847412109375, 0.40570068359375, 0.561553955078125, 0.7174072265625, 0.873260498046875, 1.02911376953125, 1.184967041015625, 1.3408203125, 1.496673583984375, 1.65252685546875, 1.808380126953125, 1.9642333984375, 2.120086669921875, 2.27593994140625, 2.431793212890625, 2.587646484375, 2.743499755859375, 2.89935302734375, 3.055206298828125, 3.2110595703125, 3.366912841796875, 3.52276611328125, 3.678619384765625, 3.83447265625, 3.990325927734375, 4.14617919921875, 4.302032470703125, 4.4578857421875, 4.613739013671875, 4.76959228515625, 4.925445556640625, 5.081298828125, 5.237152099609375, 5.39300537109375, 5.548858642578125, 5.7047119140625, 5.860565185546875, 6.01641845703125, 6.172271728515625, 6.328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 10.0, 7.0, 3.0, 9.0, 11.0, 14.0, 24.0, 30.0, 42.0, 34.0, 47.0, 94.0, 123.0, 140.0, 116.0, 82.0, 53.0, 35.0, 23.0, 27.0, 25.0, 11.0, 15.0, 5.0, 5.0, 7.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7421875, -3.61041259765625, -3.4786376953125, -3.34686279296875, -3.215087890625, -3.08331298828125, -2.9515380859375, -2.81976318359375, -2.68798828125, -2.55621337890625, -2.4244384765625, -2.29266357421875, -2.160888671875, -2.02911376953125, -1.8973388671875, -1.76556396484375, -1.6337890625, -1.50201416015625, -1.3702392578125, -1.23846435546875, -1.106689453125, -0.97491455078125, -0.8431396484375, -0.71136474609375, -0.57958984375, -0.44781494140625, -0.3160400390625, -0.18426513671875, -0.052490234375, 0.07928466796875, 0.2110595703125, 0.34283447265625, 0.474609375, 0.60638427734375, 0.7381591796875, 0.86993408203125, 1.001708984375, 1.13348388671875, 1.2652587890625, 1.39703369140625, 1.52880859375, 1.66058349609375, 1.7923583984375, 1.92413330078125, 2.055908203125, 2.18768310546875, 2.3194580078125, 2.45123291015625, 2.5830078125, 2.71478271484375, 2.8465576171875, 2.97833251953125, 3.110107421875, 3.24188232421875, 3.3736572265625, 3.50543212890625, 3.63720703125, 3.76898193359375, 3.9007568359375, 4.03253173828125, 4.164306640625, 4.29608154296875, 4.4278564453125, 4.55963134765625, 4.69140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 8.0, 38.0, 66.0, 128.0, 326.0, 202.0, 95.0, 51.0, 25.0, 20.0, 11.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.0772933959961, -72.72566223144531, -69.37403106689453, -66.02239990234375, -62.6707763671875, -59.31914520263672, -55.96751403808594, -52.615882873535156, -49.26425552368164, -45.91262435913086, -42.560997009277344, -39.20936584472656, -35.85773468017578, -32.506107330322266, -29.154476165771484, -25.802846908569336, -22.451217651367188, -19.09958839416504, -15.747958183288574, -12.39632797241211, -9.044698715209961, -5.6930694580078125, -2.3414382934570312, 1.0101909637451172, 4.361820220947266, 7.713449954986572, 11.065079689025879, 14.416709899902344, 17.768339157104492, 21.11996841430664, 24.471599578857422, 27.82322883605957, 31.17486572265625, 34.52649688720703, 37.87812423706055, 41.22975540161133, 44.581382751464844, 47.933013916015625, 51.284645080566406, 54.63627624511719, 57.9879035949707, 61.339534759521484, 64.691162109375, 68.04279327392578, 71.39442443847656, 74.74604797363281, 78.09768676757812, 81.44931030273438, 84.80094146728516, 88.15257263183594, 91.50420379638672, 94.8558349609375, 98.20745849609375, 101.55908966064453, 104.91072082519531, 108.2623519897461, 111.61398315429688, 114.96561431884766, 118.31724548339844, 121.66886901855469, 125.02050018310547, 128.37213134765625, 131.7237548828125, 135.0753936767578, 138.42701721191406]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 10.0, 7.0, 7.0, 21.0, 16.0, 26.0, 21.0, 23.0, 31.0, 33.0, 29.0, 40.0, 47.0, 104.0, 142.0, 101.0, 52.0, 42.0, 37.0, 35.0, 28.0, 21.0, 26.0, 21.0, 14.0, 16.0, 10.0, 11.0, 5.0, 6.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-109.59367370605469, -106.89695739746094, -104.20023345947266, -101.5035171508789, -98.80680084228516, -96.1100845336914, -93.41336059570312, -90.71664428710938, -88.01992797851562, -85.32321166992188, -82.6264877319336, -79.92977142333984, -77.2330551147461, -74.53633880615234, -71.83961486816406, -69.14289855957031, -66.44618225097656, -63.74946212768555, -61.0527458190918, -58.35602569580078, -55.65930938720703, -52.962589263916016, -50.265869140625, -47.56915283203125, -44.87242889404297, -42.17570877075195, -39.4789924621582, -36.78227233886719, -34.08555603027344, -31.388835906982422, -28.69211769104004, -25.995399475097656, -23.298683166503906, -20.601964950561523, -17.90524673461914, -15.208527565002441, -12.511809349060059, -9.815091133117676, -7.118371963500977, -4.421653747558594, -1.724935531616211, 0.971782922744751, 3.668501377105713, 6.365220069885254, 9.061938285827637, 11.75865650177002, 14.455375671386719, 17.1520938873291, 19.848812103271484, 22.545530319213867, 25.24224853515625, 27.938968658447266, 30.635684967041016, 33.33240509033203, 36.02912139892578, 38.7258415222168, 41.42256164550781, 44.11928176879883, 46.81599807739258, 49.512718200683594, 52.209434509277344, 54.90615463256836, 57.602874755859375, 60.299591064453125, 62.996307373046875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 5.0, 13.0, 13.0, 21.0, 41.0, 54.0, 94.0, 136.0, 219.0, 416.0, 800.0, 1540.0, 3409.0, 9770.0, 50205.0, 866719.0, 2967832.0, 256902.0, 24542.0, 6435.0, 2507.0, 1143.0, 648.0, 328.0, 183.0, 108.0, 74.0, 40.0, 25.0, 25.0, 10.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.5048828125, -10.189453125, -9.8740234375, -9.55859375, -9.2431640625, -8.927734375, -8.6123046875, -8.296875, -7.9814453125, -7.666015625, -7.3505859375, -7.03515625, -6.7197265625, -6.404296875, -6.0888671875, -5.7734375, -5.4580078125, -5.142578125, -4.8271484375, -4.51171875, -4.1962890625, -3.880859375, -3.5654296875, -3.25, -2.9345703125, -2.619140625, -2.3037109375, -1.98828125, -1.6728515625, -1.357421875, -1.0419921875, -0.7265625, -0.4111328125, -0.095703125, 0.2197265625, 0.53515625, 0.8505859375, 1.166015625, 1.4814453125, 1.796875, 2.1123046875, 2.427734375, 2.7431640625, 3.05859375, 3.3740234375, 3.689453125, 4.0048828125, 4.3203125, 4.6357421875, 4.951171875, 5.2666015625, 5.58203125, 5.8974609375, 6.212890625, 6.5283203125, 6.84375, 7.1591796875, 7.474609375, 7.7900390625, 8.10546875, 8.4208984375, 8.736328125, 9.0517578125, 9.3671875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 4.0, 12.0, 11.0, 15.0, 20.0, 38.0, 32.0, 46.0, 46.0, 57.0, 52.0, 59.0, 74.0, 68.0, 71.0, 69.0, 49.0, 60.0, 50.0, 31.0, 22.0, 32.0, 21.0, 15.0, 14.0, 12.0, 7.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.74609375, -6.5494384765625, -6.352783203125, -6.1561279296875, -5.95947265625, -5.7628173828125, -5.566162109375, -5.3695068359375, -5.1728515625, -4.9761962890625, -4.779541015625, -4.5828857421875, -4.38623046875, -4.1895751953125, -3.992919921875, -3.7962646484375, -3.599609375, -3.4029541015625, -3.206298828125, -3.0096435546875, -2.81298828125, -2.6163330078125, -2.419677734375, -2.2230224609375, -2.0263671875, -1.8297119140625, -1.633056640625, -1.4364013671875, -1.23974609375, -1.0430908203125, -0.846435546875, -0.6497802734375, -0.453125, -0.2564697265625, -0.059814453125, 0.1368408203125, 0.33349609375, 0.5301513671875, 0.726806640625, 0.9234619140625, 1.1201171875, 1.3167724609375, 1.513427734375, 1.7100830078125, 1.90673828125, 2.1033935546875, 2.300048828125, 2.4967041015625, 2.693359375, 2.8900146484375, 3.086669921875, 3.2833251953125, 3.47998046875, 3.6766357421875, 3.873291015625, 4.0699462890625, 4.2666015625, 4.4632568359375, 4.659912109375, 4.8565673828125, 5.05322265625, 5.2498779296875, 5.446533203125, 5.6431884765625, 5.83984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 14.0, 20.0, 23.0, 53.0, 116.0, 289.0, 943.0, 5010.0, 89740.0, 4011573.0, 79852.0, 5126.0, 960.0, 275.0, 111.0, 65.0, 30.0, 12.0, 16.0, 13.0, 6.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.3125, -22.5478515625, -21.783203125, -21.0185546875, -20.25390625, -19.4892578125, -18.724609375, -17.9599609375, -17.1953125, -16.4306640625, -15.666015625, -14.9013671875, -14.13671875, -13.3720703125, -12.607421875, -11.8427734375, -11.078125, -10.3134765625, -9.548828125, -8.7841796875, -8.01953125, -7.2548828125, -6.490234375, -5.7255859375, -4.9609375, -4.1962890625, -3.431640625, -2.6669921875, -1.90234375, -1.1376953125, -0.373046875, 0.3916015625, 1.15625, 1.9208984375, 2.685546875, 3.4501953125, 4.21484375, 4.9794921875, 5.744140625, 6.5087890625, 7.2734375, 8.0380859375, 8.802734375, 9.5673828125, 10.33203125, 11.0966796875, 11.861328125, 12.6259765625, 13.390625, 14.1552734375, 14.919921875, 15.6845703125, 16.44921875, 17.2138671875, 17.978515625, 18.7431640625, 19.5078125, 20.2724609375, 21.037109375, 21.8017578125, 22.56640625, 23.3310546875, 24.095703125, 24.8603515625, 25.625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 13.0, 12.0, 14.0, 21.0, 31.0, 45.0, 62.0, 71.0, 155.0, 230.0, 388.0, 546.0, 687.0, 576.0, 431.0, 288.0, 176.0, 91.0, 79.0, 49.0, 29.0, 17.0, 15.0, 9.0, 9.0, 6.0, 7.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.287841796875, -7.95068359375, -7.613525390625, -7.2763671875, -6.939208984375, -6.60205078125, -6.264892578125, -5.927734375, -5.590576171875, -5.25341796875, -4.916259765625, -4.5791015625, -4.241943359375, -3.90478515625, -3.567626953125, -3.23046875, -2.893310546875, -2.55615234375, -2.218994140625, -1.8818359375, -1.544677734375, -1.20751953125, -0.870361328125, -0.533203125, -0.196044921875, 0.14111328125, 0.478271484375, 0.8154296875, 1.152587890625, 1.48974609375, 1.826904296875, 2.1640625, 2.501220703125, 2.83837890625, 3.175537109375, 3.5126953125, 3.849853515625, 4.18701171875, 4.524169921875, 4.861328125, 5.198486328125, 5.53564453125, 5.872802734375, 6.2099609375, 6.547119140625, 6.88427734375, 7.221435546875, 7.55859375, 7.895751953125, 8.23291015625, 8.570068359375, 8.9072265625, 9.244384765625, 9.58154296875, 9.918701171875, 10.255859375, 10.593017578125, 10.93017578125, 11.267333984375, 11.6044921875, 11.941650390625, 12.27880859375, 12.615966796875, 12.953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 20.0, 82.0, 243.0, 374.0, 179.0, 67.0, 22.0, 9.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.60047912597656, -192.05999755859375, -185.51951599121094, -178.97903442382812, -172.4385528564453, -165.8980712890625, -159.35760498046875, -152.81710815429688, -146.27664184570312, -139.7361602783203, -133.1956787109375, -126.65519714355469, -120.11471557617188, -113.57423400878906, -107.03376007080078, -100.49327850341797, -93.95278930664062, -87.41230773925781, -80.871826171875, -74.33134460449219, -67.79086303710938, -61.25038528442383, -54.70990753173828, -48.16942596435547, -41.628944396972656, -35.088462829589844, -28.547983169555664, -22.007503509521484, -15.467021942138672, -8.92654037475586, -2.3860626220703125, 4.1544189453125, 10.694915771484375, 17.235397338867188, 23.775876998901367, 30.316356658935547, 36.85683822631836, 43.39731979370117, 49.93779754638672, 56.47827911376953, 63.018760681152344, 69.55924224853516, 76.09972381591797, 82.64019775390625, 89.18067932128906, 95.72116088867188, 102.26164245605469, 108.8021240234375, 115.34260559082031, 121.88308715820312, 128.42356872558594, 134.96405029296875, 141.50453186035156, 148.04501342773438, 154.58547973632812, 161.1259765625, 167.66644287109375, 174.20692443847656, 180.74740600585938, 187.2878875732422, 193.828369140625, 200.3688507080078, 206.90933227539062, 213.44979858398438, 219.99029541015625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 9.0, 3.0, 5.0, 8.0, 10.0, 11.0, 16.0, 9.0, 20.0, 16.0, 20.0, 30.0, 28.0, 33.0, 38.0, 42.0, 47.0, 43.0, 51.0, 41.0, 38.0, 41.0, 46.0, 41.0, 36.0, 39.0, 33.0, 37.0, 33.0, 20.0, 25.0, 24.0, 23.0, 17.0, 12.0, 12.0, 6.0, 14.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-47.3223876953125, -45.875431060791016, -44.428470611572266, -42.98151397705078, -41.5345573425293, -40.08760070800781, -38.64064025878906, -37.19368362426758, -35.746726989746094, -34.29977035522461, -32.85280990600586, -31.405853271484375, -29.95889663696289, -28.511938095092773, -27.064979553222656, -25.618022918701172, -24.171064376831055, -22.724105834960938, -21.277149200439453, -19.830190658569336, -18.38323402404785, -16.936275482177734, -15.489317893981934, -14.042360305786133, -12.595402717590332, -11.148445129394531, -9.70148754119873, -8.25452995300293, -6.807571887969971, -5.36061429977417, -3.913656234741211, -2.46669864654541, -1.0197410583496094, 0.42721664905548096, 1.8741743564605713, 3.321132183074951, 4.768089771270752, 6.215047359466553, 7.662005424499512, 9.108963012695312, 10.555920600891113, 12.002878189086914, 13.449835777282715, 14.896793365478516, 16.343751907348633, 17.790708541870117, 19.237667083740234, 20.68462371826172, 22.131582260131836, 23.578540802001953, 25.025497436523438, 26.472455978393555, 27.91941261291504, 29.366371154785156, 30.81332778930664, 32.260284423828125, 33.707244873046875, 35.15420150756836, 36.60116195678711, 38.048118591308594, 39.49507522583008, 40.94203186035156, 42.38899230957031, 43.8359489440918, 45.28290557861328]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 27.0, 29.0, 69.0, 67.0, 129.0, 251.0, 408.0, 827.0, 1587.0, 3437.0, 8132.0, 20684.0, 60677.0, 212830.0, 473546.0, 180741.0, 53259.0, 18302.0, 7268.0, 3150.0, 1399.0, 700.0, 387.0, 246.0, 142.0, 99.0, 41.0, 38.0, 14.0, 17.0, 12.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.68658447265625, -6.4669189453125, -6.24725341796875, -6.027587890625, -5.80792236328125, -5.5882568359375, -5.36859130859375, -5.14892578125, -4.92926025390625, -4.7095947265625, -4.48992919921875, -4.270263671875, -4.05059814453125, -3.8309326171875, -3.61126708984375, -3.3916015625, -3.17193603515625, -2.9522705078125, -2.73260498046875, -2.512939453125, -2.29327392578125, -2.0736083984375, -1.85394287109375, -1.63427734375, -1.41461181640625, -1.1949462890625, -0.97528076171875, -0.755615234375, -0.53594970703125, -0.3162841796875, -0.09661865234375, 0.123046875, 0.34271240234375, 0.5623779296875, 0.78204345703125, 1.001708984375, 1.22137451171875, 1.4410400390625, 1.66070556640625, 1.88037109375, 2.10003662109375, 2.3197021484375, 2.53936767578125, 2.759033203125, 2.97869873046875, 3.1983642578125, 3.41802978515625, 3.6376953125, 3.85736083984375, 4.0770263671875, 4.29669189453125, 4.516357421875, 4.73602294921875, 4.9556884765625, 5.17535400390625, 5.39501953125, 5.61468505859375, 5.8343505859375, 6.05401611328125, 6.273681640625, 6.49334716796875, 6.7130126953125, 6.93267822265625, 7.15234375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 10.0, 12.0, 10.0, 19.0, 21.0, 25.0, 34.0, 30.0, 41.0, 46.0, 45.0, 51.0, 63.0, 63.0, 48.0, 67.0, 46.0, 50.0, 44.0, 42.0, 48.0, 36.0, 29.0, 34.0, 21.0, 14.0, 8.0, 15.0, 4.0, 7.0, 3.0, 4.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -4.9976806640625, -4.815673828125, -4.6336669921875, -4.45166015625, -4.2696533203125, -4.087646484375, -3.9056396484375, -3.7236328125, -3.5416259765625, -3.359619140625, -3.1776123046875, -2.99560546875, -2.8135986328125, -2.631591796875, -2.4495849609375, -2.267578125, -2.0855712890625, -1.903564453125, -1.7215576171875, -1.53955078125, -1.3575439453125, -1.175537109375, -0.9935302734375, -0.8115234375, -0.6295166015625, -0.447509765625, -0.2655029296875, -0.08349609375, 0.0985107421875, 0.280517578125, 0.4625244140625, 0.64453125, 0.8265380859375, 1.008544921875, 1.1905517578125, 1.37255859375, 1.5545654296875, 1.736572265625, 1.9185791015625, 2.1005859375, 2.2825927734375, 2.464599609375, 2.6466064453125, 2.82861328125, 3.0106201171875, 3.192626953125, 3.3746337890625, 3.556640625, 3.7386474609375, 3.920654296875, 4.1026611328125, 4.28466796875, 4.4666748046875, 4.648681640625, 4.8306884765625, 5.0126953125, 5.1947021484375, 5.376708984375, 5.5587158203125, 5.74072265625, 5.9227294921875, 6.104736328125, 6.2867431640625, 6.46875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 10.0, 10.0, 14.0, 27.0, 49.0, 60.0, 116.0, 183.0, 386.0, 766.0, 2052.0, 13295.0, 854102.0, 168471.0, 6184.0, 1527.0, 595.0, 298.0, 137.0, 112.0, 51.0, 33.0, 21.0, 20.0, 12.0, 7.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.171875, -27.36328125, -26.5546875, -25.74609375, -24.9375, -24.12890625, -23.3203125, -22.51171875, -21.703125, -20.89453125, -20.0859375, -19.27734375, -18.46875, -17.66015625, -16.8515625, -16.04296875, -15.234375, -14.42578125, -13.6171875, -12.80859375, -12.0, -11.19140625, -10.3828125, -9.57421875, -8.765625, -7.95703125, -7.1484375, -6.33984375, -5.53125, -4.72265625, -3.9140625, -3.10546875, -2.296875, -1.48828125, -0.6796875, 0.12890625, 0.9375, 1.74609375, 2.5546875, 3.36328125, 4.171875, 4.98046875, 5.7890625, 6.59765625, 7.40625, 8.21484375, 9.0234375, 9.83203125, 10.640625, 11.44921875, 12.2578125, 13.06640625, 13.875, 14.68359375, 15.4921875, 16.30078125, 17.109375, 17.91796875, 18.7265625, 19.53515625, 20.34375, 21.15234375, 21.9609375, 22.76953125, 23.578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 12.0, 10.0, 18.0, 14.0, 36.0, 39.0, 42.0, 53.0, 77.0, 76.0, 68.0, 89.0, 78.0, 76.0, 63.0, 50.0, 42.0, 41.0, 28.0, 19.0, 17.0, 7.0, 14.0, 4.0, 2.0, 6.0, 1.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.203125, -25.279052734375, -24.35498046875, -23.430908203125, -22.5068359375, -21.582763671875, -20.65869140625, -19.734619140625, -18.810546875, -17.886474609375, -16.96240234375, -16.038330078125, -15.1142578125, -14.190185546875, -13.26611328125, -12.342041015625, -11.41796875, -10.493896484375, -9.56982421875, -8.645751953125, -7.7216796875, -6.797607421875, -5.87353515625, -4.949462890625, -4.025390625, -3.101318359375, -2.17724609375, -1.253173828125, -0.3291015625, 0.594970703125, 1.51904296875, 2.443115234375, 3.3671875, 4.291259765625, 5.21533203125, 6.139404296875, 7.0634765625, 7.987548828125, 8.91162109375, 9.835693359375, 10.759765625, 11.683837890625, 12.60791015625, 13.531982421875, 14.4560546875, 15.380126953125, 16.30419921875, 17.228271484375, 18.15234375, 19.076416015625, 20.00048828125, 20.924560546875, 21.8486328125, 22.772705078125, 23.69677734375, 24.620849609375, 25.544921875, 26.468994140625, 27.39306640625, 28.317138671875, 29.2412109375, 30.165283203125, 31.08935546875, 32.013427734375, 32.9375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 4.0, 8.0, 10.0, 13.0, 17.0, 34.0, 52.0, 69.0, 104.0, 163.0, 312.0, 728.0, 1908.0, 6032.0, 28176.0, 663859.0, 313606.0, 24712.0, 5477.0, 1721.0, 693.0, 315.0, 163.0, 106.0, 68.0, 42.0, 39.0, 23.0, 14.0, 10.0, 7.0, 10.0, 8.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-5.92578125, -5.75628662109375, -5.5867919921875, -5.41729736328125, -5.247802734375, -5.07830810546875, -4.9088134765625, -4.73931884765625, -4.56982421875, -4.40032958984375, -4.2308349609375, -4.06134033203125, -3.891845703125, -3.72235107421875, -3.5528564453125, -3.38336181640625, -3.2138671875, -3.04437255859375, -2.8748779296875, -2.70538330078125, -2.535888671875, -2.36639404296875, -2.1968994140625, -2.02740478515625, -1.85791015625, -1.68841552734375, -1.5189208984375, -1.34942626953125, -1.179931640625, -1.01043701171875, -0.8409423828125, -0.67144775390625, -0.501953125, -0.33245849609375, -0.1629638671875, 0.00653076171875, 0.176025390625, 0.34552001953125, 0.5150146484375, 0.68450927734375, 0.85400390625, 1.02349853515625, 1.1929931640625, 1.36248779296875, 1.531982421875, 1.70147705078125, 1.8709716796875, 2.04046630859375, 2.2099609375, 2.37945556640625, 2.5489501953125, 2.71844482421875, 2.887939453125, 3.05743408203125, 3.2269287109375, 3.39642333984375, 3.56591796875, 3.73541259765625, 3.9049072265625, 4.07440185546875, 4.243896484375, 4.41339111328125, 4.5828857421875, 4.75238037109375, 4.921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 4.0, 9.0, 19.0, 31.0, 42.0, 52.0, 106.0, 185.0, 200.0, 119.0, 65.0, 38.0, 28.0, 13.0, 9.0, 11.0, 4.0, 5.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013914108276367188, -0.0013463646173477173, -0.0013013184070587158, -0.0012562721967697144, -0.0012112259864807129, -0.0011661797761917114, -0.00112113356590271, -0.0010760873556137085, -0.001031041145324707, -0.0009859949350357056, -0.0009409487247467041, -0.0008959025144577026, -0.0008508563041687012, -0.0008058100938796997, -0.0007607638835906982, -0.0007157176733016968, -0.0006706714630126953, -0.0006256252527236938, -0.0005805790424346924, -0.0005355328321456909, -0.0004904866218566895, -0.000445440411567688, -0.0004003942012786865, -0.00035534799098968506, -0.0003103017807006836, -0.00026525557041168213, -0.00022020936012268066, -0.0001751631498336792, -0.00013011693954467773, -8.507072925567627e-05, -4.0024518966674805e-05, 5.02169132232666e-06, 5.0067901611328125e-05, 9.511411190032959e-05, 0.00014016032218933105, 0.00018520653247833252, 0.00023025274276733398, 0.00027529895305633545, 0.0003203451633453369, 0.0003653913736343384, 0.00041043758392333984, 0.0004554837942123413, 0.0005005300045013428, 0.0005455762147903442, 0.0005906224250793457, 0.0006356686353683472, 0.0006807148456573486, 0.0007257610559463501, 0.0007708072662353516, 0.000815853476524353, 0.0008608996868133545, 0.000905945897102356, 0.0009509921073913574, 0.0009960383176803589, 0.0010410845279693604, 0.0010861307382583618, 0.0011311769485473633, 0.0011762231588363647, 0.0012212693691253662, 0.0012663155794143677, 0.0013113617897033691, 0.0013564079999923706, 0.001401454210281372, 0.0014465004205703735, 0.001491546630859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 13.0, 10.0, 15.0, 14.0, 46.0, 48.0, 80.0, 134.0, 214.0, 436.0, 905.0, 2108.0, 5778.0, 20230.0, 118307.0, 786926.0, 87850.0, 16658.0, 5002.0, 1923.0, 818.0, 429.0, 244.0, 127.0, 76.0, 57.0, 33.0, 18.0, 13.0, 10.0, 7.0, 7.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.974853515625, -3.84423828125, -3.713623046875, -3.5830078125, -3.452392578125, -3.32177734375, -3.191162109375, -3.060546875, -2.929931640625, -2.79931640625, -2.668701171875, -2.5380859375, -2.407470703125, -2.27685546875, -2.146240234375, -2.015625, -1.885009765625, -1.75439453125, -1.623779296875, -1.4931640625, -1.362548828125, -1.23193359375, -1.101318359375, -0.970703125, -0.840087890625, -0.70947265625, -0.578857421875, -0.4482421875, -0.317626953125, -0.18701171875, -0.056396484375, 0.07421875, 0.204833984375, 0.33544921875, 0.466064453125, 0.5966796875, 0.727294921875, 0.85791015625, 0.988525390625, 1.119140625, 1.249755859375, 1.38037109375, 1.510986328125, 1.6416015625, 1.772216796875, 1.90283203125, 2.033447265625, 2.1640625, 2.294677734375, 2.42529296875, 2.555908203125, 2.6865234375, 2.817138671875, 2.94775390625, 3.078369140625, 3.208984375, 3.339599609375, 3.47021484375, 3.600830078125, 3.7314453125, 3.862060546875, 3.99267578125, 4.123291015625, 4.25390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 10.0, 8.0, 19.0, 12.0, 28.0, 40.0, 43.0, 48.0, 73.0, 104.0, 98.0, 104.0, 92.0, 69.0, 56.0, 45.0, 44.0, 18.0, 15.0, 8.0, 11.0, 6.0, 8.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.0234375, -3.91168212890625, -3.7999267578125, -3.68817138671875, -3.576416015625, -3.46466064453125, -3.3529052734375, -3.24114990234375, -3.12939453125, -3.01763916015625, -2.9058837890625, -2.79412841796875, -2.682373046875, -2.57061767578125, -2.4588623046875, -2.34710693359375, -2.2353515625, -2.12359619140625, -2.0118408203125, -1.90008544921875, -1.788330078125, -1.67657470703125, -1.5648193359375, -1.45306396484375, -1.34130859375, -1.22955322265625, -1.1177978515625, -1.00604248046875, -0.894287109375, -0.78253173828125, -0.6707763671875, -0.55902099609375, -0.447265625, -0.33551025390625, -0.2237548828125, -0.11199951171875, -0.000244140625, 0.11151123046875, 0.2232666015625, 0.33502197265625, 0.44677734375, 0.55853271484375, 0.6702880859375, 0.78204345703125, 0.893798828125, 1.00555419921875, 1.1173095703125, 1.22906494140625, 1.3408203125, 1.45257568359375, 1.5643310546875, 1.67608642578125, 1.787841796875, 1.89959716796875, 2.0113525390625, 2.12310791015625, 2.23486328125, 2.34661865234375, 2.4583740234375, 2.57012939453125, 2.681884765625, 2.79364013671875, 2.9053955078125, 3.01715087890625, 3.12890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 11.0, 2.0, 16.0, 106.0, 574.0, 239.0, 44.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-302.7991027832031, -294.3559875488281, -285.9128723144531, -277.4697570800781, -269.0266418457031, -260.5835266113281, -252.1404266357422, -243.6973114013672, -235.2541961669922, -226.8110809326172, -218.3679656982422, -209.9248504638672, -201.48175048828125, -193.03863525390625, -184.59552001953125, -176.15240478515625, -167.70928955078125, -159.26617431640625, -150.82305908203125, -142.37994384765625, -133.93682861328125, -125.49372100830078, -117.05061340332031, -108.60749816894531, -100.16438293457031, -91.72126770019531, -83.27815246582031, -74.83504486083984, -66.39192962646484, -57.948814392089844, -49.50570297241211, -41.062591552734375, -32.61944580078125, -24.176332473754883, -15.733219146728516, -7.290105819702148, 1.1530075073242188, 9.596122741699219, 18.039234161376953, 26.482345581054688, 34.92546081542969, 43.36857604980469, 51.81168746948242, 60.254798889160156, 68.69791412353516, 77.14102935791016, 85.58413696289062, 94.02725219726562, 102.47036743164062, 110.91348266601562, 119.35659790039062, 127.7997055053711, 136.24282836914062, 144.68594360351562, 153.12904357910156, 161.57215881347656, 170.01527404785156, 178.45838928222656, 186.90150451660156, 195.34461975097656, 203.7877197265625, 212.2308349609375, 220.6739501953125, 229.1170654296875, 237.5601806640625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 11.0, 13.0, 11.0, 17.0, 20.0, 27.0, 36.0, 32.0, 33.0, 38.0, 39.0, 66.0, 137.0, 163.0, 52.0, 41.0, 35.0, 44.0, 30.0, 17.0, 27.0, 24.0, 15.0, 13.0, 11.0, 9.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-124.73792266845703, -121.45777130126953, -118.17762756347656, -114.89747619628906, -111.61732482910156, -108.3371810913086, -105.0570297241211, -101.77688598632812, -98.49673461914062, -95.21658325195312, -91.93643951416016, -88.65628814697266, -85.37614440917969, -82.09599304199219, -78.81584167480469, -75.53569030761719, -72.25554656982422, -68.97539520263672, -65.69525146484375, -62.41510009765625, -59.134952545166016, -55.85480499267578, -52.57465362548828, -49.29450607299805, -46.01435852050781, -42.73421096801758, -39.454063415527344, -36.173912048339844, -32.89376449584961, -29.613616943359375, -26.333467483520508, -23.05331802368164, -19.773178100585938, -16.493030548095703, -13.212881088256836, -9.932732582092285, -6.652584075927734, -3.3724365234375, -0.09228706359863281, 3.1878623962402344, 6.468009948730469, 9.74815845489502, 13.02830696105957, 16.308456420898438, 19.588603973388672, 22.868751525878906, 26.148900985717773, 29.42905044555664, 32.709197998046875, 35.98934555053711, 39.269493103027344, 42.549644470214844, 45.82979202270508, 49.10993957519531, 52.39009094238281, 55.67023849487305, 58.95038604736328, 62.230533599853516, 65.51068115234375, 68.79083251953125, 72.07098388671875, 75.35112762451172, 78.63127899169922, 81.91142272949219, 85.19157409667969]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 9.0, 5.0, 10.0, 18.0, 23.0, 38.0, 47.0, 120.0, 163.0, 271.0, 446.0, 747.0, 1442.0, 2485.0, 5001.0, 10932.0, 29954.0, 128923.0, 762794.0, 2142285.0, 893663.0, 156047.0, 35133.0, 12134.0, 5433.0, 2708.0, 1416.0, 820.0, 461.0, 241.0, 160.0, 102.0, 67.0, 62.0, 29.0, 19.0, 20.0, 14.0, 11.0, 2.0, 6.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.9375, -8.671142578125, -8.40478515625, -8.138427734375, -7.8720703125, -7.605712890625, -7.33935546875, -7.072998046875, -6.806640625, -6.540283203125, -6.27392578125, -6.007568359375, -5.7412109375, -5.474853515625, -5.20849609375, -4.942138671875, -4.67578125, -4.409423828125, -4.14306640625, -3.876708984375, -3.6103515625, -3.343994140625, -3.07763671875, -2.811279296875, -2.544921875, -2.278564453125, -2.01220703125, -1.745849609375, -1.4794921875, -1.213134765625, -0.94677734375, -0.680419921875, -0.4140625, -0.147705078125, 0.11865234375, 0.385009765625, 0.6513671875, 0.917724609375, 1.18408203125, 1.450439453125, 1.716796875, 1.983154296875, 2.24951171875, 2.515869140625, 2.7822265625, 3.048583984375, 3.31494140625, 3.581298828125, 3.84765625, 4.114013671875, 4.38037109375, 4.646728515625, 4.9130859375, 5.179443359375, 5.44580078125, 5.712158203125, 5.978515625, 6.244873046875, 6.51123046875, 6.777587890625, 7.0439453125, 7.310302734375, 7.57666015625, 7.843017578125, 8.109375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 6.0, 9.0, 16.0, 22.0, 15.0, 27.0, 49.0, 45.0, 38.0, 48.0, 69.0, 61.0, 59.0, 57.0, 56.0, 48.0, 49.0, 53.0, 42.0, 31.0, 40.0, 25.0, 24.0, 21.0, 19.0, 16.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19140625, -5.01495361328125, -4.8385009765625, -4.66204833984375, -4.485595703125, -4.30914306640625, -4.1326904296875, -3.95623779296875, -3.77978515625, -3.60333251953125, -3.4268798828125, -3.25042724609375, -3.073974609375, -2.89752197265625, -2.7210693359375, -2.54461669921875, -2.3681640625, -2.19171142578125, -2.0152587890625, -1.83880615234375, -1.662353515625, -1.48590087890625, -1.3094482421875, -1.13299560546875, -0.95654296875, -0.78009033203125, -0.6036376953125, -0.42718505859375, -0.250732421875, -0.07427978515625, 0.1021728515625, 0.27862548828125, 0.455078125, 0.63153076171875, 0.8079833984375, 0.98443603515625, 1.160888671875, 1.33734130859375, 1.5137939453125, 1.69024658203125, 1.86669921875, 2.04315185546875, 2.2196044921875, 2.39605712890625, 2.572509765625, 2.74896240234375, 2.9254150390625, 3.10186767578125, 3.2783203125, 3.45477294921875, 3.6312255859375, 3.80767822265625, 3.984130859375, 4.16058349609375, 4.3370361328125, 4.51348876953125, 4.68994140625, 4.86639404296875, 5.0428466796875, 5.21929931640625, 5.395751953125, 5.57220458984375, 5.7486572265625, 5.92510986328125, 6.1015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 6.0, 19.0, 43.0, 52.0, 81.0, 147.0, 341.0, 634.0, 1651.0, 6407.0, 176527.0, 3978184.0, 24948.0, 3191.0, 1038.0, 451.0, 236.0, 125.0, 66.0, 35.0, 29.0, 14.0, 16.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.80078125, -33.5703125, -32.33984375, -31.109375, -29.87890625, -28.6484375, -27.41796875, -26.1875, -24.95703125, -23.7265625, -22.49609375, -21.265625, -20.03515625, -18.8046875, -17.57421875, -16.34375, -15.11328125, -13.8828125, -12.65234375, -11.421875, -10.19140625, -8.9609375, -7.73046875, -6.5, -5.26953125, -4.0390625, -2.80859375, -1.578125, -0.34765625, 0.8828125, 2.11328125, 3.34375, 4.57421875, 5.8046875, 7.03515625, 8.265625, 9.49609375, 10.7265625, 11.95703125, 13.1875, 14.41796875, 15.6484375, 16.87890625, 18.109375, 19.33984375, 20.5703125, 21.80078125, 23.03125, 24.26171875, 25.4921875, 26.72265625, 27.953125, 29.18359375, 30.4140625, 31.64453125, 32.875, 34.10546875, 35.3359375, 36.56640625, 37.796875, 39.02734375, 40.2578125, 41.48828125, 42.71875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 11.0, 27.0, 26.0, 42.0, 77.0, 109.0, 180.0, 283.0, 423.0, 595.0, 667.0, 563.0, 351.0, 256.0, 132.0, 110.0, 72.0, 37.0, 32.0, 20.0, 10.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-24.40625, -23.7877197265625, -23.169189453125, -22.5506591796875, -21.93212890625, -21.3135986328125, -20.695068359375, -20.0765380859375, -19.4580078125, -18.8394775390625, -18.220947265625, -17.6024169921875, -16.98388671875, -16.3653564453125, -15.746826171875, -15.1282958984375, -14.509765625, -13.8912353515625, -13.272705078125, -12.6541748046875, -12.03564453125, -11.4171142578125, -10.798583984375, -10.1800537109375, -9.5615234375, -8.9429931640625, -8.324462890625, -7.7059326171875, -7.08740234375, -6.4688720703125, -5.850341796875, -5.2318115234375, -4.61328125, -3.9947509765625, -3.376220703125, -2.7576904296875, -2.13916015625, -1.5206298828125, -0.902099609375, -0.2835693359375, 0.3349609375, 0.9534912109375, 1.572021484375, 2.1905517578125, 2.80908203125, 3.4276123046875, 4.046142578125, 4.6646728515625, 5.283203125, 5.9017333984375, 6.520263671875, 7.1387939453125, 7.75732421875, 8.3758544921875, 8.994384765625, 9.6129150390625, 10.2314453125, 10.8499755859375, 11.468505859375, 12.0870361328125, 12.70556640625, 13.3240966796875, 13.942626953125, 14.5611572265625, 15.1796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 10.0, 7.0, 14.0, 18.0, 32.0, 68.0, 115.0, 174.0, 205.0, 139.0, 96.0, 49.0, 22.0, 11.0, 7.0, 8.0, 3.0, 1.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-186.98609924316406, -180.78042602539062, -174.5747528076172, -168.36907958984375, -162.16342163085938, -155.95774841308594, -149.7520751953125, -143.54640197753906, -137.34072875976562, -131.1350555419922, -124.92938232421875, -118.72371673583984, -112.5180435180664, -106.31237030029297, -100.10670471191406, -93.90103149414062, -87.69535827636719, -81.48968505859375, -75.28401184082031, -69.0783462524414, -62.87267303466797, -56.66699981689453, -50.46133041381836, -44.25566101074219, -38.04998779296875, -31.844316482543945, -25.63864517211914, -19.432973861694336, -13.227302551269531, -7.021631240844727, -0.8159599304199219, 5.38970947265625, 11.59539794921875, 17.801069259643555, 24.00674057006836, 30.212411880493164, 36.41808319091797, 42.623756408691406, 48.82942581176758, 55.03509521484375, 61.24076843261719, 67.44644165039062, 73.65211486816406, 79.85778045654297, 86.0634536743164, 92.26912689208984, 98.47479248046875, 104.68046569824219, 110.88613891601562, 117.09181213378906, 123.2974853515625, 129.50315856933594, 135.70883178710938, 141.91448974609375, 148.1201629638672, 154.32583618164062, 160.53150939941406, 166.7371826171875, 172.94285583496094, 179.14852905273438, 185.35418701171875, 191.5598602294922, 197.76553344726562, 203.97120666503906, 210.1768798828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 16.0, 21.0, 30.0, 39.0, 50.0, 50.0, 84.0, 80.0, 88.0, 115.0, 84.0, 67.0, 62.0, 64.0, 45.0, 30.0, 15.0, 17.0, 14.0, 6.0, 10.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0], "bins": [-221.938720703125, -216.66555786132812, -211.39239501953125, -206.11923217773438, -200.8460693359375, -195.57290649414062, -190.29974365234375, -185.02659606933594, -179.75343322753906, -174.4802703857422, -169.2071075439453, -163.93394470214844, -158.66078186035156, -153.38763427734375, -148.11447143554688, -142.84130859375, -137.56814575195312, -132.29498291015625, -127.02182006835938, -121.7486572265625, -116.47550201416016, -111.20233917236328, -105.9291763305664, -100.65602111816406, -95.38284301757812, -90.10968017578125, -84.83651733398438, -79.5633544921875, -74.29019927978516, -69.01703643798828, -63.743873596191406, -58.4707145690918, -53.19755554199219, -47.92439270019531, -42.6512336730957, -37.37807083129883, -32.10491180419922, -26.831748962402344, -21.55858612060547, -16.28542709350586, -11.012264251708984, -5.739102840423584, -0.4659414291381836, 4.807220458984375, 10.080381393432617, 15.35354232788086, 20.626705169677734, 25.899864196777344, 31.17302703857422, 36.446189880371094, 41.7193489074707, 46.99251174926758, 52.26567077636719, 57.53883361816406, 62.81199645996094, 68.08515930175781, 73.35832214355469, 78.63148498535156, 83.90464782714844, 89.17781066894531, 94.45096588134766, 99.72412872314453, 104.9972915649414, 110.27044677734375, 115.54360961914062]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 8.0, 21.0, 22.0, 40.0, 69.0, 177.0, 417.0, 950.0, 3220.0, 14263.0, 141692.0, 817576.0, 58386.0, 8299.0, 2081.0, 728.0, 326.0, 144.0, 62.0, 30.0, 17.0, 7.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.9375, -16.4442138671875, -15.950927734375, -15.4576416015625, -14.96435546875, -14.4710693359375, -13.977783203125, -13.4844970703125, -12.9912109375, -12.4979248046875, -12.004638671875, -11.5113525390625, -11.01806640625, -10.5247802734375, -10.031494140625, -9.5382080078125, -9.044921875, -8.5516357421875, -8.058349609375, -7.5650634765625, -7.07177734375, -6.5784912109375, -6.085205078125, -5.5919189453125, -5.0986328125, -4.6053466796875, -4.112060546875, -3.6187744140625, -3.12548828125, -2.6322021484375, -2.138916015625, -1.6456298828125, -1.15234375, -0.6590576171875, -0.165771484375, 0.3275146484375, 0.82080078125, 1.3140869140625, 1.807373046875, 2.3006591796875, 2.7939453125, 3.2872314453125, 3.780517578125, 4.2738037109375, 4.76708984375, 5.2603759765625, 5.753662109375, 6.2469482421875, 6.740234375, 7.2335205078125, 7.726806640625, 8.2200927734375, 8.71337890625, 9.2066650390625, 9.699951171875, 10.1932373046875, 10.6865234375, 11.1798095703125, 11.673095703125, 12.1663818359375, 12.65966796875, 13.1529541015625, 13.646240234375, 14.1395263671875, 14.6328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 13.0, 22.0, 36.0, 26.0, 51.0, 78.0, 74.0, 99.0, 84.0, 92.0, 93.0, 88.0, 76.0, 48.0, 39.0, 25.0, 20.0, 7.0, 12.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.421875, -16.038818359375, -15.65576171875, -15.272705078125, -14.8896484375, -14.506591796875, -14.12353515625, -13.740478515625, -13.357421875, -12.974365234375, -12.59130859375, -12.208251953125, -11.8251953125, -11.442138671875, -11.05908203125, -10.676025390625, -10.29296875, -9.909912109375, -9.52685546875, -9.143798828125, -8.7607421875, -8.377685546875, -7.99462890625, -7.611572265625, -7.228515625, -6.845458984375, -6.46240234375, -6.079345703125, -5.6962890625, -5.313232421875, -4.93017578125, -4.547119140625, -4.1640625, -3.781005859375, -3.39794921875, -3.014892578125, -2.6318359375, -2.248779296875, -1.86572265625, -1.482666015625, -1.099609375, -0.716552734375, -0.33349609375, 0.049560546875, 0.4326171875, 0.815673828125, 1.19873046875, 1.581787109375, 1.96484375, 2.347900390625, 2.73095703125, 3.114013671875, 3.4970703125, 3.880126953125, 4.26318359375, 4.646240234375, 5.029296875, 5.412353515625, 5.79541015625, 6.178466796875, 6.5615234375, 6.944580078125, 7.32763671875, 7.710693359375, 8.09375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 8.0, 11.0, 8.0, 13.0, 18.0, 33.0, 30.0, 45.0, 60.0, 69.0, 79.0, 117.0, 194.0, 331.0, 587.0, 1346.0, 4201.0, 23196.0, 750687.0, 242807.0, 18359.0, 3617.0, 1155.0, 531.0, 339.0, 217.0, 112.0, 93.0, 64.0, 52.0, 39.0, 34.0, 17.0, 11.0, 18.0, 7.0, 8.0, 7.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.5390625, -11.1661376953125, -10.793212890625, -10.4202880859375, -10.04736328125, -9.6744384765625, -9.301513671875, -8.9285888671875, -8.5556640625, -8.1827392578125, -7.809814453125, -7.4368896484375, -7.06396484375, -6.6910400390625, -6.318115234375, -5.9451904296875, -5.572265625, -5.1993408203125, -4.826416015625, -4.4534912109375, -4.08056640625, -3.7076416015625, -3.334716796875, -2.9617919921875, -2.5888671875, -2.2159423828125, -1.843017578125, -1.4700927734375, -1.09716796875, -0.7242431640625, -0.351318359375, 0.0216064453125, 0.39453125, 0.7674560546875, 1.140380859375, 1.5133056640625, 1.88623046875, 2.2591552734375, 2.632080078125, 3.0050048828125, 3.3779296875, 3.7508544921875, 4.123779296875, 4.4967041015625, 4.86962890625, 5.2425537109375, 5.615478515625, 5.9884033203125, 6.361328125, 6.7342529296875, 7.107177734375, 7.4801025390625, 7.85302734375, 8.2259521484375, 8.598876953125, 8.9718017578125, 9.3447265625, 9.7176513671875, 10.090576171875, 10.4635009765625, 10.83642578125, 11.2093505859375, 11.582275390625, 11.9552001953125, 12.328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 3.0, 8.0, 10.0, 15.0, 15.0, 26.0, 35.0, 36.0, 39.0, 41.0, 58.0, 67.0, 96.0, 103.0, 94.0, 65.0, 49.0, 36.0, 40.0, 23.0, 32.0, 21.0, 22.0, 13.0, 9.0, 6.0, 9.0, 7.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.96875, -25.982421875, -24.99609375, -24.009765625, -23.0234375, -22.037109375, -21.05078125, -20.064453125, -19.078125, -18.091796875, -17.10546875, -16.119140625, -15.1328125, -14.146484375, -13.16015625, -12.173828125, -11.1875, -10.201171875, -9.21484375, -8.228515625, -7.2421875, -6.255859375, -5.26953125, -4.283203125, -3.296875, -2.310546875, -1.32421875, -0.337890625, 0.6484375, 1.634765625, 2.62109375, 3.607421875, 4.59375, 5.580078125, 6.56640625, 7.552734375, 8.5390625, 9.525390625, 10.51171875, 11.498046875, 12.484375, 13.470703125, 14.45703125, 15.443359375, 16.4296875, 17.416015625, 18.40234375, 19.388671875, 20.375, 21.361328125, 22.34765625, 23.333984375, 24.3203125, 25.306640625, 26.29296875, 27.279296875, 28.265625, 29.251953125, 30.23828125, 31.224609375, 32.2109375, 33.197265625, 34.18359375, 35.169921875, 36.15625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 11.0, 11.0, 10.0, 16.0, 34.0, 46.0, 62.0, 97.0, 184.0, 352.0, 886.0, 2435.0, 8173.0, 47788.0, 881462.0, 89132.0, 12317.0, 3272.0, 1177.0, 445.0, 257.0, 146.0, 71.0, 47.0, 36.0, 21.0, 23.0, 13.0, 10.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9384765625, -1.8751983642578125, -1.811920166015625, -1.7486419677734375, -1.68536376953125, -1.6220855712890625, -1.558807373046875, -1.4955291748046875, -1.4322509765625, -1.3689727783203125, -1.305694580078125, -1.2424163818359375, -1.17913818359375, -1.1158599853515625, -1.052581787109375, -0.9893035888671875, -0.926025390625, -0.8627471923828125, -0.799468994140625, -0.7361907958984375, -0.67291259765625, -0.6096343994140625, -0.546356201171875, -0.4830780029296875, -0.4197998046875, -0.3565216064453125, -0.293243408203125, -0.2299652099609375, -0.16668701171875, -0.1034088134765625, -0.040130615234375, 0.0231475830078125, 0.08642578125, 0.1497039794921875, 0.212982177734375, 0.2762603759765625, 0.33953857421875, 0.4028167724609375, 0.466094970703125, 0.5293731689453125, 0.5926513671875, 0.6559295654296875, 0.719207763671875, 0.7824859619140625, 0.84576416015625, 0.9090423583984375, 0.972320556640625, 1.0355987548828125, 1.098876953125, 1.1621551513671875, 1.225433349609375, 1.2887115478515625, 1.35198974609375, 1.4152679443359375, 1.478546142578125, 1.5418243408203125, 1.6051025390625, 1.6683807373046875, 1.731658935546875, 1.7949371337890625, 1.85821533203125, 1.9214935302734375, 1.984771728515625, 2.0480499267578125, 2.111328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 3.0, 14.0, 12.0, 21.0, 10.0, 29.0, 43.0, 54.0, 89.0, 114.0, 118.0, 125.0, 123.0, 58.0, 44.0, 39.0, 25.0, 15.0, 12.0, 6.0, 17.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0006594657897949219, -0.0006439685821533203, -0.0006284713745117188, -0.0006129741668701172, -0.0005974769592285156, -0.0005819797515869141, -0.0005664825439453125, -0.0005509853363037109, -0.0005354881286621094, -0.0005199909210205078, -0.0005044937133789062, -0.0004889965057373047, -0.0004734992980957031, -0.00045800209045410156, -0.0004425048828125, -0.00042700767517089844, -0.0004115104675292969, -0.0003960132598876953, -0.00038051605224609375, -0.0003650188446044922, -0.0003495216369628906, -0.00033402442932128906, -0.0003185272216796875, -0.00030303001403808594, -0.0002875328063964844, -0.0002720355987548828, -0.00025653839111328125, -0.0002410411834716797, -0.00022554397583007812, -0.00021004676818847656, -0.000194549560546875, -0.00017905235290527344, -0.00016355514526367188, -0.0001480579376220703, -0.00013256072998046875, -0.00011706352233886719, -0.00010156631469726562, -8.606910705566406e-05, -7.05718994140625e-05, -5.507469177246094e-05, -3.9577484130859375e-05, -2.4080276489257812e-05, -8.58306884765625e-06, 6.9141387939453125e-06, 2.2411346435546875e-05, 3.790855407714844e-05, 5.340576171875e-05, 6.890296936035156e-05, 8.440017700195312e-05, 9.989738464355469e-05, 0.00011539459228515625, 0.0001308917999267578, 0.00014638900756835938, 0.00016188621520996094, 0.0001773834228515625, 0.00019288063049316406, 0.00020837783813476562, 0.0002238750457763672, 0.00023937225341796875, 0.0002548694610595703, 0.0002703666687011719, 0.00028586387634277344, 0.000301361083984375, 0.00031685829162597656, 0.0003323554992675781]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 14.0, 16.0, 31.0, 51.0, 108.0, 230.0, 465.0, 1224.0, 3726.0, 14086.0, 86521.0, 867069.0, 59035.0, 11073.0, 3034.0, 1039.0, 429.0, 175.0, 101.0, 36.0, 28.0, 12.0, 10.0, 6.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.397064208984375, -2.33123779296875, -2.265411376953125, -2.1995849609375, -2.133758544921875, -2.06793212890625, -2.002105712890625, -1.936279296875, -1.870452880859375, -1.80462646484375, -1.738800048828125, -1.6729736328125, -1.607147216796875, -1.54132080078125, -1.475494384765625, -1.40966796875, -1.343841552734375, -1.27801513671875, -1.212188720703125, -1.1463623046875, -1.080535888671875, -1.01470947265625, -0.948883056640625, -0.883056640625, -0.817230224609375, -0.75140380859375, -0.685577392578125, -0.6197509765625, -0.553924560546875, -0.48809814453125, -0.422271728515625, -0.3564453125, -0.290618896484375, -0.22479248046875, -0.158966064453125, -0.0931396484375, -0.027313232421875, 0.03851318359375, 0.104339599609375, 0.170166015625, 0.235992431640625, 0.30181884765625, 0.367645263671875, 0.4334716796875, 0.499298095703125, 0.56512451171875, 0.630950927734375, 0.69677734375, 0.762603759765625, 0.82843017578125, 0.894256591796875, 0.9600830078125, 1.025909423828125, 1.09173583984375, 1.157562255859375, 1.223388671875, 1.289215087890625, 1.35504150390625, 1.420867919921875, 1.4866943359375, 1.552520751953125, 1.61834716796875, 1.684173583984375, 1.75]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 10.0, 5.0, 7.0, 10.0, 8.0, 11.0, 15.0, 18.0, 23.0, 23.0, 39.0, 59.0, 54.0, 61.0, 80.0, 90.0, 66.0, 65.0, 66.0, 59.0, 50.0, 37.0, 19.0, 26.0, 17.0, 12.0, 16.0, 9.0, 11.0, 6.0, 3.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.4163665771484375, -1.368865966796875, -1.3213653564453125, -1.27386474609375, -1.2263641357421875, -1.178863525390625, -1.1313629150390625, -1.0838623046875, -1.0363616943359375, -0.988861083984375, -0.9413604736328125, -0.89385986328125, -0.8463592529296875, -0.798858642578125, -0.7513580322265625, -0.703857421875, -0.6563568115234375, -0.608856201171875, -0.5613555908203125, -0.51385498046875, -0.4663543701171875, -0.418853759765625, -0.3713531494140625, -0.3238525390625, -0.2763519287109375, -0.228851318359375, -0.1813507080078125, -0.13385009765625, -0.0863494873046875, -0.038848876953125, 0.0086517333984375, 0.05615234375, 0.1036529541015625, 0.151153564453125, 0.1986541748046875, 0.24615478515625, 0.2936553955078125, 0.341156005859375, 0.3886566162109375, 0.4361572265625, 0.4836578369140625, 0.531158447265625, 0.5786590576171875, 0.62615966796875, 0.6736602783203125, 0.721160888671875, 0.7686614990234375, 0.816162109375, 0.8636627197265625, 0.911163330078125, 0.9586639404296875, 1.00616455078125, 1.0536651611328125, 1.101165771484375, 1.1486663818359375, 1.1961669921875, 1.2436676025390625, 1.291168212890625, 1.3386688232421875, 1.38616943359375, 1.4336700439453125, 1.481170654296875, 1.5286712646484375, 1.576171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 12.0, 19.0, 13.0, 42.0, 105.0, 516.0, 162.0, 65.0, 29.0, 22.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.85951232910156, -161.33152770996094, -157.8035430908203, -154.2755584716797, -150.74758911132812, -147.2196044921875, -143.69161987304688, -140.16363525390625, -136.63565063476562, -133.107666015625, -129.57968139648438, -126.05170440673828, -122.52371978759766, -118.99573516845703, -115.46775817871094, -111.93977355957031, -108.41178894042969, -104.88380432128906, -101.35581970214844, -97.82784271240234, -94.29985809326172, -90.7718734741211, -87.243896484375, -83.71591186523438, -80.18792724609375, -76.65994262695312, -73.1319580078125, -69.6039810180664, -66.07599639892578, -62.548011779785156, -59.0200309753418, -55.49205017089844, -51.964073181152344, -48.43608856201172, -44.90810775756836, -41.380126953125, -37.852142333984375, -34.32415771484375, -30.79617691040039, -27.2681941986084, -23.740211486816406, -20.212228775024414, -16.684246063232422, -13.15626335144043, -9.628280639648438, -6.100297927856445, -2.572315216064453, 0.9556674957275391, 4.483650207519531, 8.011632919311523, 11.539615631103516, 15.067598342895508, 18.5955810546875, 22.123563766479492, 25.651546478271484, 29.179529190063477, 32.70751190185547, 36.235496520996094, 39.76347732543945, 43.29145812988281, 46.81944274902344, 50.34742736816406, 53.87540817260742, 57.40338897705078, 60.931373596191406]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 7.0, 7.0, 7.0, 10.0, 13.0, 15.0, 15.0, 18.0, 15.0, 21.0, 17.0, 24.0, 28.0, 46.0, 157.0, 299.0, 68.0, 34.0, 21.0, 18.0, 20.0, 20.0, 25.0, 10.0, 12.0, 13.0, 7.0, 5.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.678955078125, -66.32838439941406, -63.977813720703125, -61.62724304199219, -59.27667236328125, -56.92610168457031, -54.57553482055664, -52.2249641418457, -49.874393463134766, -47.52382278442383, -45.17325210571289, -42.82268142700195, -40.47211456298828, -38.121543884277344, -35.770973205566406, -33.42040252685547, -31.06983184814453, -28.719261169433594, -26.368690490722656, -24.01812171936035, -21.667551040649414, -19.316980361938477, -16.966411590576172, -14.615840911865234, -12.265270233154297, -9.91469955444336, -7.564129829406738, -5.213559627532959, -2.8629894256591797, -0.5124187469482422, 1.838150978088379, 4.188720703125, 6.5392913818359375, 8.889862060546875, 11.240431785583496, 13.591001510620117, 15.941572189331055, 18.292142868041992, 20.642711639404297, 22.993282318115234, 25.343852996826172, 27.69442367553711, 30.044994354248047, 32.395565032958984, 34.746131896972656, 37.096702575683594, 39.44727325439453, 41.79784393310547, 44.148414611816406, 46.498985290527344, 48.84955596923828, 51.20012664794922, 53.550697326660156, 55.901268005371094, 58.251834869384766, 60.6024055480957, 62.95297622680664, 65.30354309082031, 67.65411376953125, 70.00468444824219, 72.35525512695312, 74.70582580566406, 77.056396484375, 79.40696716308594, 81.75753784179688]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 11.0, 8.0, 9.0, 12.0, 7.0, 9.0, 12.0, 35.0, 23.0, 24.0, 35.0, 40.0, 42.0, 75.0, 230.0, 133.0, 47.0, 43.0, 34.0, 39.0, 25.0, 16.0, 19.0, 16.0, 19.0, 12.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.796875, -8.5697021484375, -8.342529296875, -8.1153564453125, -7.88818359375, -7.6610107421875, -7.433837890625, -7.2066650390625, -6.9794921875, -6.7523193359375, -6.525146484375, -6.2979736328125, -6.07080078125, -5.8436279296875, -5.616455078125, -5.3892822265625, -5.162109375, -4.9349365234375, -4.707763671875, -4.4805908203125, -4.25341796875, -4.0262451171875, -3.799072265625, -3.5718994140625, -3.3447265625, -3.1175537109375, -2.890380859375, -2.6632080078125, -2.43603515625, -2.2088623046875, -1.981689453125, -1.7545166015625, -1.52734375, -1.3001708984375, -1.072998046875, -0.8458251953125, -0.61865234375, -0.3914794921875, -0.164306640625, 0.0628662109375, 0.2900390625, 0.5172119140625, 0.744384765625, 0.9715576171875, 1.19873046875, 1.4259033203125, 1.653076171875, 1.8802490234375, 2.107421875, 2.3345947265625, 2.561767578125, 2.7889404296875, 3.01611328125, 3.2432861328125, 3.470458984375, 3.6976318359375, 3.9248046875, 4.1519775390625, 4.379150390625, 4.6063232421875, 4.83349609375, 5.0606689453125, 5.287841796875, 5.5150146484375, 5.7421875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 9.0, 15.0, 21.0, 4.0, 5.0, 9.0, 22.0, 55.0, 78.0, 163.0, 355.0, 1255.0, 7532.0, 8351625.0, 24079.0, 2344.0, 500.0, 240.0, 106.0, 44.0, 46.0, 21.0, 12.0, 10.0, 12.0, 3.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.75170135498047, -49.36695098876953, -46.98219680786133, -44.597442626953125, -42.21269226074219, -39.82794189453125, -37.44318771362305, -35.058433532714844, -32.673683166503906, -30.288930892944336, -27.904178619384766, -25.519426345825195, -23.134674072265625, -20.749921798706055, -18.365169525146484, -15.980417251586914, -13.595664978027344, -11.210912704467773, -8.826160430908203, -6.441408157348633, -4.0566558837890625, -1.6719036102294922, 0.7128486633300781, 3.0976009368896484, 5.482353210449219, 7.867105484008789, 10.25185775756836, 12.63661003112793, 15.0213623046875, 17.40611457824707, 19.79086685180664, 22.17561912536621, 24.560379028320312, 26.945131301879883, 29.329883575439453, 31.714635848999023, 34.099388122558594, 36.48413848876953, 38.868892669677734, 41.25364685058594, 43.638397216796875, 46.02314758300781, 48.407901763916016, 50.79265594482422, 53.177406311035156, 55.562156677246094, 57.9469108581543, 60.3316650390625, 62.71641540527344, 65.10116577148438, 67.48591613769531, 69.87067413330078, 72.25542449951172, 74.64017486572266, 77.02493286132812, 79.40968322753906, 81.79443359375, 84.17918395996094, 86.56393432617188, 88.94869232177734, 91.33344268798828, 93.71819305419922, 96.10295104980469, 98.48770141601562, 100.87245178222656]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 7.0, 7.0, 3.0, 1.0, 2.0, 8.0, 1.0, 8.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-177.3442840576172, -173.36721801757812, -169.39015197753906, -165.4130859375, -161.43603515625, -157.45896911621094, -153.48190307617188, -149.5048370361328, -145.52777099609375, -141.5507049560547, -137.57363891601562, -133.59658813476562, -129.61952209472656, -125.6424560546875, -121.66539001464844, -117.68832397460938, -113.71126556396484, -109.73419952392578, -105.75714111328125, -101.78007507324219, -97.80300903320312, -93.82594299316406, -89.84888458251953, -85.87181854248047, -81.89476013183594, -77.91769409179688, -73.94063568115234, -69.96356964111328, -65.98650360107422, -62.00944137573242, -58.032379150390625, -54.05531311035156, -50.0782470703125, -46.1011848449707, -42.12411880493164, -38.147056579589844, -34.16999053955078, -30.192928314208984, -26.215866088867188, -22.238801956176758, -18.261737823486328, -14.284673690795898, -10.307610511779785, -6.330547332763672, -2.353483200073242, 1.6235809326171875, 5.600643157958984, 9.577707290649414, 13.554771423339844, 17.531835556030273, 21.508899688720703, 25.4859619140625, 29.46302604675293, 33.44009017944336, 37.417152404785156, 41.39421844482422, 45.371280670166016, 49.34834289550781, 53.325408935546875, 57.30247116088867, 61.27953338623047, 65.25659942626953, 69.23365783691406, 73.21072387695312, 77.18778991699219]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 11.0, 24.0, 31.0, 37.0, 55.0, 73.0, 84.0, 86.0, 109.0, 88.0, 85.0, 74.0, 61.0, 47.0, 32.0, 37.0, 21.0, 13.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.685302734375, -4.54638671875, -4.407470703125, -4.2685546875, -4.129638671875, -3.99072265625, -3.851806640625, -3.712890625, -3.573974609375, -3.43505859375, -3.296142578125, -3.1572265625, -3.018310546875, -2.87939453125, -2.740478515625, -2.6015625, -2.462646484375, -2.32373046875, -2.184814453125, -2.0458984375, -1.906982421875, -1.76806640625, -1.629150390625, -1.490234375, -1.351318359375, -1.21240234375, -1.073486328125, -0.9345703125, -0.795654296875, -0.65673828125, -0.517822265625, -0.37890625, -0.239990234375, -0.10107421875, 0.037841796875, 0.1767578125, 0.315673828125, 0.45458984375, 0.593505859375, 0.732421875, 0.871337890625, 1.01025390625, 1.149169921875, 1.2880859375, 1.427001953125, 1.56591796875, 1.704833984375, 1.84375, 1.982666015625, 2.12158203125, 2.260498046875, 2.3994140625, 2.538330078125, 2.67724609375, 2.816162109375, 2.955078125, 3.093994140625, 3.23291015625, 3.371826171875, 3.5107421875, 3.649658203125, 3.78857421875, 3.927490234375, 4.06640625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 8.0, 6.0, 5.0, 17.0, 43.0, 64.0, 128.0, 318.0, 966.0, 5545.0, 70864.0, 386950.0, 53533.0, 4321.0, 907.0, 313.0, 126.0, 61.0, 37.0, 24.0, 13.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.1875, -110.873046875, -107.55859375, -104.244140625, -100.9296875, -97.615234375, -94.30078125, -90.986328125, -87.671875, -84.357421875, -81.04296875, -77.728515625, -74.4140625, -71.099609375, -67.78515625, -64.470703125, -61.15625, -57.841796875, -54.52734375, -51.212890625, -47.8984375, -44.583984375, -41.26953125, -37.955078125, -34.640625, -31.326171875, -28.01171875, -24.697265625, -21.3828125, -18.068359375, -14.75390625, -11.439453125, -8.125, -4.810546875, -1.49609375, 1.818359375, 5.1328125, 8.447265625, 11.76171875, 15.076171875, 18.390625, 21.705078125, 25.01953125, 28.333984375, 31.6484375, 34.962890625, 38.27734375, 41.591796875, 44.90625, 48.220703125, 51.53515625, 54.849609375, 58.1640625, 61.478515625, 64.79296875, 68.107421875, 71.421875, 74.736328125, 78.05078125, 81.365234375, 84.6796875, 87.994140625, 91.30859375, 94.623046875, 97.9375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 14.0, 13.0, 21.0, 33.0, 47.0, 91.0, 118.0, 136.0, 135.0, 139.0, 88.0, 63.0, 48.0, 22.0, 11.0, 11.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09375, -18.618408203125, -18.14306640625, -17.667724609375, -17.1923828125, -16.717041015625, -16.24169921875, -15.766357421875, -15.291015625, -14.815673828125, -14.34033203125, -13.864990234375, -13.3896484375, -12.914306640625, -12.43896484375, -11.963623046875, -11.48828125, -11.012939453125, -10.53759765625, -10.062255859375, -9.5869140625, -9.111572265625, -8.63623046875, -8.160888671875, -7.685546875, -7.210205078125, -6.73486328125, -6.259521484375, -5.7841796875, -5.308837890625, -4.83349609375, -4.358154296875, -3.8828125, -3.407470703125, -2.93212890625, -2.456787109375, -1.9814453125, -1.506103515625, -1.03076171875, -0.555419921875, -0.080078125, 0.395263671875, 0.87060546875, 1.345947265625, 1.8212890625, 2.296630859375, 2.77197265625, 3.247314453125, 3.72265625, 4.197998046875, 4.67333984375, 5.148681640625, 5.6240234375, 6.099365234375, 6.57470703125, 7.050048828125, 7.525390625, 8.000732421875, 8.47607421875, 8.951416015625, 9.4267578125, 9.902099609375, 10.37744140625, 10.852783203125, 11.328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 2.0, 3.0, 4.0, 10.0, 14.0, 36.0, 74.0, 172.0, 91.0, 39.0, 16.0, 6.0, 6.0, 4.0, 7.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-106.58972930908203, -104.20504760742188, -101.82035827636719, -99.4356689453125, -97.05098724365234, -94.66630554199219, -92.2816162109375, -89.89692687988281, -87.51224517822266, -85.1275634765625, -82.74287414550781, -80.35818481445312, -77.97350311279297, -75.58882141113281, -73.20413208007812, -70.81944274902344, -68.43476104736328, -66.05007934570312, -63.66539001464844, -61.280704498291016, -58.896018981933594, -56.51133346557617, -54.12664794921875, -51.74196243286133, -49.357276916503906, -46.972591400146484, -44.58790588378906, -42.20322036743164, -39.81853485107422, -37.4338493347168, -35.049163818359375, -32.66447830200195, -30.27979278564453, -27.89510726928711, -25.510421752929688, -23.125736236572266, -20.741050720214844, -18.356365203857422, -15.9716796875, -13.586994171142578, -11.202308654785156, -8.817623138427734, -6.4329376220703125, -4.048252105712891, -1.6635665893554688, 0.7211189270019531, 3.105804443359375, 5.490489959716797, 7.875175476074219, 10.25986099243164, 12.644546508789062, 15.029232025146484, 17.413917541503906, 19.798603057861328, 22.18328857421875, 24.567974090576172, 26.952659606933594, 29.337345123291016, 31.722030639648438, 34.10671615600586, 36.49140167236328, 38.8760871887207, 41.260772705078125, 43.64545822143555, 46.03014373779297]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 3.0, 3.0, 4.0, 6.0, 15.0, 24.0, 36.0, 54.0, 85.0, 63.0, 58.0, 22.0, 26.0, 13.0, 10.0, 15.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.44866943359375, -30.308494567871094, -29.16832160949707, -28.028146743774414, -26.88797378540039, -25.747798919677734, -24.607624053955078, -23.467449188232422, -22.3272762298584, -21.187101364135742, -20.04692840576172, -18.906753540039062, -17.766578674316406, -16.626405715942383, -15.486230850219727, -14.346056938171387, -13.205883026123047, -12.065709114074707, -10.925535202026367, -9.785360336303711, -8.645186424255371, -7.505012512207031, -6.364838123321533, -5.224663734436035, -4.084489822387695, -2.9443156719207764, -1.8041415214538574, -0.6639673709869385, 0.47620677947998047, 1.6163806915283203, 2.7565550804138184, 3.8967294692993164, 5.036903381347656, 6.177077293395996, 7.317251682281494, 8.457426071166992, 9.597599983215332, 10.737773895263672, 11.877948760986328, 13.018122673034668, 14.158296585083008, 15.298470497131348, 16.438644409179688, 17.578819274902344, 18.718994140625, 19.859167098999023, 20.99934196472168, 22.139514923095703, 23.27968978881836, 24.419864654541016, 25.56003761291504, 26.700212478637695, 27.84038543701172, 28.980560302734375, 30.12073516845703, 31.260910034179688, 32.401084899902344, 33.541259765625, 34.681434631347656, 35.82160568237305, 36.9617805480957, 38.10195541381836, 39.242130279541016, 40.38230514526367, 41.52247619628906]}, "eval/loss": 6.05579948425293, "eval/wer": 1.3242760809202698, "eval/runtime": 647.7056, "eval/samples_per_second": 4.079, "eval/steps_per_second": 0.511} \ No newline at end of file