{"train/loss": 4.706, "train/learning_rate": 0.0002688, "train/epoch": 0.88, "train/global_step": 450, "_runtime": 4153, "_timestamp": 1646264118, "_step": 449, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 8.0, 7.0, 13.0, 14.0, 21.0, 25.0, 20.0, 40.0, 70.0, 102.0, 153.0, 157.0, 83.0, 73.0, 48.0, 33.0, 18.0, 28.0, 16.0, 20.0, 7.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-269.8289489746094, -260.6154479980469, -251.4019317626953, -242.18841552734375, -232.97491455078125, -223.76141357421875, -214.5478973388672, -205.33438110351562, -196.12088012695312, -186.90737915039062, -177.69386291503906, -168.4803466796875, -159.266845703125, -150.0533447265625, -140.83982849121094, -131.62631225585938, -122.41281127929688, -113.19930267333984, -103.98579406738281, -94.77228546142578, -85.55877685546875, -76.34526824951172, -67.13175964355469, -57.918251037597656, -48.704742431640625, -39.491233825683594, -30.277725219726562, -21.06421661376953, -11.8507080078125, -2.6371994018554688, 6.5763092041015625, 15.789817810058594, 25.00335693359375, 34.21686553955078, 43.43037414550781, 52.643882751464844, 61.857391357421875, 71.0708999633789, 80.28440856933594, 89.49791717529297, 98.71142578125, 107.92493438720703, 117.13844299316406, 126.3519515991211, 135.56546020507812, 144.77896118164062, 153.9924774169922, 163.20599365234375, 172.41949462890625, 181.63299560546875, 190.8465118408203, 200.06002807617188, 209.27352905273438, 218.48703002929688, 227.70054626464844, 236.9140625, 246.1275634765625, 255.341064453125, 264.5545654296875, 273.7680969238281, 282.9815979003906, 292.1950988769531, 301.40863037109375, 310.62213134765625, 319.83563232421875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 1.0, 5.0, 2.0, 2.0, 5.0, 9.0, 11.0, 22.0, 26.0, 38.0, 46.0, 59.0, 92.0, 104.0, 129.0, 81.0, 76.0, 62.0, 47.0, 35.0, 22.0, 26.0, 16.0, 15.0, 10.0, 7.0, 8.0, 11.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1637.169677734375, -1582.742919921875, -1528.3162841796875, -1473.8895263671875, -1419.462890625, -1365.0361328125, -1310.609375, -1256.1827392578125, -1201.7559814453125, -1147.3292236328125, -1092.902587890625, -1038.475830078125, -984.0491333007812, -929.6224365234375, -875.1957397460938, -820.76904296875, -766.3423461914062, -711.9156494140625, -657.4889526367188, -603.062255859375, -548.635498046875, -494.20880126953125, -439.7821044921875, -385.3553771972656, -330.9286804199219, -276.5019836425781, -222.07525634765625, -167.6485595703125, -113.22184753417969, -58.795135498046875, -4.368438720703125, 50.05828857421875, 104.4849853515625, 158.9116973876953, 213.33840942382812, 267.7651062011719, 322.19183349609375, 376.6185302734375, 431.04522705078125, 485.4719543457031, 539.898681640625, 594.3253784179688, 648.7520751953125, 703.1788330078125, 757.6055297851562, 812.0322265625, 866.4589233398438, 920.8856201171875, 975.3123168945312, 1029.739013671875, 1084.165771484375, 1138.5924072265625, 1193.0191650390625, 1247.44580078125, 1301.87255859375, 1356.29931640625, 1410.7259521484375, 1465.1527099609375, 1519.579345703125, 1574.006103515625, 1628.4327392578125, 1682.8594970703125, 1737.2861328125, 1791.712890625, 1846.1396484375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 4.0, 4.0, 7.0, 2.0, 6.0, 10.0, 11.0, 23.0, 28.0, 18.0, 32.0, 35.0, 61.0, 70.0, 67.0, 73.0, 73.0, 63.0, 75.0, 39.0, 47.0, 44.0, 37.0, 19.0, 14.0, 26.0, 21.0, 13.0, 15.0, 14.0, 13.0, 5.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.56005859375, -34.3701171875, -33.18017578125, -31.990234375, -30.80029296875, -29.6103515625, -28.42041015625, -27.23046875, -26.04052734375, -24.8505859375, -23.66064453125, -22.470703125, -21.28076171875, -20.0908203125, -18.90087890625, -17.7109375, -16.52099609375, -15.3310546875, -14.14111328125, -12.951171875, -11.76123046875, -10.5712890625, -9.38134765625, -8.19140625, -7.00146484375, -5.8115234375, -4.62158203125, -3.431640625, -2.24169921875, -1.0517578125, 0.13818359375, 1.328125, 2.51806640625, 3.7080078125, 4.89794921875, 6.087890625, 7.27783203125, 8.4677734375, 9.65771484375, 10.84765625, 12.03759765625, 13.2275390625, 14.41748046875, 15.607421875, 16.79736328125, 17.9873046875, 19.17724609375, 20.3671875, 21.55712890625, 22.7470703125, 23.93701171875, 25.126953125, 26.31689453125, 27.5068359375, 28.69677734375, 29.88671875, 31.07666015625, 32.2666015625, 33.45654296875, 34.646484375, 35.83642578125, 37.0263671875, 38.21630859375, 39.40625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 3.0, 9.0, 11.0, 15.0, 19.0, 33.0, 39.0, 58.0, 69.0, 87.0, 129.0, 188.0, 255.0, 382.0, 655.0, 1048.0, 1970.0, 4109.0, 10478.0, 41507.0, 3491079.0, 594508.0, 29934.0, 8952.0, 3760.0, 1949.0, 1092.0, 622.0, 420.0, 256.0, 196.0, 126.0, 89.0, 62.0, 43.0, 33.0, 25.0, 14.0, 15.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.5, -264.640625, -255.78125, -246.921875, -238.0625, -229.203125, -220.34375, -211.484375, -202.625, -193.765625, -184.90625, -176.046875, -167.1875, -158.328125, -149.46875, -140.609375, -131.75, -122.890625, -114.03125, -105.171875, -96.3125, -87.453125, -78.59375, -69.734375, -60.875, -52.015625, -43.15625, -34.296875, -25.4375, -16.578125, -7.71875, 1.140625, 10.0, 18.859375, 27.71875, 36.578125, 45.4375, 54.296875, 63.15625, 72.015625, 80.875, 89.734375, 98.59375, 107.453125, 116.3125, 125.171875, 134.03125, 142.890625, 151.75, 160.609375, 169.46875, 178.328125, 187.1875, 196.046875, 204.90625, 213.765625, 222.625, 231.484375, 240.34375, 249.203125, 258.0625, 266.921875, 275.78125, 284.640625, 293.5]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 6.0, 9.0, 18.0, 16.0, 26.0, 32.0, 49.0, 56.0, 78.0, 84.0, 169.0, 215.0, 411.0, 798.0, 938.0, 436.0, 210.0, 126.0, 90.0, 65.0, 65.0, 36.0, 25.0, 24.0, 17.0, 14.0, 14.0, 10.0, 11.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.25, -151.669921875, -147.08984375, -142.509765625, -137.9296875, -133.349609375, -128.76953125, -124.189453125, -119.609375, -115.029296875, -110.44921875, -105.869140625, -101.2890625, -96.708984375, -92.12890625, -87.548828125, -82.96875, -78.388671875, -73.80859375, -69.228515625, -64.6484375, -60.068359375, -55.48828125, -50.908203125, -46.328125, -41.748046875, -37.16796875, -32.587890625, -28.0078125, -23.427734375, -18.84765625, -14.267578125, -9.6875, -5.107421875, -0.52734375, 4.052734375, 8.6328125, 13.212890625, 17.79296875, 22.373046875, 26.953125, 31.533203125, 36.11328125, 40.693359375, 45.2734375, 49.853515625, 54.43359375, 59.013671875, 63.59375, 68.173828125, 72.75390625, 77.333984375, 81.9140625, 86.494140625, 91.07421875, 95.654296875, 100.234375, 104.814453125, 109.39453125, 113.974609375, 118.5546875, 123.134765625, 127.71484375, 132.294921875, 136.875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 2.0, 3.0, 8.0, 11.0, 15.0, 16.0, 16.0, 22.0, 34.0, 37.0, 60.0, 82.0, 133.0, 191.0, 326.0, 727.0, 2196.0, 14517.0, 579509.0, 3565348.0, 25867.0, 3095.0, 916.0, 370.0, 238.0, 159.0, 85.0, 70.0, 51.0, 43.0, 19.0, 27.0, 22.0, 18.0, 13.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-462.0, -446.65625, -431.3125, -415.96875, -400.625, -385.28125, -369.9375, -354.59375, -339.25, -323.90625, -308.5625, -293.21875, -277.875, -262.53125, -247.1875, -231.84375, -216.5, -201.15625, -185.8125, -170.46875, -155.125, -139.78125, -124.4375, -109.09375, -93.75, -78.40625, -63.0625, -47.71875, -32.375, -17.03125, -1.6875, 13.65625, 29.0, 44.34375, 59.6875, 75.03125, 90.375, 105.71875, 121.0625, 136.40625, 151.75, 167.09375, 182.4375, 197.78125, 213.125, 228.46875, 243.8125, 259.15625, 274.5, 289.84375, 305.1875, 320.53125, 335.875, 351.21875, 366.5625, 381.90625, 397.25, 412.59375, 427.9375, 443.28125, 458.625, 473.96875, 489.3125, 504.65625, 520.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 22.0, 63.0, 266.0, 498.0, 130.0, 21.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-684.9306640625, -649.278564453125, -613.62646484375, -577.974365234375, -542.3222045898438, -506.67010498046875, -471.01800537109375, -435.36590576171875, -399.7137756347656, -364.0616760253906, -328.4095458984375, -292.7574462890625, -257.1053466796875, -221.45321655273438, -185.80111694335938, -150.1490020751953, -114.49688720703125, -78.84477233886719, -43.192665100097656, -7.540557861328125, 28.111557006835938, 63.763671875, 99.415771484375, 135.06788635253906, 170.72000122070312, 206.3721160888672, 242.02423095703125, 277.67633056640625, 313.32843017578125, 348.9805603027344, 384.6326599121094, 420.2847900390625, 455.9368896484375, 491.5889892578125, 527.2410888671875, 562.8931884765625, 598.5453491210938, 634.1974487304688, 669.8495483398438, 705.5016479492188, 741.15380859375, 776.805908203125, 812.4580078125, 848.110107421875, 883.7622680664062, 919.4143676757812, 955.0664672851562, 990.7185668945312, 1026.37060546875, 1062.022705078125, 1097.6748046875, 1133.326904296875, 1168.97900390625, 1204.631103515625, 1240.283203125, 1275.9354248046875, 1311.5875244140625, 1347.2396240234375, 1382.8917236328125, 1418.5438232421875, 1454.1959228515625, 1489.84814453125, 1525.500244140625, 1561.15234375, 1596.804443359375]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 10.0, 12.0, 10.0, 15.0, 16.0, 19.0, 19.0, 22.0, 20.0, 25.0, 23.0, 25.0, 34.0, 33.0, 23.0, 41.0, 28.0, 33.0, 43.0, 35.0, 40.0, 51.0, 32.0, 33.0, 32.0, 35.0, 35.0, 25.0, 23.0, 25.0, 28.0, 25.0, 19.0, 14.0, 15.0, 12.0, 5.0, 15.0, 10.0, 8.0, 6.0, 7.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-369.4579162597656, -357.46026611328125, -345.46258544921875, -333.4649353027344, -321.46728515625, -309.4696044921875, -297.4719543457031, -285.47430419921875, -273.47662353515625, -261.4789733886719, -249.48129272460938, -237.483642578125, -225.48597717285156, -213.48831176757812, -201.49066162109375, -189.4929962158203, -177.49533081054688, -165.49766540527344, -153.5, -141.50234985351562, -129.5046844482422, -117.50701904296875, -105.50936126708984, -93.51170349121094, -81.5140380859375, -69.51637268066406, -57.518714904785156, -45.521053314208984, -33.52339172363281, -21.52573013305664, -9.528068542480469, 2.4695892333984375, 14.46728515625, 26.464946746826172, 38.462608337402344, 50.460269927978516, 62.45793151855469, 74.45559692382812, 86.45325469970703, 98.45091247558594, 110.44857788085938, 122.44624328613281, 134.44390869140625, 146.44155883789062, 158.43922424316406, 170.4368896484375, 182.43453979492188, 194.4322052001953, 206.42987060546875, 218.4275360107422, 230.42520141601562, 242.4228515625, 254.42051696777344, 266.4181823730469, 278.41583251953125, 290.41351318359375, 302.4111633300781, 314.4088134765625, 326.406494140625, 338.4041442871094, 350.40179443359375, 362.39947509765625, 374.3971252441406, 386.394775390625, 398.3924560546875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 5.0, 4.0, 11.0, 10.0, 18.0, 18.0, 19.0, 23.0, 29.0, 39.0, 49.0, 50.0, 59.0, 70.0, 79.0, 59.0, 52.0, 70.0, 45.0, 41.0, 24.0, 40.0, 25.0, 20.0, 18.0, 17.0, 16.0, 10.0, 10.0, 14.0, 10.0, 3.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.4375, -33.3056640625, -32.173828125, -31.0419921875, -29.91015625, -28.7783203125, -27.646484375, -26.5146484375, -25.3828125, -24.2509765625, -23.119140625, -21.9873046875, -20.85546875, -19.7236328125, -18.591796875, -17.4599609375, -16.328125, -15.1962890625, -14.064453125, -12.9326171875, -11.80078125, -10.6689453125, -9.537109375, -8.4052734375, -7.2734375, -6.1416015625, -5.009765625, -3.8779296875, -2.74609375, -1.6142578125, -0.482421875, 0.6494140625, 1.78125, 2.9130859375, 4.044921875, 5.1767578125, 6.30859375, 7.4404296875, 8.572265625, 9.7041015625, 10.8359375, 11.9677734375, 13.099609375, 14.2314453125, 15.36328125, 16.4951171875, 17.626953125, 18.7587890625, 19.890625, 21.0224609375, 22.154296875, 23.2861328125, 24.41796875, 25.5498046875, 26.681640625, 27.8134765625, 28.9453125, 30.0771484375, 31.208984375, 32.3408203125, 33.47265625, 34.6044921875, 35.736328125, 36.8681640625, 38.0]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 12.0, 12.0, 14.0, 41.0, 46.0, 84.0, 146.0, 239.0, 397.0, 683.0, 1235.0, 2254.0, 4792.0, 12840.0, 78165.0, 837398.0, 87100.0, 13159.0, 4802.0, 2282.0, 1168.0, 680.0, 387.0, 227.0, 146.0, 82.0, 52.0, 33.0, 24.0, 10.0, 6.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.0, -20.3916015625, -19.783203125, -19.1748046875, -18.56640625, -17.9580078125, -17.349609375, -16.7412109375, -16.1328125, -15.5244140625, -14.916015625, -14.3076171875, -13.69921875, -13.0908203125, -12.482421875, -11.8740234375, -11.265625, -10.6572265625, -10.048828125, -9.4404296875, -8.83203125, -8.2236328125, -7.615234375, -7.0068359375, -6.3984375, -5.7900390625, -5.181640625, -4.5732421875, -3.96484375, -3.3564453125, -2.748046875, -2.1396484375, -1.53125, -0.9228515625, -0.314453125, 0.2939453125, 0.90234375, 1.5107421875, 2.119140625, 2.7275390625, 3.3359375, 3.9443359375, 4.552734375, 5.1611328125, 5.76953125, 6.3779296875, 6.986328125, 7.5947265625, 8.203125, 8.8115234375, 9.419921875, 10.0283203125, 10.63671875, 11.2451171875, 11.853515625, 12.4619140625, 13.0703125, 13.6787109375, 14.287109375, 14.8955078125, 15.50390625, 16.1123046875, 16.720703125, 17.3291015625, 17.9375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 8.0, 8.0, 10.0, 12.0, 13.0, 17.0, 13.0, 15.0, 18.0, 22.0, 26.0, 20.0, 25.0, 26.0, 50.0, 33.0, 44.0, 37.0, 39.0, 31.0, 1062.0, 40.0, 35.0, 31.0, 41.0, 36.0, 39.0, 31.0, 29.0, 29.0, 28.0, 21.0, 17.0, 18.0, 11.0, 18.0, 11.0, 4.0, 7.0, 6.0, 2.0, 8.0, 7.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-18.96875, -18.36181640625, -17.7548828125, -17.14794921875, -16.541015625, -15.93408203125, -15.3271484375, -14.72021484375, -14.11328125, -13.50634765625, -12.8994140625, -12.29248046875, -11.685546875, -11.07861328125, -10.4716796875, -9.86474609375, -9.2578125, -8.65087890625, -8.0439453125, -7.43701171875, -6.830078125, -6.22314453125, -5.6162109375, -5.00927734375, -4.40234375, -3.79541015625, -3.1884765625, -2.58154296875, -1.974609375, -1.36767578125, -0.7607421875, -0.15380859375, 0.453125, 1.06005859375, 1.6669921875, 2.27392578125, 2.880859375, 3.48779296875, 4.0947265625, 4.70166015625, 5.30859375, 5.91552734375, 6.5224609375, 7.12939453125, 7.736328125, 8.34326171875, 8.9501953125, 9.55712890625, 10.1640625, 10.77099609375, 11.3779296875, 11.98486328125, 12.591796875, 13.19873046875, 13.8056640625, 14.41259765625, 15.01953125, 15.62646484375, 16.2333984375, 16.84033203125, 17.447265625, 18.05419921875, 18.6611328125, 19.26806640625, 19.875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 12.0, 19.0, 24.0, 37.0, 51.0, 72.0, 110.0, 153.0, 210.0, 241.0, 351.0, 532.0, 713.0, 1068.0, 1580.0, 2582.0, 4338.0, 7781.0, 15516.0, 35654.0, 100121.0, 496936.0, 1228684.0, 120043.0, 41323.0, 17411.0, 8558.0, 4701.0, 2772.0, 1801.0, 1165.0, 763.0, 498.0, 351.0, 234.0, 169.0, 138.0, 101.0, 73.0, 75.0, 45.0, 30.0, 20.0, 12.0, 14.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.28125, -4.14349365234375, -4.0057373046875, -3.86798095703125, -3.730224609375, -3.59246826171875, -3.4547119140625, -3.31695556640625, -3.17919921875, -3.04144287109375, -2.9036865234375, -2.76593017578125, -2.628173828125, -2.49041748046875, -2.3526611328125, -2.21490478515625, -2.0771484375, -1.93939208984375, -1.8016357421875, -1.66387939453125, -1.526123046875, -1.38836669921875, -1.2506103515625, -1.11285400390625, -0.97509765625, -0.83734130859375, -0.6995849609375, -0.56182861328125, -0.424072265625, -0.28631591796875, -0.1485595703125, -0.01080322265625, 0.126953125, 0.26470947265625, 0.4024658203125, 0.54022216796875, 0.677978515625, 0.81573486328125, 0.9534912109375, 1.09124755859375, 1.22900390625, 1.36676025390625, 1.5045166015625, 1.64227294921875, 1.780029296875, 1.91778564453125, 2.0555419921875, 2.19329833984375, 2.3310546875, 2.46881103515625, 2.6065673828125, 2.74432373046875, 2.882080078125, 3.01983642578125, 3.1575927734375, 3.29534912109375, 3.43310546875, 3.57086181640625, 3.7086181640625, 3.84637451171875, 3.984130859375, 4.12188720703125, 4.2596435546875, 4.39739990234375, 4.53515625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 6.0, 6.0, 5.0, 7.0, 10.0, 8.0, 9.0, 10.0, 12.0, 21.0, 18.0, 43.0, 54.0, 62.0, 77.0, 103.0, 129.0, 82.0, 62.0, 52.0, 30.0, 30.0, 27.0, 20.0, 18.0, 12.0, 11.0, 10.0, 10.0, 3.0, 7.0, 9.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7470703125, -0.7230682373046875, -0.699066162109375, -0.6750640869140625, -0.65106201171875, -0.6270599365234375, -0.603057861328125, -0.5790557861328125, -0.5550537109375, -0.5310516357421875, -0.507049560546875, -0.4830474853515625, -0.45904541015625, -0.4350433349609375, -0.411041259765625, -0.3870391845703125, -0.363037109375, -0.3390350341796875, -0.315032958984375, -0.2910308837890625, -0.26702880859375, -0.2430267333984375, -0.219024658203125, -0.1950225830078125, -0.1710205078125, -0.1470184326171875, -0.123016357421875, -0.0990142822265625, -0.07501220703125, -0.0510101318359375, -0.027008056640625, -0.0030059814453125, 0.02099609375, 0.0449981689453125, 0.069000244140625, 0.0930023193359375, 0.11700439453125, 0.1410064697265625, 0.165008544921875, 0.1890106201171875, 0.2130126953125, 0.2370147705078125, 0.261016845703125, 0.2850189208984375, 0.30902099609375, 0.3330230712890625, 0.357025146484375, 0.3810272216796875, 0.405029296875, 0.4290313720703125, 0.453033447265625, 0.4770355224609375, 0.50103759765625, 0.5250396728515625, 0.549041748046875, 0.5730438232421875, 0.5970458984375, 0.6210479736328125, 0.645050048828125, 0.6690521240234375, 0.69305419921875, 0.7170562744140625, 0.741058349609375, 0.7650604248046875, 0.7890625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 9.0, 6.0, 4.0, 9.0, 11.0, 11.0, 13.0, 21.0, 35.0, 50.0, 71.0, 96.0, 151.0, 220.0, 586.0, 934147.0, 111831.0, 554.0, 244.0, 161.0, 99.0, 49.0, 39.0, 32.0, 12.0, 10.0, 10.0, 10.0, 7.0, 5.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-21.96875, -21.30224609375, -20.6357421875, -19.96923828125, -19.302734375, -18.63623046875, -17.9697265625, -17.30322265625, -16.63671875, -15.97021484375, -15.3037109375, -14.63720703125, -13.970703125, -13.30419921875, -12.6376953125, -11.97119140625, -11.3046875, -10.63818359375, -9.9716796875, -9.30517578125, -8.638671875, -7.97216796875, -7.3056640625, -6.63916015625, -5.97265625, -5.30615234375, -4.6396484375, -3.97314453125, -3.306640625, -2.64013671875, -1.9736328125, -1.30712890625, -0.640625, 0.02587890625, 0.6923828125, 1.35888671875, 2.025390625, 2.69189453125, 3.3583984375, 4.02490234375, 4.69140625, 5.35791015625, 6.0244140625, 6.69091796875, 7.357421875, 8.02392578125, 8.6904296875, 9.35693359375, 10.0234375, 10.68994140625, 11.3564453125, 12.02294921875, 12.689453125, 13.35595703125, 14.0224609375, 14.68896484375, 15.35546875, 16.02197265625, 16.6884765625, 17.35498046875, 18.021484375, 18.68798828125, 19.3544921875, 20.02099609375, 20.6875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 31.0, 982.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8468017578125, -11.068922996520996, -10.291044235229492, -9.513166427612305, -8.735286712646484, -7.957408428192139, -7.179530143737793, -6.401651382446289, -5.623772621154785, -4.845893859863281, -4.068015098571777, -3.2901368141174316, -2.5122580528259277, -1.7343792915344238, -0.9565010070800781, -0.17862224578857422, 0.5992565155029297, 1.377135157585144, 2.1550137996673584, 2.932892322540283, 3.710771083831787, 4.488649845123291, 5.266528129577637, 6.044406890869141, 6.8222856521606445, 7.600164413452148, 8.378043174743652, 9.155921936035156, 9.933799743652344, 10.711679458618164, 11.489557266235352, 12.267436027526855, 13.04531478881836, 13.823193550109863, 14.601072311401367, 15.378950119018555, 16.156829833984375, 16.934707641601562, 17.71258544921875, 18.49046516418457, 19.26834487915039, 20.046222686767578, 20.8241024017334, 21.601980209350586, 22.379859924316406, 23.157737731933594, 23.93561553955078, 24.7134952545166, 25.49137306213379, 26.269250869750977, 27.047130584716797, 27.825008392333984, 28.602888107299805, 29.380765914916992, 30.158645629882812, 30.9365234375, 31.714401245117188, 32.492279052734375, 33.27015686035156, 34.048038482666016, 34.8259162902832, 35.60379409790039, 36.38167190551758, 37.15955352783203, 37.93743133544922]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 2.0, 2.0, 6.0, 12.0, 13.0, 19.0, 36.0, 32.0, 42.0, 38.0, 39.0, 59.0, 65.0, 68.0, 72.0, 59.0, 57.0, 63.0, 51.0, 55.0, 35.0, 29.0, 42.0, 26.0, 16.0, 19.0, 12.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0], "bins": [-3.3585169315338135, -3.2775042057037354, -3.196491241455078, -3.115478515625, -3.0344655513763428, -2.9534528255462646, -2.8724398612976074, -2.7914271354675293, -2.710414409637451, -2.629401683807373, -2.548388719558716, -2.4673759937286377, -2.3863630294799805, -2.3053503036499023, -2.224337339401245, -2.143324613571167, -2.0623116493225098, -1.981298804283142, -1.9002859592437744, -1.8192731142044067, -1.738260269165039, -1.657247543334961, -1.5762346982955933, -1.4952218532562256, -1.414209008216858, -1.3331961631774902, -1.2521833181381226, -1.1711704730987549, -1.0901577472686768, -1.0091447830200195, -0.9281320571899414, -0.8471192121505737, -0.7661066055297852, -0.6850937604904175, -0.6040809154510498, -0.5230681300163269, -0.44205528497695923, -0.36104243993759155, -0.28002962470054626, -0.19901680946350098, -0.1180039644241333, -0.03699113428592682, 0.04402169585227966, 0.12503452599048615, 0.20604735612869263, 0.2870602011680603, 0.3680730164051056, 0.4490858316421509, 0.5300986766815186, 0.6111115217208862, 0.6921243667602539, 0.7731371521949768, 0.8541499972343445, 0.9351628422737122, 1.016175627708435, 1.0971884727478027, 1.1782013177871704, 1.259214162826538, 1.3402270078659058, 1.4212398529052734, 1.5022525787353516, 1.5832655429840088, 1.664278268814087, 1.7452911138534546, 1.8263039588928223]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 5.0, 4.0, 11.0, 10.0, 18.0, 18.0, 19.0, 23.0, 29.0, 39.0, 48.0, 51.0, 58.0, 72.0, 78.0, 58.0, 52.0, 70.0, 46.0, 41.0, 23.0, 40.0, 25.0, 20.0, 19.0, 17.0, 16.0, 10.0, 10.0, 14.0, 8.0, 5.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.4375, -33.30615234375, -32.1748046875, -31.04345703125, -29.912109375, -28.78076171875, -27.6494140625, -26.51806640625, -25.38671875, -24.25537109375, -23.1240234375, -21.99267578125, -20.861328125, -19.72998046875, -18.5986328125, -17.46728515625, -16.3359375, -15.20458984375, -14.0732421875, -12.94189453125, -11.810546875, -10.67919921875, -9.5478515625, -8.41650390625, -7.28515625, -6.15380859375, -5.0224609375, -3.89111328125, -2.759765625, -1.62841796875, -0.4970703125, 0.63427734375, 1.765625, 2.89697265625, 4.0283203125, 5.15966796875, 6.291015625, 7.42236328125, 8.5537109375, 9.68505859375, 10.81640625, 11.94775390625, 13.0791015625, 14.21044921875, 15.341796875, 16.47314453125, 17.6044921875, 18.73583984375, 19.8671875, 20.99853515625, 22.1298828125, 23.26123046875, 24.392578125, 25.52392578125, 26.6552734375, 27.78662109375, 28.91796875, 30.04931640625, 31.1806640625, 32.31201171875, 33.443359375, 34.57470703125, 35.7060546875, 36.83740234375, 37.96875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 7.0, 10.0, 17.0, 19.0, 23.0, 35.0, 50.0, 44.0, 73.0, 96.0, 156.0, 187.0, 251.0, 364.0, 570.0, 859.0, 1718.0, 3600.0, 9531.0, 48710.0, 882839.0, 78184.0, 12086.0, 4105.0, 1946.0, 1017.0, 623.0, 400.0, 265.0, 188.0, 137.0, 107.0, 72.0, 58.0, 47.0, 39.0, 24.0, 18.0, 17.0, 17.0, 7.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-282.0, -273.34765625, -264.6953125, -256.04296875, -247.390625, -238.73828125, -230.0859375, -221.43359375, -212.78125, -204.12890625, -195.4765625, -186.82421875, -178.171875, -169.51953125, -160.8671875, -152.21484375, -143.5625, -134.91015625, -126.2578125, -117.60546875, -108.953125, -100.30078125, -91.6484375, -82.99609375, -74.34375, -65.69140625, -57.0390625, -48.38671875, -39.734375, -31.08203125, -22.4296875, -13.77734375, -5.125, 3.52734375, 12.1796875, 20.83203125, 29.484375, 38.13671875, 46.7890625, 55.44140625, 64.09375, 72.74609375, 81.3984375, 90.05078125, 98.703125, 107.35546875, 116.0078125, 124.66015625, 133.3125, 141.96484375, 150.6171875, 159.26953125, 167.921875, 176.57421875, 185.2265625, 193.87890625, 202.53125, 211.18359375, 219.8359375, 228.48828125, 237.140625, 245.79296875, 254.4453125, 263.09765625, 271.75]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 1.0, 7.0, 4.0, 6.0, 7.0, 8.0, 6.0, 9.0, 10.0, 15.0, 12.0, 22.0, 21.0, 24.0, 27.0, 26.0, 27.0, 31.0, 33.0, 43.0, 44.0, 55.0, 50.0, 90.0, 1862.0, 130.0, 55.0, 37.0, 50.0, 33.0, 30.0, 36.0, 21.0, 30.0, 28.0, 18.0, 25.0, 17.0, 25.0, 15.0, 14.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.375, -100.2138671875, -97.052734375, -93.8916015625, -90.73046875, -87.5693359375, -84.408203125, -81.2470703125, -78.0859375, -74.9248046875, -71.763671875, -68.6025390625, -65.44140625, -62.2802734375, -59.119140625, -55.9580078125, -52.796875, -49.6357421875, -46.474609375, -43.3134765625, -40.15234375, -36.9912109375, -33.830078125, -30.6689453125, -27.5078125, -24.3466796875, -21.185546875, -18.0244140625, -14.86328125, -11.7021484375, -8.541015625, -5.3798828125, -2.21875, 0.9423828125, 4.103515625, 7.2646484375, 10.42578125, 13.5869140625, 16.748046875, 19.9091796875, 23.0703125, 26.2314453125, 29.392578125, 32.5537109375, 35.71484375, 38.8759765625, 42.037109375, 45.1982421875, 48.359375, 51.5205078125, 54.681640625, 57.8427734375, 61.00390625, 64.1650390625, 67.326171875, 70.4873046875, 73.6484375, 76.8095703125, 79.970703125, 83.1318359375, 86.29296875, 89.4541015625, 92.615234375, 95.7763671875, 98.9375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 11.0, 8.0, 16.0, 22.0, 18.0, 17.0, 17.0, 26.0, 29.0, 29.0, 39.0, 55.0, 73.0, 182.0, 456.0, 2233.0, 109923.0, 3024656.0, 6349.0, 781.0, 258.0, 113.0, 68.0, 45.0, 34.0, 32.0, 22.0, 22.0, 25.0, 24.0, 16.0, 11.0, 12.0, 8.0, 7.0, 6.0, 8.0, 5.0, 5.0, 7.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-486.0, -470.42578125, -454.8515625, -439.27734375, -423.703125, -408.12890625, -392.5546875, -376.98046875, -361.40625, -345.83203125, -330.2578125, -314.68359375, -299.109375, -283.53515625, -267.9609375, -252.38671875, -236.8125, -221.23828125, -205.6640625, -190.08984375, -174.515625, -158.94140625, -143.3671875, -127.79296875, -112.21875, -96.64453125, -81.0703125, -65.49609375, -49.921875, -34.34765625, -18.7734375, -3.19921875, 12.375, 27.94921875, 43.5234375, 59.09765625, 74.671875, 90.24609375, 105.8203125, 121.39453125, 136.96875, 152.54296875, 168.1171875, 183.69140625, 199.265625, 214.83984375, 230.4140625, 245.98828125, 261.5625, 277.13671875, 292.7109375, 308.28515625, 323.859375, 339.43359375, 355.0078125, 370.58203125, 386.15625, 401.73046875, 417.3046875, 432.87890625, 448.453125, 464.02734375, 479.6015625, 495.17578125, 510.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 94.0, 913.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3376.05322265625, -3290.26806640625, -3204.483154296875, -3118.697998046875, -3032.912841796875, -2947.127685546875, -2861.3427734375, -2775.5576171875, -2689.7724609375, -2603.9873046875, -2518.202392578125, -2432.417236328125, -2346.632080078125, -2260.846923828125, -2175.06201171875, -2089.27685546875, -2003.4918212890625, -1917.706787109375, -1831.921630859375, -1746.1365966796875, -1660.3514404296875, -1574.56640625, -1488.78125, -1402.9962158203125, -1317.211181640625, -1231.4261474609375, -1145.6409912109375, -1059.85595703125, -974.07080078125, -888.2857666015625, -802.5006713867188, -716.715576171875, -630.930419921875, -545.1453247070312, -459.3602294921875, -373.5751647949219, -287.7900695800781, -202.00497436523438, -116.21990966796875, -30.434814453125, 55.35028076171875, 141.1353759765625, 226.9204559326172, 312.7055358886719, 398.4906311035156, 484.2757263183594, 570.060791015625, 655.8458862304688, 741.6309814453125, 827.4160766601562, 913.201171875, 998.9862060546875, 1084.7713623046875, 1170.556396484375, 1256.341552734375, 1342.1265869140625, 1427.91162109375, 1513.6966552734375, 1599.4818115234375, 1685.266845703125, 1771.052001953125, 1856.8370361328125, 1942.6220703125, 2028.4072265625, 2114.1923828125]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 8.0, 6.0, 11.0, 13.0, 15.0, 21.0, 26.0, 25.0, 30.0, 23.0, 23.0, 35.0, 41.0, 29.0, 39.0, 49.0, 47.0, 39.0, 30.0, 35.0, 42.0, 34.0, 44.0, 34.0, 32.0, 37.0, 24.0, 39.0, 19.0, 21.0, 20.0, 30.0, 10.0, 18.0, 8.0, 10.0, 5.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-437.02105712890625, -424.54473876953125, -412.0684509277344, -399.5921325683594, -387.1158447265625, -374.6395263671875, -362.1632385253906, -349.6869201660156, -337.21063232421875, -324.73431396484375, -312.2580261230469, -299.7817077636719, -287.305419921875, -274.8291015625, -262.3528137207031, -249.87649536132812, -237.4001922607422, -224.92388916015625, -212.4475860595703, -199.97128295898438, -187.49497985839844, -175.0186767578125, -162.5423583984375, -150.06607055664062, -137.58975219726562, -125.11344909667969, -112.63714599609375, -100.16084289550781, -87.68453979492188, -75.20823669433594, -62.73192596435547, -50.25562286376953, -37.779327392578125, -25.303024291992188, -12.826719284057617, -0.3504142761230469, 12.12588882446289, 24.602191925048828, 37.07849884033203, 49.55480194091797, 62.031105041503906, 74.50740814208984, 86.98371124267578, 99.46002197265625, 111.93632507324219, 124.41262817382812, 136.88893127441406, 149.365234375, 161.84153747558594, 174.31784057617188, 186.7941436767578, 199.27044677734375, 211.7467498779297, 224.22305297851562, 236.69937133789062, 249.1756591796875, 261.6519775390625, 274.1282958984375, 286.6045837402344, 299.0809020996094, 311.55718994140625, 324.03350830078125, 336.5097961425781, 348.9861145019531, 361.46240234375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 4.0, 2.0, 7.0, 5.0, 19.0, 10.0, 15.0, 28.0, 24.0, 27.0, 36.0, 46.0, 54.0, 63.0, 56.0, 67.0, 59.0, 67.0, 65.0, 46.0, 45.0, 29.0, 37.0, 20.0, 21.0, 25.0, 24.0, 11.0, 13.0, 9.0, 16.0, 7.0, 7.0, 5.0, 5.0, 5.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.0, -35.79150390625, -34.5830078125, -33.37451171875, -32.166015625, -30.95751953125, -29.7490234375, -28.54052734375, -27.33203125, -26.12353515625, -24.9150390625, -23.70654296875, -22.498046875, -21.28955078125, -20.0810546875, -18.87255859375, -17.6640625, -16.45556640625, -15.2470703125, -14.03857421875, -12.830078125, -11.62158203125, -10.4130859375, -9.20458984375, -7.99609375, -6.78759765625, -5.5791015625, -4.37060546875, -3.162109375, -1.95361328125, -0.7451171875, 0.46337890625, 1.671875, 2.88037109375, 4.0888671875, 5.29736328125, 6.505859375, 7.71435546875, 8.9228515625, 10.13134765625, 11.33984375, 12.54833984375, 13.7568359375, 14.96533203125, 16.173828125, 17.38232421875, 18.5908203125, 19.79931640625, 21.0078125, 22.21630859375, 23.4248046875, 24.63330078125, 25.841796875, 27.05029296875, 28.2587890625, 29.46728515625, 30.67578125, 31.88427734375, 33.0927734375, 34.30126953125, 35.509765625, 36.71826171875, 37.9267578125, 39.13525390625, 40.34375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 8.0, 13.0, 14.0, 16.0, 31.0, 48.0, 64.0, 121.0, 182.0, 281.0, 549.0, 1113.0, 2358.0, 5481.0, 17064.0, 90252.0, 3897356.0, 142836.0, 23188.0, 7426.0, 2927.0, 1313.0, 677.0, 345.0, 214.0, 134.0, 67.0, 60.0, 40.0, 25.0, 17.0, 12.0, 9.0, 4.0, 11.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.0, -240.58203125, -232.1640625, -223.74609375, -215.328125, -206.91015625, -198.4921875, -190.07421875, -181.65625, -173.23828125, -164.8203125, -156.40234375, -147.984375, -139.56640625, -131.1484375, -122.73046875, -114.3125, -105.89453125, -97.4765625, -89.05859375, -80.640625, -72.22265625, -63.8046875, -55.38671875, -46.96875, -38.55078125, -30.1328125, -21.71484375, -13.296875, -4.87890625, 3.5390625, 11.95703125, 20.375, 28.79296875, 37.2109375, 45.62890625, 54.046875, 62.46484375, 70.8828125, 79.30078125, 87.71875, 96.13671875, 104.5546875, 112.97265625, 121.390625, 129.80859375, 138.2265625, 146.64453125, 155.0625, 163.48046875, 171.8984375, 180.31640625, 188.734375, 197.15234375, 205.5703125, 213.98828125, 222.40625, 230.82421875, 239.2421875, 247.66015625, 256.078125, 264.49609375, 272.9140625, 281.33203125, 289.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 3.0, 5.0, 1.0, 5.0, 6.0, 10.0, 10.0, 12.0, 23.0, 15.0, 30.0, 28.0, 36.0, 63.0, 44.0, 82.0, 118.0, 134.0, 200.0, 375.0, 643.0, 793.0, 435.0, 255.0, 183.0, 138.0, 93.0, 58.0, 53.0, 51.0, 33.0, 19.0, 24.0, 22.0, 13.0, 13.0, 13.0, 8.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.625, -105.0361328125, -101.447265625, -97.8583984375, -94.26953125, -90.6806640625, -87.091796875, -83.5029296875, -79.9140625, -76.3251953125, -72.736328125, -69.1474609375, -65.55859375, -61.9697265625, -58.380859375, -54.7919921875, -51.203125, -47.6142578125, -44.025390625, -40.4365234375, -36.84765625, -33.2587890625, -29.669921875, -26.0810546875, -22.4921875, -18.9033203125, -15.314453125, -11.7255859375, -8.13671875, -4.5478515625, -0.958984375, 2.6298828125, 6.21875, 9.8076171875, 13.396484375, 16.9853515625, 20.57421875, 24.1630859375, 27.751953125, 31.3408203125, 34.9296875, 38.5185546875, 42.107421875, 45.6962890625, 49.28515625, 52.8740234375, 56.462890625, 60.0517578125, 63.640625, 67.2294921875, 70.818359375, 74.4072265625, 77.99609375, 81.5849609375, 85.173828125, 88.7626953125, 92.3515625, 95.9404296875, 99.529296875, 103.1181640625, 106.70703125, 110.2958984375, 113.884765625, 117.4736328125, 121.0625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 6.0, 9.0, 9.0, 10.0, 22.0, 29.0, 32.0, 51.0, 66.0, 110.0, 218.0, 366.0, 892.0, 2637.0, 9895.0, 58842.0, 3970596.0, 128183.0, 16159.0, 3771.0, 1194.0, 476.0, 235.0, 135.0, 79.0, 60.0, 46.0, 21.0, 27.0, 17.0, 11.0, 17.0, 11.0, 14.0, 4.0, 6.0, 0.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-474.0, -459.0234375, -444.046875, -429.0703125, -414.09375, -399.1171875, -384.140625, -369.1640625, -354.1875, -339.2109375, -324.234375, -309.2578125, -294.28125, -279.3046875, -264.328125, -249.3515625, -234.375, -219.3984375, -204.421875, -189.4453125, -174.46875, -159.4921875, -144.515625, -129.5390625, -114.5625, -99.5859375, -84.609375, -69.6328125, -54.65625, -39.6796875, -24.703125, -9.7265625, 5.25, 20.2265625, 35.203125, 50.1796875, 65.15625, 80.1328125, 95.109375, 110.0859375, 125.0625, 140.0390625, 155.015625, 169.9921875, 184.96875, 199.9453125, 214.921875, 229.8984375, 244.875, 259.8515625, 274.828125, 289.8046875, 304.78125, 319.7578125, 334.734375, 349.7109375, 364.6875, 379.6640625, 394.640625, 409.6171875, 424.59375, 439.5703125, 454.546875, 469.5234375, 484.5]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 88.0, 765.0, 147.0, 9.0, 2.0, 2.0, 1.0], "bins": [-5609.19091796875, -5513.380859375, -5417.5712890625, -5321.76123046875, -5225.95166015625, -5130.1416015625, -5034.33203125, -4938.52197265625, -4842.7119140625, -4746.90185546875, -4651.09228515625, -4555.2822265625, -4459.47265625, -4363.66259765625, -4267.85302734375, -4172.04296875, -4076.2333984375, -3980.423583984375, -3884.61376953125, -3788.803955078125, -3692.994140625, -3597.18408203125, -3501.374267578125, -3405.564453125, -3309.754638671875, -3213.94482421875, -3118.135009765625, -3022.3251953125, -2926.51513671875, -2830.705322265625, -2734.8955078125, -2639.085693359375, -2543.276123046875, -2447.46630859375, -2351.656494140625, -2255.8466796875, -2160.03662109375, -2064.226806640625, -1968.4169921875, -1872.607177734375, -1776.79736328125, -1680.987548828125, -1585.177734375, -1489.3677978515625, -1393.5579833984375, -1297.7481689453125, -1201.938232421875, -1106.12841796875, -1010.318603515625, -914.5087890625, -818.6989135742188, -722.8890380859375, -627.0792236328125, -531.2694091796875, -435.45953369140625, -339.649658203125, -243.83984375, -148.02999877929688, -52.22015380859375, 43.589691162109375, 139.3995361328125, 235.20938110351562, 331.01922607421875, 426.8291015625, 522.638916015625]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 9.0, 8.0, 10.0, 11.0, 18.0, 20.0, 26.0, 26.0, 27.0, 20.0, 24.0, 26.0, 27.0, 25.0, 37.0, 38.0, 41.0, 44.0, 36.0, 39.0, 43.0, 32.0, 40.0, 31.0, 39.0, 29.0, 31.0, 25.0, 25.0, 31.0, 28.0, 15.0, 14.0, 15.0, 17.0, 14.0, 7.0, 6.0, 7.0, 5.0, 4.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-379.9024658203125, -367.69268798828125, -355.4829406738281, -343.2731628417969, -331.06341552734375, -318.8536376953125, -306.64385986328125, -294.4341125488281, -282.224365234375, -270.01458740234375, -257.8048400878906, -245.59506225585938, -233.38531494140625, -221.175537109375, -208.9657745361328, -196.75601196289062, -184.54623413085938, -172.3364715576172, -160.126708984375, -147.91693115234375, -135.70718383789062, -123.4974136352539, -111.28764343261719, -99.077880859375, -86.86811828613281, -74.65835571289062, -62.44858932495117, -50.23882293701172, -38.02906036376953, -25.819297790527344, -13.609527587890625, -1.3997650146484375, 10.80999755859375, 23.01976203918457, 35.22952651977539, 47.439292907714844, 59.64905548095703, 71.85881805419922, 84.06858825683594, 96.27835083007812, 108.48811340332031, 120.6978759765625, 132.9076385498047, 145.11740112304688, 157.32717895507812, 169.53692626953125, 181.7467041015625, 193.9564666748047, 206.16622924804688, 218.37599182128906, 230.58575439453125, 242.7955322265625, 255.00527954101562, 267.2150573730469, 279.4248046875, 291.63458251953125, 303.8443603515625, 316.05413818359375, 328.2638854980469, 340.4736633300781, 352.68341064453125, 364.8931884765625, 377.10296630859375, 389.3127136230469, 401.5224609375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 12.0, 4.0, 4.0, 9.0, 19.0, 13.0, 11.0, 21.0, 29.0, 35.0, 39.0, 41.0, 44.0, 50.0, 55.0, 63.0, 53.0, 64.0, 49.0, 55.0, 34.0, 50.0, 35.0, 27.0, 25.0, 27.0, 19.0, 20.0, 12.0, 12.0, 10.0, 12.0, 8.0, 12.0, 4.0, 7.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.09375, -34.85400390625, -33.6142578125, -32.37451171875, -31.134765625, -29.89501953125, -28.6552734375, -27.41552734375, -26.17578125, -24.93603515625, -23.6962890625, -22.45654296875, -21.216796875, -19.97705078125, -18.7373046875, -17.49755859375, -16.2578125, -15.01806640625, -13.7783203125, -12.53857421875, -11.298828125, -10.05908203125, -8.8193359375, -7.57958984375, -6.33984375, -5.10009765625, -3.8603515625, -2.62060546875, -1.380859375, -0.14111328125, 1.0986328125, 2.33837890625, 3.578125, 4.81787109375, 6.0576171875, 7.29736328125, 8.537109375, 9.77685546875, 11.0166015625, 12.25634765625, 13.49609375, 14.73583984375, 15.9755859375, 17.21533203125, 18.455078125, 19.69482421875, 20.9345703125, 22.17431640625, 23.4140625, 24.65380859375, 25.8935546875, 27.13330078125, 28.373046875, 29.61279296875, 30.8525390625, 32.09228515625, 33.33203125, 34.57177734375, 35.8115234375, 37.05126953125, 38.291015625, 39.53076171875, 40.7705078125, 42.01025390625, 43.25]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 11.0, 9.0, 13.0, 13.0, 18.0, 38.0, 54.0, 64.0, 78.0, 122.0, 155.0, 217.0, 314.0, 411.0, 678.0, 1183.0, 2084.0, 4265.0, 9582.0, 31402.0, 402554.0, 539122.0, 35686.0, 10511.0, 4373.0, 2204.0, 1166.0, 689.0, 451.0, 303.0, 212.0, 152.0, 105.0, 90.0, 62.0, 46.0, 32.0, 19.0, 12.0, 18.0, 19.0, 5.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-23.78125, -23.1025390625, -22.423828125, -21.7451171875, -21.06640625, -20.3876953125, -19.708984375, -19.0302734375, -18.3515625, -17.6728515625, -16.994140625, -16.3154296875, -15.63671875, -14.9580078125, -14.279296875, -13.6005859375, -12.921875, -12.2431640625, -11.564453125, -10.8857421875, -10.20703125, -9.5283203125, -8.849609375, -8.1708984375, -7.4921875, -6.8134765625, -6.134765625, -5.4560546875, -4.77734375, -4.0986328125, -3.419921875, -2.7412109375, -2.0625, -1.3837890625, -0.705078125, -0.0263671875, 0.65234375, 1.3310546875, 2.009765625, 2.6884765625, 3.3671875, 4.0458984375, 4.724609375, 5.4033203125, 6.08203125, 6.7607421875, 7.439453125, 8.1181640625, 8.796875, 9.4755859375, 10.154296875, 10.8330078125, 11.51171875, 12.1904296875, 12.869140625, 13.5478515625, 14.2265625, 14.9052734375, 15.583984375, 16.2626953125, 16.94140625, 17.6201171875, 18.298828125, 18.9775390625, 19.65625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 8.0, 11.0, 6.0, 12.0, 13.0, 20.0, 16.0, 27.0, 22.0, 29.0, 32.0, 32.0, 45.0, 37.0, 51.0, 38.0, 51.0, 32.0, 1072.0, 36.0, 38.0, 47.0, 35.0, 40.0, 31.0, 32.0, 33.0, 36.0, 22.0, 13.0, 17.0, 12.0, 17.0, 13.0, 13.0, 11.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.265625, -24.4775390625, -23.689453125, -22.9013671875, -22.11328125, -21.3251953125, -20.537109375, -19.7490234375, -18.9609375, -18.1728515625, -17.384765625, -16.5966796875, -15.80859375, -15.0205078125, -14.232421875, -13.4443359375, -12.65625, -11.8681640625, -11.080078125, -10.2919921875, -9.50390625, -8.7158203125, -7.927734375, -7.1396484375, -6.3515625, -5.5634765625, -4.775390625, -3.9873046875, -3.19921875, -2.4111328125, -1.623046875, -0.8349609375, -0.046875, 0.7412109375, 1.529296875, 2.3173828125, 3.10546875, 3.8935546875, 4.681640625, 5.4697265625, 6.2578125, 7.0458984375, 7.833984375, 8.6220703125, 9.41015625, 10.1982421875, 10.986328125, 11.7744140625, 12.5625, 13.3505859375, 14.138671875, 14.9267578125, 15.71484375, 16.5029296875, 17.291015625, 18.0791015625, 18.8671875, 19.6552734375, 20.443359375, 21.2314453125, 22.01953125, 22.8076171875, 23.595703125, 24.3837890625, 25.171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 5.0, 9.0, 15.0, 16.0, 25.0, 33.0, 56.0, 69.0, 98.0, 148.0, 188.0, 266.0, 370.0, 497.0, 673.0, 995.0, 1506.0, 2260.0, 3689.0, 6094.0, 11106.0, 22304.0, 53718.0, 164841.0, 1439925.0, 255505.0, 71741.0, 28165.0, 13181.0, 7069.0, 4211.0, 2754.0, 1779.0, 1124.0, 818.0, 516.0, 381.0, 256.0, 212.0, 144.0, 110.0, 73.0, 54.0, 31.0, 26.0, 19.0, 11.0, 13.0, 13.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.55859375, -5.377197265625, -5.19580078125, -5.014404296875, -4.8330078125, -4.651611328125, -4.47021484375, -4.288818359375, -4.107421875, -3.926025390625, -3.74462890625, -3.563232421875, -3.3818359375, -3.200439453125, -3.01904296875, -2.837646484375, -2.65625, -2.474853515625, -2.29345703125, -2.112060546875, -1.9306640625, -1.749267578125, -1.56787109375, -1.386474609375, -1.205078125, -1.023681640625, -0.84228515625, -0.660888671875, -0.4794921875, -0.298095703125, -0.11669921875, 0.064697265625, 0.24609375, 0.427490234375, 0.60888671875, 0.790283203125, 0.9716796875, 1.153076171875, 1.33447265625, 1.515869140625, 1.697265625, 1.878662109375, 2.06005859375, 2.241455078125, 2.4228515625, 2.604248046875, 2.78564453125, 2.967041015625, 3.1484375, 3.329833984375, 3.51123046875, 3.692626953125, 3.8740234375, 4.055419921875, 4.23681640625, 4.418212890625, 4.599609375, 4.781005859375, 4.96240234375, 5.143798828125, 5.3251953125, 5.506591796875, 5.68798828125, 5.869384765625, 6.05078125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 3.0, 6.0, 12.0, 8.0, 10.0, 15.0, 9.0, 24.0, 18.0, 15.0, 18.0, 36.0, 34.0, 45.0, 42.0, 40.0, 34.0, 45.0, 176.0, 44.0, 44.0, 57.0, 38.0, 37.0, 35.0, 23.0, 18.0, 11.0, 11.0, 14.0, 15.0, 9.0, 8.0, 8.0, 6.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5760955810546875, -0.555023193359375, -0.5339508056640625, -0.51287841796875, -0.4918060302734375, -0.470733642578125, -0.4496612548828125, -0.4285888671875, -0.4075164794921875, -0.386444091796875, -0.3653717041015625, -0.34429931640625, -0.3232269287109375, -0.302154541015625, -0.2810821533203125, -0.260009765625, -0.2389373779296875, -0.217864990234375, -0.1967926025390625, -0.17572021484375, -0.1546478271484375, -0.133575439453125, -0.1125030517578125, -0.0914306640625, -0.0703582763671875, -0.049285888671875, -0.0282135009765625, -0.00714111328125, 0.0139312744140625, 0.035003662109375, 0.0560760498046875, 0.0771484375, 0.0982208251953125, 0.119293212890625, 0.1403656005859375, 0.16143798828125, 0.1825103759765625, 0.203582763671875, 0.2246551513671875, 0.2457275390625, 0.2667999267578125, 0.287872314453125, 0.3089447021484375, 0.33001708984375, 0.3510894775390625, 0.372161865234375, 0.3932342529296875, 0.414306640625, 0.4353790283203125, 0.456451416015625, 0.4775238037109375, 0.49859619140625, 0.5196685791015625, 0.540740966796875, 0.5618133544921875, 0.5828857421875, 0.6039581298828125, 0.625030517578125, 0.6461029052734375, 0.66717529296875, 0.6882476806640625, 0.709320068359375, 0.7303924560546875, 0.75146484375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 7.0, 7.0, 6.0, 10.0, 6.0, 11.0, 14.0, 13.0, 11.0, 12.0, 16.0, 26.0, 37.0, 47.0, 59.0, 94.0, 107.0, 307.0, 1046656.0, 517.0, 144.0, 93.0, 66.0, 56.0, 37.0, 38.0, 15.0, 16.0, 18.0, 24.0, 10.0, 15.0, 9.0, 8.0, 14.0, 5.0, 2.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.4375, -22.7802734375, -22.123046875, -21.4658203125, -20.80859375, -20.1513671875, -19.494140625, -18.8369140625, -18.1796875, -17.5224609375, -16.865234375, -16.2080078125, -15.55078125, -14.8935546875, -14.236328125, -13.5791015625, -12.921875, -12.2646484375, -11.607421875, -10.9501953125, -10.29296875, -9.6357421875, -8.978515625, -8.3212890625, -7.6640625, -7.0068359375, -6.349609375, -5.6923828125, -5.03515625, -4.3779296875, -3.720703125, -3.0634765625, -2.40625, -1.7490234375, -1.091796875, -0.4345703125, 0.22265625, 0.8798828125, 1.537109375, 2.1943359375, 2.8515625, 3.5087890625, 4.166015625, 4.8232421875, 5.48046875, 6.1376953125, 6.794921875, 7.4521484375, 8.109375, 8.7666015625, 9.423828125, 10.0810546875, 10.73828125, 11.3955078125, 12.052734375, 12.7099609375, 13.3671875, 14.0244140625, 14.681640625, 15.3388671875, 15.99609375, 16.6533203125, 17.310546875, 17.9677734375, 18.625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 251.0, 769.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7698224782943726, -0.8929613828659058, -0.016100287437438965, 0.8607608079910278, 1.7376219034194946, 2.614482879638672, 3.4913439750671387, 4.3682050704956055, 5.245066165924072, 6.121927261352539, 6.998788356781006, 7.875649452209473, 8.752510070800781, 9.629371643066406, 10.506233215332031, 11.38309383392334, 12.259955406188965, 13.136816024780273, 14.013677597045898, 14.890539169311523, 15.767399787902832, 16.64426040649414, 17.521121978759766, 18.39798355102539, 19.274843215942383, 20.151704788208008, 21.028564453125, 21.905426025390625, 22.78228759765625, 23.659149169921875, 24.5360107421875, 25.412870407104492, 26.28973388671875, 27.166595458984375, 28.04345703125, 28.920316696166992, 29.797178268432617, 30.674039840698242, 31.550899505615234, 32.42776107788086, 33.304622650146484, 34.18148422241211, 35.058345794677734, 35.93520736694336, 36.81206512451172, 37.688926696777344, 38.56578826904297, 39.442649841308594, 40.31951141357422, 41.196372985839844, 42.07323455810547, 42.950096130371094, 43.82695770263672, 44.70381546020508, 45.5806770324707, 46.45753860473633, 47.33440017700195, 48.21126174926758, 49.0881233215332, 49.96498489379883, 50.84184265136719, 51.71870422363281, 52.59556579589844, 53.47242736816406, 54.34928894042969]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 5.0, 7.0, 16.0, 16.0, 15.0, 16.0, 11.0, 24.0, 28.0, 27.0, 29.0, 36.0, 43.0, 35.0, 30.0, 49.0, 48.0, 32.0, 41.0, 36.0, 49.0, 45.0, 46.0, 34.0, 30.0, 29.0, 27.0, 29.0, 21.0, 21.0, 21.0, 23.0, 15.0, 15.0, 7.0, 7.0, 10.0, 3.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0], "bins": [-2.155302047729492, -2.0971593856811523, -2.0390167236328125, -1.9808741807937622, -1.9227315187454224, -1.864588975906372, -1.8064463138580322, -1.7483036518096924, -1.6901609897613525, -1.6320183277130127, -1.5738757848739624, -1.5157331228256226, -1.4575904607772827, -1.3994479179382324, -1.3413052558898926, -1.2831625938415527, -1.2250200510025024, -1.1668773889541626, -1.1087348461151123, -1.0505921840667725, -0.9924495220184326, -0.9343069195747375, -0.8761643171310425, -0.8180216550827026, -0.7598790526390076, -0.7017364501953125, -0.6435937881469727, -0.5854511857032776, -0.5273085832595825, -0.4691659212112427, -0.4110233187675476, -0.35288068652153015, -0.29473793506622314, -0.2365953028202057, -0.17845268547534943, -0.12031006813049316, -0.06216743588447571, -0.004024803638458252, 0.054117798805236816, 0.11226043105125427, 0.17040306329727173, 0.22854569554328918, 0.28668832778930664, 0.3448309302330017, 0.40297356247901917, 0.4611161947250366, 0.5192587971687317, 0.5774013996124268, 0.6355440616607666, 0.6936866641044617, 0.7518293261528015, 0.8099719285964966, 0.8681145906448364, 0.9262571930885315, 0.9843997955322266, 1.0425424575805664, 1.1006851196289062, 1.158827781677246, 1.2169703245162964, 1.2751129865646362, 1.333255648612976, 1.3913981914520264, 1.4495408535003662, 1.507683515548706, 1.5658260583877563]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 12.0, 4.0, 4.0, 9.0, 19.0, 13.0, 11.0, 21.0, 29.0, 35.0, 39.0, 41.0, 44.0, 50.0, 55.0, 63.0, 53.0, 64.0, 49.0, 55.0, 34.0, 50.0, 35.0, 27.0, 25.0, 27.0, 19.0, 20.0, 13.0, 11.0, 10.0, 12.0, 8.0, 12.0, 4.0, 7.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.09375, -34.85400390625, -33.6142578125, -32.37451171875, -31.134765625, -29.89501953125, -28.6552734375, -27.41552734375, -26.17578125, -24.93603515625, -23.6962890625, -22.45654296875, -21.216796875, -19.97705078125, -18.7373046875, -17.49755859375, -16.2578125, -15.01806640625, -13.7783203125, -12.53857421875, -11.298828125, -10.05908203125, -8.8193359375, -7.57958984375, -6.33984375, -5.10009765625, -3.8603515625, -2.62060546875, -1.380859375, -0.14111328125, 1.0986328125, 2.33837890625, 3.578125, 4.81787109375, 6.0576171875, 7.29736328125, 8.537109375, 9.77685546875, 11.0166015625, 12.25634765625, 13.49609375, 14.73583984375, 15.9755859375, 17.21533203125, 18.455078125, 19.69482421875, 20.9345703125, 22.17431640625, 23.4140625, 24.65380859375, 25.8935546875, 27.13330078125, 28.373046875, 29.61279296875, 30.8525390625, 32.09228515625, 33.33203125, 34.57177734375, 35.8115234375, 37.05126953125, 38.291015625, 39.53076171875, 40.7705078125, 42.01025390625, 43.25]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 4.0, 0.0, 3.0, 6.0, 2.0, 3.0, 10.0, 8.0, 20.0, 29.0, 38.0, 31.0, 45.0, 63.0, 107.0, 149.0, 204.0, 307.0, 580.0, 958.0, 1816.0, 3734.0, 8563.0, 22420.0, 76403.0, 482076.0, 352800.0, 63800.0, 19667.0, 7450.0, 3352.0, 1577.0, 815.0, 460.0, 310.0, 208.0, 133.0, 86.0, 61.0, 68.0, 49.0, 42.0, 23.0, 15.0, 13.0, 11.0, 9.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-30.375, -29.3251953125, -28.275390625, -27.2255859375, -26.17578125, -25.1259765625, -24.076171875, -23.0263671875, -21.9765625, -20.9267578125, -19.876953125, -18.8271484375, -17.77734375, -16.7275390625, -15.677734375, -14.6279296875, -13.578125, -12.5283203125, -11.478515625, -10.4287109375, -9.37890625, -8.3291015625, -7.279296875, -6.2294921875, -5.1796875, -4.1298828125, -3.080078125, -2.0302734375, -0.98046875, 0.0693359375, 1.119140625, 2.1689453125, 3.21875, 4.2685546875, 5.318359375, 6.3681640625, 7.41796875, 8.4677734375, 9.517578125, 10.5673828125, 11.6171875, 12.6669921875, 13.716796875, 14.7666015625, 15.81640625, 16.8662109375, 17.916015625, 18.9658203125, 20.015625, 21.0654296875, 22.115234375, 23.1650390625, 24.21484375, 25.2646484375, 26.314453125, 27.3642578125, 28.4140625, 29.4638671875, 30.513671875, 31.5634765625, 32.61328125, 33.6630859375, 34.712890625, 35.7626953125, 36.8125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 15.0, 6.0, 12.0, 10.0, 14.0, 20.0, 23.0, 29.0, 33.0, 26.0, 28.0, 35.0, 47.0, 41.0, 39.0, 41.0, 41.0, 69.0, 2047.0, 47.0, 41.0, 46.0, 31.0, 37.0, 28.0, 24.0, 24.0, 28.0, 26.0, 16.0, 20.0, 17.0, 15.0, 19.0, 12.0, 5.0, 7.0, 3.0, 0.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.0625, -118.9853515625, -114.908203125, -110.8310546875, -106.75390625, -102.6767578125, -98.599609375, -94.5224609375, -90.4453125, -86.3681640625, -82.291015625, -78.2138671875, -74.13671875, -70.0595703125, -65.982421875, -61.9052734375, -57.828125, -53.7509765625, -49.673828125, -45.5966796875, -41.51953125, -37.4423828125, -33.365234375, -29.2880859375, -25.2109375, -21.1337890625, -17.056640625, -12.9794921875, -8.90234375, -4.8251953125, -0.748046875, 3.3291015625, 7.40625, 11.4833984375, 15.560546875, 19.6376953125, 23.71484375, 27.7919921875, 31.869140625, 35.9462890625, 40.0234375, 44.1005859375, 48.177734375, 52.2548828125, 56.33203125, 60.4091796875, 64.486328125, 68.5634765625, 72.640625, 76.7177734375, 80.794921875, 84.8720703125, 88.94921875, 93.0263671875, 97.103515625, 101.1806640625, 105.2578125, 109.3349609375, 113.412109375, 117.4892578125, 121.56640625, 125.6435546875, 129.720703125, 133.7978515625, 137.875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 0.0, 3.0, 7.0, 4.0, 14.0, 19.0, 15.0, 18.0, 18.0, 20.0, 30.0, 41.0, 30.0, 41.0, 74.0, 102.0, 154.0, 325.0, 663.0, 1935.0, 3086531.0, 53201.0, 1145.0, 499.0, 236.0, 144.0, 96.0, 61.0, 47.0, 35.0, 34.0, 36.0, 25.0, 19.0, 13.0, 11.0, 11.0, 8.0, 13.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-305.0, -295.9765625, -286.953125, -277.9296875, -268.90625, -259.8828125, -250.859375, -241.8359375, -232.8125, -223.7890625, -214.765625, -205.7421875, -196.71875, -187.6953125, -178.671875, -169.6484375, -160.625, -151.6015625, -142.578125, -133.5546875, -124.53125, -115.5078125, -106.484375, -97.4609375, -88.4375, -79.4140625, -70.390625, -61.3671875, -52.34375, -43.3203125, -34.296875, -25.2734375, -16.25, -7.2265625, 1.796875, 10.8203125, 19.84375, 28.8671875, 37.890625, 46.9140625, 55.9375, 64.9609375, 73.984375, 83.0078125, 92.03125, 101.0546875, 110.078125, 119.1015625, 128.125, 137.1484375, 146.171875, 155.1953125, 164.21875, 173.2421875, 182.265625, 191.2890625, 200.3125, 209.3359375, 218.359375, 227.3828125, 236.40625, 245.4296875, 254.453125, 263.4765625, 272.5]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 89.0, 933.0], "bins": [-4926.447265625, -4848.41015625, -4770.373046875, -4692.3359375, -4614.298828125, -4536.26171875, -4458.224609375, -4380.1875, -4302.150390625, -4224.11328125, -4146.076171875, -4068.0390625, -3990.001953125, -3911.965087890625, -3833.927978515625, -3755.890869140625, -3677.85400390625, -3599.81689453125, -3521.77978515625, -3443.74267578125, -3365.70556640625, -3287.668701171875, -3209.631591796875, -3131.594482421875, -3053.557373046875, -2975.520263671875, -2897.483154296875, -2819.446044921875, -2741.4091796875, -2663.3720703125, -2585.3349609375, -2507.2978515625, -2429.2607421875, -2351.2236328125, -2273.1865234375, -2195.1494140625, -2117.1123046875, -2039.0753173828125, -1961.038330078125, -1883.001220703125, -1804.9642333984375, -1726.9271240234375, -1648.89013671875, -1570.85302734375, -1492.81591796875, -1414.77880859375, -1336.74169921875, -1258.7047119140625, -1180.6676025390625, -1102.6304931640625, -1024.593505859375, -946.556396484375, -868.519287109375, -790.482177734375, -712.4451293945312, -634.4080810546875, -556.3709106445312, -478.3338317871094, -400.2967529296875, -322.2596740722656, -244.22259521484375, -166.18551635742188, -88.1484375, -10.11138916015625, 67.92569732666016]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 18.0, 4.0, 14.0, 13.0, 16.0, 26.0, 20.0, 31.0, 29.0, 34.0, 35.0, 30.0, 36.0, 38.0, 38.0, 39.0, 45.0, 36.0, 44.0, 39.0, 49.0, 52.0, 33.0, 27.0, 41.0, 33.0, 22.0, 24.0, 15.0, 13.0, 15.0, 12.0, 12.0, 13.0, 8.0, 9.0, 5.0, 1.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-427.7646789550781, -413.6469421386719, -399.52923583984375, -385.4114990234375, -371.29376220703125, -357.1760559082031, -343.0583190917969, -328.94061279296875, -314.8228759765625, -300.70513916015625, -286.5874328613281, -272.4696960449219, -258.35198974609375, -244.2342529296875, -230.11651611328125, -215.99879455566406, -201.88107299804688, -187.7633514404297, -173.6456298828125, -159.52789306640625, -145.41017150878906, -131.29244995117188, -117.17472076416016, -103.05699157714844, -88.93927001953125, -74.82154846191406, -60.703819274902344, -46.58609390258789, -32.46836853027344, -18.35064697265625, -4.232917785644531, 9.884811401367188, 24.00250244140625, 38.1202278137207, 52.237953186035156, 66.35568237304688, 80.47340393066406, 94.59112548828125, 108.70885467529297, 122.82658386230469, 136.94430541992188, 151.06202697753906, 165.17974853515625, 179.2974853515625, 193.4152069091797, 207.53292846679688, 221.65066528320312, 235.7683868408203, 249.8861083984375, 264.00384521484375, 278.1215515136719, 292.2392883300781, 306.35699462890625, 320.4747314453125, 334.59246826171875, 348.710205078125, 362.8279113769531, 376.9456481933594, 391.0633544921875, 405.18109130859375, 419.298828125, 433.4165344238281, 447.5342712402344, 461.6519775390625, 475.76971435546875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 11.0, 7.0, 2.0, 14.0, 20.0, 10.0, 14.0, 21.0, 36.0, 40.0, 31.0, 45.0, 42.0, 48.0, 59.0, 62.0, 70.0, 49.0, 51.0, 49.0, 42.0, 48.0, 32.0, 19.0, 28.0, 27.0, 21.0, 15.0, 14.0, 10.0, 10.0, 11.0, 10.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.90625, -35.62646484375, -34.3466796875, -33.06689453125, -31.787109375, -30.50732421875, -29.2275390625, -27.94775390625, -26.66796875, -25.38818359375, -24.1083984375, -22.82861328125, -21.548828125, -20.26904296875, -18.9892578125, -17.70947265625, -16.4296875, -15.14990234375, -13.8701171875, -12.59033203125, -11.310546875, -10.03076171875, -8.7509765625, -7.47119140625, -6.19140625, -4.91162109375, -3.6318359375, -2.35205078125, -1.072265625, 0.20751953125, 1.4873046875, 2.76708984375, 4.046875, 5.32666015625, 6.6064453125, 7.88623046875, 9.166015625, 10.44580078125, 11.7255859375, 13.00537109375, 14.28515625, 15.56494140625, 16.8447265625, 18.12451171875, 19.404296875, 20.68408203125, 21.9638671875, 23.24365234375, 24.5234375, 25.80322265625, 27.0830078125, 28.36279296875, 29.642578125, 30.92236328125, 32.2021484375, 33.48193359375, 34.76171875, 36.04150390625, 37.3212890625, 38.60107421875, 39.880859375, 41.16064453125, 42.4404296875, 43.72021484375, 45.0]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 18.0, 15.0, 10.0, 26.0, 38.0, 41.0, 58.0, 82.0, 139.0, 171.0, 326.0, 472.0, 800.0, 1302.0, 2265.0, 4041.0, 7636.0, 16458.0, 57762.0, 1159893.0, 2806168.0, 95094.0, 19781.0, 9216.0, 4989.0, 2833.0, 1665.0, 1079.0, 637.0, 414.0, 259.0, 173.0, 105.0, 84.0, 53.0, 40.0, 34.0, 28.0, 19.0, 13.0, 9.0, 9.0, 10.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-125.6875, -122.1083984375, -118.529296875, -114.9501953125, -111.37109375, -107.7919921875, -104.212890625, -100.6337890625, -97.0546875, -93.4755859375, -89.896484375, -86.3173828125, -82.73828125, -79.1591796875, -75.580078125, -72.0009765625, -68.421875, -64.8427734375, -61.263671875, -57.6845703125, -54.10546875, -50.5263671875, -46.947265625, -43.3681640625, -39.7890625, -36.2099609375, -32.630859375, -29.0517578125, -25.47265625, -21.8935546875, -18.314453125, -14.7353515625, -11.15625, -7.5771484375, -3.998046875, -0.4189453125, 3.16015625, 6.7392578125, 10.318359375, 13.8974609375, 17.4765625, 21.0556640625, 24.634765625, 28.2138671875, 31.79296875, 35.3720703125, 38.951171875, 42.5302734375, 46.109375, 49.6884765625, 53.267578125, 56.8466796875, 60.42578125, 64.0048828125, 67.583984375, 71.1630859375, 74.7421875, 78.3212890625, 81.900390625, 85.4794921875, 89.05859375, 92.6376953125, 96.216796875, 99.7958984375, 103.375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 3.0, 3.0, 12.0, 12.0, 14.0, 23.0, 25.0, 38.0, 49.0, 57.0, 83.0, 118.0, 163.0, 297.0, 543.0, 888.0, 683.0, 370.0, 206.0, 136.0, 98.0, 67.0, 50.0, 36.0, 16.0, 15.0, 14.0, 8.0, 12.0, 6.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-118.9375, -114.7939453125, -110.650390625, -106.5068359375, -102.36328125, -98.2197265625, -94.076171875, -89.9326171875, -85.7890625, -81.6455078125, -77.501953125, -73.3583984375, -69.21484375, -65.0712890625, -60.927734375, -56.7841796875, -52.640625, -48.4970703125, -44.353515625, -40.2099609375, -36.06640625, -31.9228515625, -27.779296875, -23.6357421875, -19.4921875, -15.3486328125, -11.205078125, -7.0615234375, -2.91796875, 1.2255859375, 5.369140625, 9.5126953125, 13.65625, 17.7998046875, 21.943359375, 26.0869140625, 30.23046875, 34.3740234375, 38.517578125, 42.6611328125, 46.8046875, 50.9482421875, 55.091796875, 59.2353515625, 63.37890625, 67.5224609375, 71.666015625, 75.8095703125, 79.953125, 84.0966796875, 88.240234375, 92.3837890625, 96.52734375, 100.6708984375, 104.814453125, 108.9580078125, 113.1015625, 117.2451171875, 121.388671875, 125.5322265625, 129.67578125, 133.8193359375, 137.962890625, 142.1064453125, 146.25]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 10.0, 10.0, 11.0, 20.0, 27.0, 45.0, 77.0, 102.0, 209.0, 396.0, 757.0, 1661.0, 4227.0, 12525.0, 48051.0, 3179239.0, 890164.0, 39170.0, 10715.0, 3771.0, 1489.0, 734.0, 369.0, 176.0, 107.0, 73.0, 52.0, 29.0, 15.0, 16.0, 9.0, 2.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-356.0, -344.8515625, -333.703125, -322.5546875, -311.40625, -300.2578125, -289.109375, -277.9609375, -266.8125, -255.6640625, -244.515625, -233.3671875, -222.21875, -211.0703125, -199.921875, -188.7734375, -177.625, -166.4765625, -155.328125, -144.1796875, -133.03125, -121.8828125, -110.734375, -99.5859375, -88.4375, -77.2890625, -66.140625, -54.9921875, -43.84375, -32.6953125, -21.546875, -10.3984375, 0.75, 11.8984375, 23.046875, 34.1953125, 45.34375, 56.4921875, 67.640625, 78.7890625, 89.9375, 101.0859375, 112.234375, 123.3828125, 134.53125, 145.6796875, 156.828125, 167.9765625, 179.125, 190.2734375, 201.421875, 212.5703125, 223.71875, 234.8671875, 246.015625, 257.1640625, 268.3125, 279.4609375, 290.609375, 301.7578125, 312.90625, 324.0546875, 335.203125, 346.3515625, 357.5]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 7.0, 14.0, 37.0, 70.0, 175.0, 395.0, 174.0, 81.0, 23.0, 18.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1845.301025390625, -1810.799560546875, -1776.2979736328125, -1741.79638671875, -1707.294921875, -1672.79345703125, -1638.2918701171875, -1603.790283203125, -1569.288818359375, -1534.787353515625, -1500.2857666015625, -1465.7841796875, -1431.28271484375, -1396.78125, -1362.2796630859375, -1327.778076171875, -1293.276611328125, -1258.775146484375, -1224.2735595703125, -1189.77197265625, -1155.2705078125, -1120.76904296875, -1086.2674560546875, -1051.765869140625, -1017.264404296875, -982.7628784179688, -948.2613525390625, -913.7598266601562, -879.25830078125, -844.7567749023438, -810.2552490234375, -775.7537231445312, -741.2521362304688, -706.7506103515625, -672.2490844726562, -637.74755859375, -603.2460327148438, -568.7445068359375, -534.2429809570312, -499.741455078125, -465.23992919921875, -430.7384033203125, -396.23687744140625, -361.7353515625, -327.23382568359375, -292.7322998046875, -258.23077392578125, -223.729248046875, -189.22772216796875, -154.7261962890625, -120.22467041015625, -85.72314453125, -51.22161865234375, -16.7200927734375, 17.78143310546875, 52.282958984375, 86.78448486328125, 121.2860107421875, 155.78753662109375, 190.2890625, 224.79058837890625, 259.2921142578125, 293.79364013671875, 328.295166015625, 362.79669189453125]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 4.0, 10.0, 6.0, 5.0, 17.0, 13.0, 15.0, 13.0, 15.0, 13.0, 18.0, 24.0, 26.0, 47.0, 23.0, 29.0, 37.0, 38.0, 34.0, 38.0, 31.0, 44.0, 42.0, 40.0, 28.0, 31.0, 32.0, 28.0, 25.0, 28.0, 34.0, 23.0, 23.0, 18.0, 22.0, 28.0, 14.0, 17.0, 11.0, 10.0, 5.0, 10.0, 4.0, 6.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-365.4508361816406, -354.922607421875, -344.3944091796875, -333.8661804199219, -323.3379821777344, -312.80975341796875, -302.28155517578125, -291.7533264160156, -281.22509765625, -270.6968688964844, -260.1686706542969, -249.6404571533203, -239.11224365234375, -228.58401489257812, -218.05580139160156, -207.527587890625, -196.9993896484375, -186.47117614746094, -175.94296264648438, -165.4147491455078, -154.88653564453125, -144.35830688476562, -133.83009338378906, -123.3018798828125, -112.77366638183594, -102.24545288085938, -91.71723937988281, -81.18901824951172, -70.66080474853516, -60.132591247558594, -49.604373931884766, -39.07615661621094, -28.54791259765625, -18.019697189331055, -7.491481781005859, 3.036733627319336, 13.564949035644531, 24.093162536621094, 34.62137985229492, 45.14959716796875, 55.67781066894531, 66.20602416992188, 76.73423767089844, 87.26245880126953, 97.7906723022461, 108.31888580322266, 118.84710693359375, 129.3753204345703, 139.90353393554688, 150.43174743652344, 160.9599609375, 171.48817443847656, 182.01638793945312, 192.54461669921875, 203.0728302001953, 213.60104370117188, 224.12925720214844, 234.657470703125, 245.18568420410156, 255.71389770507812, 266.24212646484375, 276.77032470703125, 287.2985534667969, 297.8267822265625, 308.35498046875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 10.0, 5.0, 4.0, 13.0, 12.0, 13.0, 20.0, 20.0, 17.0, 27.0, 33.0, 34.0, 46.0, 47.0, 56.0, 67.0, 64.0, 57.0, 40.0, 57.0, 53.0, 39.0, 35.0, 31.0, 28.0, 27.0, 28.0, 20.0, 8.0, 21.0, 7.0, 17.0, 11.0, 8.0, 6.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.9375, -38.5888671875, -37.240234375, -35.8916015625, -34.54296875, -33.1943359375, -31.845703125, -30.4970703125, -29.1484375, -27.7998046875, -26.451171875, -25.1025390625, -23.75390625, -22.4052734375, -21.056640625, -19.7080078125, -18.359375, -17.0107421875, -15.662109375, -14.3134765625, -12.96484375, -11.6162109375, -10.267578125, -8.9189453125, -7.5703125, -6.2216796875, -4.873046875, -3.5244140625, -2.17578125, -0.8271484375, 0.521484375, 1.8701171875, 3.21875, 4.5673828125, 5.916015625, 7.2646484375, 8.61328125, 9.9619140625, 11.310546875, 12.6591796875, 14.0078125, 15.3564453125, 16.705078125, 18.0537109375, 19.40234375, 20.7509765625, 22.099609375, 23.4482421875, 24.796875, 26.1455078125, 27.494140625, 28.8427734375, 30.19140625, 31.5400390625, 32.888671875, 34.2373046875, 35.5859375, 36.9345703125, 38.283203125, 39.6318359375, 40.98046875, 42.3291015625, 43.677734375, 45.0263671875, 46.375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 10.0, 9.0, 12.0, 15.0, 13.0, 22.0, 35.0, 61.0, 64.0, 93.0, 92.0, 155.0, 200.0, 288.0, 415.0, 653.0, 934.0, 1702.0, 3028.0, 6468.0, 17642.0, 115315.0, 793041.0, 79881.0, 15193.0, 5763.0, 2850.0, 1589.0, 962.0, 593.0, 392.0, 273.0, 228.0, 140.0, 123.0, 63.0, 66.0, 40.0, 37.0, 26.0, 24.0, 15.0, 6.0, 6.0, 10.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-23.359375, -22.66064453125, -21.9619140625, -21.26318359375, -20.564453125, -19.86572265625, -19.1669921875, -18.46826171875, -17.76953125, -17.07080078125, -16.3720703125, -15.67333984375, -14.974609375, -14.27587890625, -13.5771484375, -12.87841796875, -12.1796875, -11.48095703125, -10.7822265625, -10.08349609375, -9.384765625, -8.68603515625, -7.9873046875, -7.28857421875, -6.58984375, -5.89111328125, -5.1923828125, -4.49365234375, -3.794921875, -3.09619140625, -2.3974609375, -1.69873046875, -1.0, -0.30126953125, 0.3974609375, 1.09619140625, 1.794921875, 2.49365234375, 3.1923828125, 3.89111328125, 4.58984375, 5.28857421875, 5.9873046875, 6.68603515625, 7.384765625, 8.08349609375, 8.7822265625, 9.48095703125, 10.1796875, 10.87841796875, 11.5771484375, 12.27587890625, 12.974609375, 13.67333984375, 14.3720703125, 15.07080078125, 15.76953125, 16.46826171875, 17.1669921875, 17.86572265625, 18.564453125, 19.26318359375, 19.9619140625, 20.66064453125, 21.359375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 6.0, 8.0, 8.0, 13.0, 14.0, 11.0, 16.0, 16.0, 20.0, 23.0, 22.0, 28.0, 20.0, 38.0, 37.0, 42.0, 45.0, 51.0, 42.0, 1068.0, 43.0, 39.0, 38.0, 41.0, 30.0, 39.0, 36.0, 26.0, 30.0, 38.0, 23.0, 18.0, 16.0, 9.0, 12.0, 13.0, 5.0, 11.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.9033203125, -19.150390625, -18.3974609375, -17.64453125, -16.8916015625, -16.138671875, -15.3857421875, -14.6328125, -13.8798828125, -13.126953125, -12.3740234375, -11.62109375, -10.8681640625, -10.115234375, -9.3623046875, -8.609375, -7.8564453125, -7.103515625, -6.3505859375, -5.59765625, -4.8447265625, -4.091796875, -3.3388671875, -2.5859375, -1.8330078125, -1.080078125, -0.3271484375, 0.42578125, 1.1787109375, 1.931640625, 2.6845703125, 3.4375, 4.1904296875, 4.943359375, 5.6962890625, 6.44921875, 7.2021484375, 7.955078125, 8.7080078125, 9.4609375, 10.2138671875, 10.966796875, 11.7197265625, 12.47265625, 13.2255859375, 13.978515625, 14.7314453125, 15.484375, 16.2373046875, 16.990234375, 17.7431640625, 18.49609375, 19.2490234375, 20.001953125, 20.7548828125, 21.5078125, 22.2607421875, 23.013671875, 23.7666015625, 24.51953125, 25.2724609375, 26.025390625, 26.7783203125, 27.53125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 4.0, 15.0, 13.0, 30.0, 32.0, 53.0, 55.0, 81.0, 124.0, 192.0, 313.0, 435.0, 644.0, 970.0, 1410.0, 2340.0, 4215.0, 7722.0, 15397.0, 36596.0, 112409.0, 1426430.0, 352622.0, 78627.0, 28164.0, 12291.0, 6347.0, 3682.0, 2060.0, 1233.0, 853.0, 521.0, 380.0, 245.0, 163.0, 137.0, 89.0, 60.0, 50.0, 37.0, 31.0, 17.0, 11.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.53125, -6.33245849609375, -6.1336669921875, -5.93487548828125, -5.736083984375, -5.53729248046875, -5.3385009765625, -5.13970947265625, -4.94091796875, -4.74212646484375, -4.5433349609375, -4.34454345703125, -4.145751953125, -3.94696044921875, -3.7481689453125, -3.54937744140625, -3.3505859375, -3.15179443359375, -2.9530029296875, -2.75421142578125, -2.555419921875, -2.35662841796875, -2.1578369140625, -1.95904541015625, -1.76025390625, -1.56146240234375, -1.3626708984375, -1.16387939453125, -0.965087890625, -0.76629638671875, -0.5675048828125, -0.36871337890625, -0.169921875, 0.02886962890625, 0.2276611328125, 0.42645263671875, 0.625244140625, 0.82403564453125, 1.0228271484375, 1.22161865234375, 1.42041015625, 1.61920166015625, 1.8179931640625, 2.01678466796875, 2.215576171875, 2.41436767578125, 2.6131591796875, 2.81195068359375, 3.0107421875, 3.20953369140625, 3.4083251953125, 3.60711669921875, 3.805908203125, 4.00469970703125, 4.2034912109375, 4.40228271484375, 4.60107421875, 4.79986572265625, 4.9986572265625, 5.19744873046875, 5.396240234375, 5.59503173828125, 5.7938232421875, 5.99261474609375, 6.19140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 12.0, 10.0, 19.0, 27.0, 25.0, 29.0, 43.0, 61.0, 103.0, 121.0, 156.0, 101.0, 62.0, 45.0, 28.0, 26.0, 23.0, 23.0, 12.0, 6.0, 6.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6525726318359375, -0.630828857421875, -0.6090850830078125, -0.58734130859375, -0.5655975341796875, -0.543853759765625, -0.5221099853515625, -0.5003662109375, -0.4786224365234375, -0.456878662109375, -0.4351348876953125, -0.41339111328125, -0.3916473388671875, -0.369903564453125, -0.3481597900390625, -0.326416015625, -0.3046722412109375, -0.282928466796875, -0.2611846923828125, -0.23944091796875, -0.2176971435546875, -0.195953369140625, -0.1742095947265625, -0.1524658203125, -0.1307220458984375, -0.108978271484375, -0.0872344970703125, -0.06549072265625, -0.0437469482421875, -0.022003173828125, -0.0002593994140625, 0.021484375, 0.0432281494140625, 0.064971923828125, 0.0867156982421875, 0.10845947265625, 0.1302032470703125, 0.151947021484375, 0.1736907958984375, 0.1954345703125, 0.2171783447265625, 0.238922119140625, 0.2606658935546875, 0.28240966796875, 0.3041534423828125, 0.325897216796875, 0.3476409912109375, 0.369384765625, 0.3911285400390625, 0.412872314453125, 0.4346160888671875, 0.45635986328125, 0.4781036376953125, 0.499847412109375, 0.5215911865234375, 0.5433349609375, 0.5650787353515625, 0.586822509765625, 0.6085662841796875, 0.63031005859375, 0.6520538330078125, 0.673797607421875, 0.6955413818359375, 0.71728515625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 6.0, 5.0, 7.0, 9.0, 26.0, 18.0, 30.0, 39.0, 48.0, 86.0, 174.0, 588.0, 1046877.0, 248.0, 126.0, 55.0, 46.0, 25.0, 29.0, 15.0, 21.0, 9.0, 13.0, 9.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.59375, -21.9140625, -21.234375, -20.5546875, -19.875, -19.1953125, -18.515625, -17.8359375, -17.15625, -16.4765625, -15.796875, -15.1171875, -14.4375, -13.7578125, -13.078125, -12.3984375, -11.71875, -11.0390625, -10.359375, -9.6796875, -9.0, -8.3203125, -7.640625, -6.9609375, -6.28125, -5.6015625, -4.921875, -4.2421875, -3.5625, -2.8828125, -2.203125, -1.5234375, -0.84375, -0.1640625, 0.515625, 1.1953125, 1.875, 2.5546875, 3.234375, 3.9140625, 4.59375, 5.2734375, 5.953125, 6.6328125, 7.3125, 7.9921875, 8.671875, 9.3515625, 10.03125, 10.7109375, 11.390625, 12.0703125, 12.75, 13.4296875, 14.109375, 14.7890625, 15.46875, 16.1484375, 16.828125, 17.5078125, 18.1875, 18.8671875, 19.546875, 20.2265625, 20.90625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [413.0, 609.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49994513392448425, -0.004762709140777588, 0.4904197156429291, 0.9856021404266357, 1.48078453540802, 1.9759669303894043, 2.471149444580078, 2.966331720352173, 3.4615142345428467, 3.9566967487335205, 4.451879024505615, 4.947061538696289, 5.442244052886963, 5.937426567077637, 6.432608604431152, 6.927791118621826, 7.4229736328125, 7.918156147003174, 8.413338661193848, 8.908520698547363, 9.403703689575195, 9.898885726928711, 10.394067764282227, 10.889250755310059, 11.384432792663574, 11.87961483001709, 12.374797821044922, 12.869979858398438, 13.36516284942627, 13.860344886779785, 14.355527877807617, 14.850709915161133, 15.345892906188965, 15.84107494354248, 16.336257934570312, 16.831439971923828, 17.326622009277344, 17.82180404663086, 18.316987991333008, 18.812170028686523, 19.30735206604004, 19.802534103393555, 20.29771614074707, 20.79290008544922, 21.288082122802734, 21.78326416015625, 22.278446197509766, 22.77362823486328, 23.26881217956543, 23.763994216918945, 24.25917625427246, 24.75436019897461, 25.249542236328125, 25.74472427368164, 26.239906311035156, 26.735088348388672, 27.230270385742188, 27.725452423095703, 28.22063446044922, 28.715818405151367, 29.211000442504883, 29.7061824798584, 30.201364517211914, 30.69654655456543, 31.191730499267578]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 11.0, 7.0, 6.0, 12.0, 15.0, 15.0, 16.0, 25.0, 13.0, 17.0, 24.0, 30.0, 38.0, 36.0, 21.0, 33.0, 38.0, 41.0, 36.0, 32.0, 44.0, 49.0, 33.0, 31.0, 33.0, 36.0, 25.0, 22.0, 25.0, 25.0, 28.0, 25.0, 21.0, 22.0, 19.0, 12.0, 14.0, 9.0, 14.0, 5.0, 6.0, 3.0, 7.0, 1.0, 3.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.2812654972076416, -1.2406190633773804, -1.1999726295471191, -1.1593260765075684, -1.1186796426773071, -1.078033208847046, -1.0373867750167847, -0.9967403411865234, -0.9560938477516174, -0.9154474139213562, -0.8748009204864502, -0.834154486656189, -0.7935080528259277, -0.7528615593910217, -0.7122151255607605, -0.6715686321258545, -0.6309221982955933, -0.590275764465332, -0.549629271030426, -0.5089828372001648, -0.4683363735675812, -0.42768990993499756, -0.38704347610473633, -0.3463970124721527, -0.3057505488395691, -0.2651040852069855, -0.22445763647556305, -0.18381118774414062, -0.143164724111557, -0.10251826047897339, -0.061871811747550964, -0.02122536301612854, 0.019420981407165527, 0.06006743758916855, 0.10071389377117157, 0.141360342502594, 0.1820068061351776, 0.22265326976776123, 0.26329970359802246, 0.3039461672306061, 0.3445926308631897, 0.3852390944957733, 0.42588555812835693, 0.46653199195861816, 0.5071784257888794, 0.5478249192237854, 0.5884713530540466, 0.6291178464889526, 0.6697642803192139, 0.7104107141494751, 0.7510572075843811, 0.7917036414146423, 0.8323501348495483, 0.8729965686798096, 0.9136430025100708, 0.954289436340332, 0.994935929775238, 1.035582423210144, 1.0762288570404053, 1.1168752908706665, 1.1575217247009277, 1.1981682777404785, 1.2388147115707397, 1.279461145401001, 1.3201075792312622]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 10.0, 5.0, 4.0, 13.0, 12.0, 13.0, 20.0, 20.0, 17.0, 27.0, 33.0, 34.0, 46.0, 47.0, 56.0, 67.0, 64.0, 57.0, 40.0, 57.0, 53.0, 39.0, 35.0, 31.0, 28.0, 27.0, 28.0, 20.0, 8.0, 21.0, 7.0, 17.0, 11.0, 8.0, 6.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.9375, -38.5888671875, -37.240234375, -35.8916015625, -34.54296875, -33.1943359375, -31.845703125, -30.4970703125, -29.1484375, -27.7998046875, -26.451171875, -25.1025390625, -23.75390625, -22.4052734375, -21.056640625, -19.7080078125, -18.359375, -17.0107421875, -15.662109375, -14.3134765625, -12.96484375, -11.6162109375, -10.267578125, -8.9189453125, -7.5703125, -6.2216796875, -4.873046875, -3.5244140625, -2.17578125, -0.8271484375, 0.521484375, 1.8701171875, 3.21875, 4.5673828125, 5.916015625, 7.2646484375, 8.61328125, 9.9619140625, 11.310546875, 12.6591796875, 14.0078125, 15.3564453125, 16.705078125, 18.0537109375, 19.40234375, 20.7509765625, 22.099609375, 23.4482421875, 24.796875, 26.1455078125, 27.494140625, 28.8427734375, 30.19140625, 31.5400390625, 32.888671875, 34.2373046875, 35.5859375, 36.9345703125, 38.283203125, 39.6318359375, 40.98046875, 42.3291015625, 43.677734375, 45.0263671875, 46.375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 8.0, 8.0, 17.0, 22.0, 29.0, 30.0, 58.0, 97.0, 167.0, 240.0, 466.0, 824.0, 1519.0, 3293.0, 6824.0, 16059.0, 43105.0, 148433.0, 542751.0, 196281.0, 53491.0, 19209.0, 8142.0, 3552.0, 1809.0, 923.0, 452.0, 286.0, 168.0, 93.0, 53.0, 40.0, 28.0, 23.0, 19.0, 9.0, 3.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.765625, -20.06396484375, -19.3623046875, -18.66064453125, -17.958984375, -17.25732421875, -16.5556640625, -15.85400390625, -15.15234375, -14.45068359375, -13.7490234375, -13.04736328125, -12.345703125, -11.64404296875, -10.9423828125, -10.24072265625, -9.5390625, -8.83740234375, -8.1357421875, -7.43408203125, -6.732421875, -6.03076171875, -5.3291015625, -4.62744140625, -3.92578125, -3.22412109375, -2.5224609375, -1.82080078125, -1.119140625, -0.41748046875, 0.2841796875, 0.98583984375, 1.6875, 2.38916015625, 3.0908203125, 3.79248046875, 4.494140625, 5.19580078125, 5.8974609375, 6.59912109375, 7.30078125, 8.00244140625, 8.7041015625, 9.40576171875, 10.107421875, 10.80908203125, 11.5107421875, 12.21240234375, 12.9140625, 13.61572265625, 14.3173828125, 15.01904296875, 15.720703125, 16.42236328125, 17.1240234375, 17.82568359375, 18.52734375, 19.22900390625, 19.9306640625, 20.63232421875, 21.333984375, 22.03564453125, 22.7373046875, 23.43896484375, 24.140625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 7.0, 8.0, 10.0, 13.0, 13.0, 12.0, 12.0, 15.0, 22.0, 16.0, 24.0, 23.0, 42.0, 34.0, 27.0, 36.0, 42.0, 38.0, 36.0, 60.0, 2001.0, 102.0, 49.0, 30.0, 39.0, 33.0, 29.0, 32.0, 31.0, 31.0, 27.0, 19.0, 16.0, 16.0, 16.0, 16.0, 10.0, 13.0, 6.0, 10.0, 6.0, 5.0, 2.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0], "bins": [-142.125, -138.142578125, -134.16015625, -130.177734375, -126.1953125, -122.212890625, -118.23046875, -114.248046875, -110.265625, -106.283203125, -102.30078125, -98.318359375, -94.3359375, -90.353515625, -86.37109375, -82.388671875, -78.40625, -74.423828125, -70.44140625, -66.458984375, -62.4765625, -58.494140625, -54.51171875, -50.529296875, -46.546875, -42.564453125, -38.58203125, -34.599609375, -30.6171875, -26.634765625, -22.65234375, -18.669921875, -14.6875, -10.705078125, -6.72265625, -2.740234375, 1.2421875, 5.224609375, 9.20703125, 13.189453125, 17.171875, 21.154296875, 25.13671875, 29.119140625, 33.1015625, 37.083984375, 41.06640625, 45.048828125, 49.03125, 53.013671875, 56.99609375, 60.978515625, 64.9609375, 68.943359375, 72.92578125, 76.908203125, 80.890625, 84.873046875, 88.85546875, 92.837890625, 96.8203125, 100.802734375, 104.78515625, 108.767578125, 112.75]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 3.0, 5.0, 6.0, 9.0, 6.0, 14.0, 8.0, 14.0, 19.0, 18.0, 11.0, 21.0, 35.0, 48.0, 56.0, 86.0, 99.0, 166.0, 283.0, 500.0, 1036.0, 25152.0, 3112123.0, 3963.0, 756.0, 426.0, 252.0, 159.0, 96.0, 59.0, 62.0, 34.0, 27.0, 21.0, 25.0, 15.0, 12.0, 14.0, 10.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-193.125, -186.30859375, -179.4921875, -172.67578125, -165.859375, -159.04296875, -152.2265625, -145.41015625, -138.59375, -131.77734375, -124.9609375, -118.14453125, -111.328125, -104.51171875, -97.6953125, -90.87890625, -84.0625, -77.24609375, -70.4296875, -63.61328125, -56.796875, -49.98046875, -43.1640625, -36.34765625, -29.53125, -22.71484375, -15.8984375, -9.08203125, -2.265625, 4.55078125, 11.3671875, 18.18359375, 25.0, 31.81640625, 38.6328125, 45.44921875, 52.265625, 59.08203125, 65.8984375, 72.71484375, 79.53125, 86.34765625, 93.1640625, 99.98046875, 106.796875, 113.61328125, 120.4296875, 127.24609375, 134.0625, 140.87890625, 147.6953125, 154.51171875, 161.328125, 168.14453125, 174.9609375, 181.77734375, 188.59375, 195.41015625, 202.2265625, 209.04296875, 215.859375, 222.67578125, 229.4921875, 236.30859375, 243.125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 150.0, 818.0, 44.0, 2.0], "bins": [-1352.915771484375, -1330.8555908203125, -1308.7955322265625, -1286.7353515625, -1264.67529296875, -1242.6151123046875, -1220.554931640625, -1198.494873046875, -1176.4346923828125, -1154.37451171875, -1132.314453125, -1110.2542724609375, -1088.194091796875, -1066.134033203125, -1044.0738525390625, -1022.0137329101562, -999.95361328125, -977.8934936523438, -955.8333740234375, -933.773193359375, -911.7130737304688, -889.6529541015625, -867.5927734375, -845.5326538085938, -823.4725341796875, -801.4124145507812, -779.352294921875, -757.2921142578125, -735.2319946289062, -713.171875, -691.1116943359375, -669.0515747070312, -646.9913940429688, -624.9312744140625, -602.87109375, -580.8109741210938, -558.7508544921875, -536.6907348632812, -514.630615234375, -492.5704345703125, -470.5103454589844, -448.4501953125, -426.39007568359375, -404.3299560546875, -382.2698059082031, -360.20965576171875, -338.1495361328125, -316.08941650390625, -294.0292663574219, -271.9691162109375, -249.90899658203125, -227.84886169433594, -205.78872680664062, -183.7285919189453, -161.66845703125, -139.6083221435547, -117.54818725585938, -95.48805236816406, -73.42791748046875, -51.36778259277344, -29.307647705078125, -7.2475128173828125, 14.8126220703125, 36.87275695800781, 58.93289566040039]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 9.0, 13.0, 5.0, 11.0, 12.0, 11.0, 12.0, 25.0, 24.0, 29.0, 20.0, 31.0, 33.0, 44.0, 26.0, 40.0, 32.0, 56.0, 35.0, 48.0, 40.0, 40.0, 38.0, 31.0, 37.0, 38.0, 41.0, 30.0, 21.0, 22.0, 24.0, 15.0, 22.0, 11.0, 12.0, 16.0, 5.0, 7.0, 9.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-456.897705078125, -442.4989013671875, -428.10009765625, -413.7012939453125, -399.302490234375, -384.9036865234375, -370.5048828125, -356.1060791015625, -341.707275390625, -327.3084716796875, -312.90966796875, -298.5108642578125, -284.112060546875, -269.7132568359375, -255.314453125, -240.9156494140625, -226.51683044433594, -212.11802673339844, -197.71922302246094, -183.32041931152344, -168.92161560058594, -154.52279663085938, -140.12399291992188, -125.7251968383789, -111.3263931274414, -96.9275894165039, -82.5287857055664, -68.12997436523438, -53.73117446899414, -39.332366943359375, -24.933563232421875, -10.534759521484375, 3.864044189453125, 18.262847900390625, 32.661651611328125, 47.06045913696289, 61.45926284790039, 75.85807037353516, 90.25687408447266, 104.65567779541016, 119.05448150634766, 133.4532928466797, 147.8520965576172, 162.2509002685547, 176.6497039794922, 191.0485076904297, 205.4473114013672, 219.8461151123047, 234.2449188232422, 248.6437225341797, 263.04254150390625, 277.44134521484375, 291.84014892578125, 306.23895263671875, 320.63775634765625, 335.03656005859375, 349.43536376953125, 363.83416748046875, 378.23297119140625, 392.63177490234375, 407.03057861328125, 421.42938232421875, 435.82818603515625, 450.22698974609375, 464.62579345703125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 3.0, 13.0, 10.0, 12.0, 23.0, 21.0, 14.0, 22.0, 33.0, 38.0, 43.0, 40.0, 53.0, 60.0, 70.0, 53.0, 45.0, 47.0, 60.0, 34.0, 41.0, 33.0, 26.0, 31.0, 26.0, 24.0, 15.0, 13.0, 13.0, 13.0, 14.0, 10.0, 6.0, 6.0, 3.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.6875, -37.35205078125, -36.0166015625, -34.68115234375, -33.345703125, -32.01025390625, -30.6748046875, -29.33935546875, -28.00390625, -26.66845703125, -25.3330078125, -23.99755859375, -22.662109375, -21.32666015625, -19.9912109375, -18.65576171875, -17.3203125, -15.98486328125, -14.6494140625, -13.31396484375, -11.978515625, -10.64306640625, -9.3076171875, -7.97216796875, -6.63671875, -5.30126953125, -3.9658203125, -2.63037109375, -1.294921875, 0.04052734375, 1.3759765625, 2.71142578125, 4.046875, 5.38232421875, 6.7177734375, 8.05322265625, 9.388671875, 10.72412109375, 12.0595703125, 13.39501953125, 14.73046875, 16.06591796875, 17.4013671875, 18.73681640625, 20.072265625, 21.40771484375, 22.7431640625, 24.07861328125, 25.4140625, 26.74951171875, 28.0849609375, 29.42041015625, 30.755859375, 32.09130859375, 33.4267578125, 34.76220703125, 36.09765625, 37.43310546875, 38.7685546875, 40.10400390625, 41.439453125, 42.77490234375, 44.1103515625, 45.44580078125, 46.78125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 6.0, 13.0, 6.0, 30.0, 58.0, 109.0, 266.0, 537.0, 1191.0, 2902.0, 8685.0, 38719.0, 3865235.0, 252192.0, 15825.0, 4989.0, 1906.0, 842.0, 368.0, 177.0, 104.0, 35.0, 17.0, 8.0, 3.0, 3.0, 5.0, 6.0, 2.0, 3.0, 8.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-227.25, -219.853515625, -212.45703125, -205.060546875, -197.6640625, -190.267578125, -182.87109375, -175.474609375, -168.078125, -160.681640625, -153.28515625, -145.888671875, -138.4921875, -131.095703125, -123.69921875, -116.302734375, -108.90625, -101.509765625, -94.11328125, -86.716796875, -79.3203125, -71.923828125, -64.52734375, -57.130859375, -49.734375, -42.337890625, -34.94140625, -27.544921875, -20.1484375, -12.751953125, -5.35546875, 2.041015625, 9.4375, 16.833984375, 24.23046875, 31.626953125, 39.0234375, 46.419921875, 53.81640625, 61.212890625, 68.609375, 76.005859375, 83.40234375, 90.798828125, 98.1953125, 105.591796875, 112.98828125, 120.384765625, 127.78125, 135.177734375, 142.57421875, 149.970703125, 157.3671875, 164.763671875, 172.16015625, 179.556640625, 186.953125, 194.349609375, 201.74609375, 209.142578125, 216.5390625, 223.935546875, 231.33203125, 238.728515625, 246.125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 11.0, 6.0, 18.0, 18.0, 19.0, 17.0, 35.0, 62.0, 71.0, 124.0, 185.0, 356.0, 724.0, 1021.0, 581.0, 278.0, 158.0, 89.0, 75.0, 54.0, 42.0, 30.0, 17.0, 20.0, 9.0, 13.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.4375, -120.4697265625, -116.501953125, -112.5341796875, -108.56640625, -104.5986328125, -100.630859375, -96.6630859375, -92.6953125, -88.7275390625, -84.759765625, -80.7919921875, -76.82421875, -72.8564453125, -68.888671875, -64.9208984375, -60.953125, -56.9853515625, -53.017578125, -49.0498046875, -45.08203125, -41.1142578125, -37.146484375, -33.1787109375, -29.2109375, -25.2431640625, -21.275390625, -17.3076171875, -13.33984375, -9.3720703125, -5.404296875, -1.4365234375, 2.53125, 6.4990234375, 10.466796875, 14.4345703125, 18.40234375, 22.3701171875, 26.337890625, 30.3056640625, 34.2734375, 38.2412109375, 42.208984375, 46.1767578125, 50.14453125, 54.1123046875, 58.080078125, 62.0478515625, 66.015625, 69.9833984375, 73.951171875, 77.9189453125, 81.88671875, 85.8544921875, 89.822265625, 93.7900390625, 97.7578125, 101.7255859375, 105.693359375, 109.6611328125, 113.62890625, 117.5966796875, 121.564453125, 125.5322265625, 129.5]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 15.0, 12.0, 19.0, 28.0, 36.0, 51.0, 65.0, 102.0, 139.0, 238.0, 412.0, 801.0, 1535.0, 3423.0, 8628.0, 25426.0, 144956.0, 3886028.0, 88906.0, 20267.0, 7126.0, 2956.0, 1343.0, 701.0, 384.0, 233.0, 127.0, 90.0, 72.0, 38.0, 24.0, 26.0, 16.0, 9.0, 15.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-279.0, -269.51171875, -260.0234375, -250.53515625, -241.046875, -231.55859375, -222.0703125, -212.58203125, -203.09375, -193.60546875, -184.1171875, -174.62890625, -165.140625, -155.65234375, -146.1640625, -136.67578125, -127.1875, -117.69921875, -108.2109375, -98.72265625, -89.234375, -79.74609375, -70.2578125, -60.76953125, -51.28125, -41.79296875, -32.3046875, -22.81640625, -13.328125, -3.83984375, 5.6484375, 15.13671875, 24.625, 34.11328125, 43.6015625, 53.08984375, 62.578125, 72.06640625, 81.5546875, 91.04296875, 100.53125, 110.01953125, 119.5078125, 128.99609375, 138.484375, 147.97265625, 157.4609375, 166.94921875, 176.4375, 185.92578125, 195.4140625, 204.90234375, 214.390625, 223.87890625, 233.3671875, 242.85546875, 252.34375, 261.83203125, 271.3203125, 280.80859375, 290.296875, 299.78515625, 309.2734375, 318.76171875, 328.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 10.0, 13.0, 19.0, 35.0, 62.0, 88.0, 201.0, 257.0, 138.0, 76.0, 33.0, 21.0, 18.0, 7.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-953.1666259765625, -932.5780029296875, -911.9893798828125, -891.4008178710938, -870.8121948242188, -850.2235717773438, -829.6349487304688, -809.0463256835938, -788.457763671875, -767.869140625, -747.280517578125, -726.6919555664062, -706.1033325195312, -685.5147094726562, -664.9260864257812, -644.3374633789062, -623.7488403320312, -603.1602172851562, -582.5715942382812, -561.9830322265625, -541.3944091796875, -520.8057861328125, -500.2171630859375, -479.6285400390625, -459.0399475097656, -438.4513244628906, -417.86273193359375, -397.27410888671875, -376.68548583984375, -356.0968933105469, -335.5082702636719, -314.919677734375, -294.3310546875, -273.742431640625, -253.15383911132812, -232.56521606445312, -211.9766082763672, -191.38800048828125, -170.79937744140625, -150.2107696533203, -129.62216186523438, -109.03355407714844, -88.44493865966797, -67.8563232421875, -47.26771545410156, -26.679107666015625, -6.090492248535156, 14.498123168945312, 35.08673095703125, 55.67534255981445, 76.26395416259766, 96.85256958007812, 117.44117736816406, 138.02978515625, 158.618408203125, 179.20701599121094, 199.79562377929688, 220.3842315673828, 240.97283935546875, 261.56146240234375, 282.15008544921875, 302.7386779785156, 323.3273010253906, 343.9158935546875, 364.5045166015625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 3.0, 5.0, 16.0, 9.0, 9.0, 10.0, 18.0, 22.0, 15.0, 20.0, 18.0, 29.0, 30.0, 36.0, 36.0, 35.0, 45.0, 41.0, 28.0, 37.0, 45.0, 46.0, 42.0, 29.0, 45.0, 43.0, 36.0, 32.0, 32.0, 26.0, 20.0, 26.0, 20.0, 17.0, 14.0, 12.0, 9.0, 5.0, 5.0, 5.0, 6.0, 7.0, 1.0, 2.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.9327392578125, -316.22528076171875, -305.5177917480469, -294.8103332519531, -284.10284423828125, -273.3953857421875, -262.68792724609375, -251.98045349121094, -241.27297973632812, -230.5655059814453, -219.8580322265625, -209.15057373046875, -198.44309997558594, -187.73562622070312, -177.02816772460938, -166.32069396972656, -155.61322021484375, -144.90574645996094, -134.19827270507812, -123.49081420898438, -112.78334045410156, -102.07586669921875, -91.36840057373047, -80.66093444824219, -69.95346069335938, -59.24599075317383, -48.53852081298828, -37.831050872802734, -27.123580932617188, -16.41611099243164, -5.708641052246094, 4.9988250732421875, 15.706298828125, 26.413768768310547, 37.121238708496094, 47.82870864868164, 58.53617858886719, 69.24365234375, 79.95111846923828, 90.65858459472656, 101.36605834960938, 112.07353210449219, 122.78099822998047, 133.48846435546875, 144.19593811035156, 154.90341186523438, 165.61087036132812, 176.31834411621094, 187.02581787109375, 197.73329162597656, 208.44076538085938, 219.14822387695312, 229.85569763183594, 240.56317138671875, 251.2706298828125, 261.97808837890625, 272.6855773925781, 283.3930358886719, 294.10052490234375, 304.8079833984375, 315.51544189453125, 326.2229309082031, 336.9303894042969, 347.63787841796875, 358.3453369140625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 3.0, 2.0, 8.0, 10.0, 11.0, 18.0, 20.0, 19.0, 26.0, 30.0, 28.0, 23.0, 41.0, 51.0, 52.0, 40.0, 64.0, 49.0, 62.0, 45.0, 44.0, 42.0, 42.0, 39.0, 35.0, 31.0, 24.0, 24.0, 22.0, 14.0, 21.0, 8.0, 5.0, 10.0, 10.0, 6.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-43.4375, -42.04541015625, -40.6533203125, -39.26123046875, -37.869140625, -36.47705078125, -35.0849609375, -33.69287109375, -32.30078125, -30.90869140625, -29.5166015625, -28.12451171875, -26.732421875, -25.34033203125, -23.9482421875, -22.55615234375, -21.1640625, -19.77197265625, -18.3798828125, -16.98779296875, -15.595703125, -14.20361328125, -12.8115234375, -11.41943359375, -10.02734375, -8.63525390625, -7.2431640625, -5.85107421875, -4.458984375, -3.06689453125, -1.6748046875, -0.28271484375, 1.109375, 2.50146484375, 3.8935546875, 5.28564453125, 6.677734375, 8.06982421875, 9.4619140625, 10.85400390625, 12.24609375, 13.63818359375, 15.0302734375, 16.42236328125, 17.814453125, 19.20654296875, 20.5986328125, 21.99072265625, 23.3828125, 24.77490234375, 26.1669921875, 27.55908203125, 28.951171875, 30.34326171875, 31.7353515625, 33.12744140625, 34.51953125, 35.91162109375, 37.3037109375, 38.69580078125, 40.087890625, 41.47998046875, 42.8720703125, 44.26416015625, 45.65625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 13.0, 7.0, 12.0, 23.0, 23.0, 39.0, 52.0, 65.0, 76.0, 103.0, 144.0, 212.0, 281.0, 403.0, 547.0, 896.0, 1332.0, 2312.0, 4083.0, 8429.0, 23832.0, 109449.0, 656775.0, 183144.0, 33028.0, 10867.0, 4953.0, 2612.0, 1608.0, 983.0, 641.0, 453.0, 301.0, 237.0, 157.0, 126.0, 82.0, 62.0, 52.0, 45.0, 25.0, 19.0, 13.0, 13.0, 4.0, 7.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.7265625, -14.260986328125, -13.79541015625, -13.329833984375, -12.8642578125, -12.398681640625, -11.93310546875, -11.467529296875, -11.001953125, -10.536376953125, -10.07080078125, -9.605224609375, -9.1396484375, -8.674072265625, -8.20849609375, -7.742919921875, -7.27734375, -6.811767578125, -6.34619140625, -5.880615234375, -5.4150390625, -4.949462890625, -4.48388671875, -4.018310546875, -3.552734375, -3.087158203125, -2.62158203125, -2.156005859375, -1.6904296875, -1.224853515625, -0.75927734375, -0.293701171875, 0.171875, 0.637451171875, 1.10302734375, 1.568603515625, 2.0341796875, 2.499755859375, 2.96533203125, 3.430908203125, 3.896484375, 4.362060546875, 4.82763671875, 5.293212890625, 5.7587890625, 6.224365234375, 6.68994140625, 7.155517578125, 7.62109375, 8.086669921875, 8.55224609375, 9.017822265625, 9.4833984375, 9.948974609375, 10.41455078125, 10.880126953125, 11.345703125, 11.811279296875, 12.27685546875, 12.742431640625, 13.2080078125, 13.673583984375, 14.13916015625, 14.604736328125, 15.0703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 4.0, 1.0, 8.0, 11.0, 13.0, 18.0, 17.0, 23.0, 19.0, 37.0, 30.0, 36.0, 39.0, 39.0, 43.0, 38.0, 51.0, 49.0, 1069.0, 40.0, 51.0, 42.0, 31.0, 43.0, 45.0, 48.0, 28.0, 47.0, 20.0, 13.0, 20.0, 12.0, 12.0, 5.0, 13.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.0, -23.0341796875, -22.068359375, -21.1025390625, -20.13671875, -19.1708984375, -18.205078125, -17.2392578125, -16.2734375, -15.3076171875, -14.341796875, -13.3759765625, -12.41015625, -11.4443359375, -10.478515625, -9.5126953125, -8.546875, -7.5810546875, -6.615234375, -5.6494140625, -4.68359375, -3.7177734375, -2.751953125, -1.7861328125, -0.8203125, 0.1455078125, 1.111328125, 2.0771484375, 3.04296875, 4.0087890625, 4.974609375, 5.9404296875, 6.90625, 7.8720703125, 8.837890625, 9.8037109375, 10.76953125, 11.7353515625, 12.701171875, 13.6669921875, 14.6328125, 15.5986328125, 16.564453125, 17.5302734375, 18.49609375, 19.4619140625, 20.427734375, 21.3935546875, 22.359375, 23.3251953125, 24.291015625, 25.2568359375, 26.22265625, 27.1884765625, 28.154296875, 29.1201171875, 30.0859375, 31.0517578125, 32.017578125, 32.9833984375, 33.94921875, 34.9150390625, 35.880859375, 36.8466796875, 37.8125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 13.0, 14.0, 23.0, 45.0, 41.0, 68.0, 95.0, 119.0, 171.0, 231.0, 315.0, 496.0, 793.0, 1175.0, 2017.0, 3363.0, 6049.0, 11102.0, 23554.0, 54323.0, 139714.0, 1339248.0, 335449.0, 99037.0, 39948.0, 18282.0, 9020.0, 4814.0, 2691.0, 1680.0, 1094.0, 708.0, 439.0, 291.0, 187.0, 123.0, 118.0, 68.0, 63.0, 34.0, 28.0, 24.0, 11.0, 9.0, 11.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.47265625, -4.32757568359375, -4.1824951171875, -4.03741455078125, -3.892333984375, -3.74725341796875, -3.6021728515625, -3.45709228515625, -3.31201171875, -3.16693115234375, -3.0218505859375, -2.87677001953125, -2.731689453125, -2.58660888671875, -2.4415283203125, -2.29644775390625, -2.1513671875, -2.00628662109375, -1.8612060546875, -1.71612548828125, -1.571044921875, -1.42596435546875, -1.2808837890625, -1.13580322265625, -0.99072265625, -0.84564208984375, -0.7005615234375, -0.55548095703125, -0.410400390625, -0.26531982421875, -0.1202392578125, 0.02484130859375, 0.169921875, 0.31500244140625, 0.4600830078125, 0.60516357421875, 0.750244140625, 0.89532470703125, 1.0404052734375, 1.18548583984375, 1.33056640625, 1.47564697265625, 1.6207275390625, 1.76580810546875, 1.910888671875, 2.05596923828125, 2.2010498046875, 2.34613037109375, 2.4912109375, 2.63629150390625, 2.7813720703125, 2.92645263671875, 3.071533203125, 3.21661376953125, 3.3616943359375, 3.50677490234375, 3.65185546875, 3.79693603515625, 3.9420166015625, 4.08709716796875, 4.232177734375, 4.37725830078125, 4.5223388671875, 4.66741943359375, 4.8125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 7.0, 3.0, 13.0, 7.0, 11.0, 6.0, 17.0, 21.0, 16.0, 18.0, 21.0, 21.0, 36.0, 29.0, 31.0, 51.0, 72.0, 101.0, 101.0, 75.0, 61.0, 39.0, 34.0, 28.0, 24.0, 19.0, 24.0, 19.0, 18.0, 9.0, 2.0, 11.0, 6.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.453857421875, -0.4396781921386719, -0.42549896240234375, -0.4113197326660156, -0.3971405029296875, -0.3829612731933594, -0.36878204345703125, -0.3546028137207031, -0.340423583984375, -0.3262443542480469, -0.31206512451171875, -0.2978858947753906, -0.2837066650390625, -0.2695274353027344, -0.25534820556640625, -0.24116897583007812, -0.22698974609375, -0.21281051635742188, -0.19863128662109375, -0.18445205688476562, -0.1702728271484375, -0.15609359741210938, -0.14191436767578125, -0.12773513793945312, -0.113555908203125, -0.09937667846679688, -0.08519744873046875, -0.07101821899414062, -0.0568389892578125, -0.042659759521484375, -0.02848052978515625, -0.014301300048828125, -0.0001220703125, 0.014057159423828125, 0.02823638916015625, 0.042415618896484375, 0.0565948486328125, 0.07077407836914062, 0.08495330810546875, 0.09913253784179688, 0.113311767578125, 0.12749099731445312, 0.14167022705078125, 0.15584945678710938, 0.1700286865234375, 0.18420791625976562, 0.19838714599609375, 0.21256637573242188, 0.22674560546875, 0.24092483520507812, 0.25510406494140625, 0.2692832946777344, 0.2834625244140625, 0.2976417541503906, 0.31182098388671875, 0.3260002136230469, 0.340179443359375, 0.3543586730957031, 0.36853790283203125, 0.3827171325683594, 0.3968963623046875, 0.4110755920410156, 0.42525482177734375, 0.4394340515136719, 0.45361328125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 6.0, 13.0, 2.0, 10.0, 17.0, 18.0, 26.0, 19.0, 28.0, 33.0, 54.0, 74.0, 109.0, 192.0, 17887.0, 1029355.0, 203.0, 117.0, 80.0, 42.0, 43.0, 29.0, 19.0, 18.0, 18.0, 17.0, 20.0, 7.0, 8.0, 11.0, 8.0, 8.0, 5.0, 10.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.28125, -13.835693359375, -13.39013671875, -12.944580078125, -12.4990234375, -12.053466796875, -11.60791015625, -11.162353515625, -10.716796875, -10.271240234375, -9.82568359375, -9.380126953125, -8.9345703125, -8.489013671875, -8.04345703125, -7.597900390625, -7.15234375, -6.706787109375, -6.26123046875, -5.815673828125, -5.3701171875, -4.924560546875, -4.47900390625, -4.033447265625, -3.587890625, -3.142333984375, -2.69677734375, -2.251220703125, -1.8056640625, -1.360107421875, -0.91455078125, -0.468994140625, -0.0234375, 0.422119140625, 0.86767578125, 1.313232421875, 1.7587890625, 2.204345703125, 2.64990234375, 3.095458984375, 3.541015625, 3.986572265625, 4.43212890625, 4.877685546875, 5.3232421875, 5.768798828125, 6.21435546875, 6.659912109375, 7.10546875, 7.551025390625, 7.99658203125, 8.442138671875, 8.8876953125, 9.333251953125, 9.77880859375, 10.224365234375, 10.669921875, 11.115478515625, 11.56103515625, 12.006591796875, 12.4521484375, 12.897705078125, 13.34326171875, 13.788818359375, 14.234375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [873.0, 148.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32646626234054565, 0.021451056003570557, 0.36936837434768677, 0.717285692691803, 1.0652029514312744, 1.4131202697753906, 1.7610375881195068, 2.108954906463623, 2.4568722248077393, 2.8047895431518555, 3.1527068614959717, 3.500624179840088, 3.848541498184204, 4.19645881652832, 4.544376373291016, 4.892293453216553, 5.240211009979248, 5.588128089904785, 5.9360456466674805, 6.283963203430176, 6.631880283355713, 6.97979736328125, 7.327714920043945, 7.675632476806641, 8.02354907989502, 8.371466636657715, 8.719383239746094, 9.067300796508789, 9.415218353271484, 9.76313591003418, 10.111053466796875, 10.458970069885254, 10.806888580322266, 11.154806137084961, 11.502723693847656, 11.850640296936035, 12.19855785369873, 12.546475410461426, 12.894392013549805, 13.2423095703125, 13.590227127075195, 13.93814468383789, 14.286062240600586, 14.633978843688965, 14.98189640045166, 15.329813957214355, 15.677730560302734, 16.02564811706543, 16.373565673828125, 16.72148323059082, 17.069400787353516, 17.41731834411621, 17.765235900878906, 18.11315155029297, 18.461069107055664, 18.80898666381836, 19.156904220581055, 19.50482177734375, 19.852739334106445, 20.20065689086914, 20.548572540283203, 20.8964900970459, 21.244407653808594, 21.59232521057129, 21.940242767333984]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 10.0, 9.0, 13.0, 16.0, 10.0, 20.0, 17.0, 19.0, 25.0, 26.0, 32.0, 31.0, 33.0, 42.0, 24.0, 41.0, 39.0, 28.0, 32.0, 38.0, 37.0, 38.0, 35.0, 33.0, 25.0, 29.0, 32.0, 29.0, 32.0, 18.0, 23.0, 20.0, 14.0, 13.0, 19.0, 21.0, 15.0, 10.0, 6.0, 4.0, 9.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1879254579544067, -1.1490732431411743, -1.1102209091186523, -1.07136869430542, -1.032516360282898, -0.9936641454696655, -0.9548118710517883, -0.9159595966339111, -0.8771073222160339, -0.8382550477981567, -0.7994027733802795, -0.7605504989624023, -0.7216982841491699, -0.682845950126648, -0.6439937353134155, -0.6051414608955383, -0.5662891864776611, -0.5274369120597839, -0.48858463764190674, -0.44973239302635193, -0.41088011860847473, -0.37202784419059753, -0.3331755995750427, -0.2943233251571655, -0.25547105073928833, -0.21661877632141113, -0.17776651680469513, -0.13891425728797913, -0.10006198287010193, -0.06120970845222473, -0.022357448935508728, 0.016494810581207275, 0.05534708499908447, 0.09419935196638107, 0.13305161893367767, 0.17190387845039368, 0.21075615286827087, 0.24960842728614807, 0.2884606719017029, 0.3273129463195801, 0.3661652207374573, 0.4050174951553345, 0.44386976957321167, 0.4827220141887665, 0.5215742588043213, 0.5604265928268433, 0.5992788076400757, 0.6381310820579529, 0.6769833564758301, 0.7158356308937073, 0.7546879053115845, 0.7935401797294617, 0.8323924541473389, 0.8712446689605713, 0.9100969433784485, 0.9489492177963257, 0.9878014922142029, 1.02665376663208, 1.0655059814453125, 1.1043583154678345, 1.143210530281067, 1.1820628643035889, 1.2209150791168213, 1.2597672939300537, 1.2986196279525757]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 3.0, 2.0, 8.0, 10.0, 11.0, 18.0, 20.0, 19.0, 26.0, 30.0, 28.0, 23.0, 41.0, 51.0, 52.0, 40.0, 64.0, 49.0, 62.0, 45.0, 44.0, 42.0, 42.0, 39.0, 35.0, 31.0, 24.0, 24.0, 22.0, 14.0, 21.0, 8.0, 5.0, 10.0, 10.0, 6.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-43.4375, -42.04541015625, -40.6533203125, -39.26123046875, -37.869140625, -36.47705078125, -35.0849609375, -33.69287109375, -32.30078125, -30.90869140625, -29.5166015625, -28.12451171875, -26.732421875, -25.34033203125, -23.9482421875, -22.55615234375, -21.1640625, -19.77197265625, -18.3798828125, -16.98779296875, -15.595703125, -14.20361328125, -12.8115234375, -11.41943359375, -10.02734375, -8.63525390625, -7.2431640625, -5.85107421875, -4.458984375, -3.06689453125, -1.6748046875, -0.28271484375, 1.109375, 2.50146484375, 3.8935546875, 5.28564453125, 6.677734375, 8.06982421875, 9.4619140625, 10.85400390625, 12.24609375, 13.63818359375, 15.0302734375, 16.42236328125, 17.814453125, 19.20654296875, 20.5986328125, 21.99072265625, 23.3828125, 24.77490234375, 26.1669921875, 27.55908203125, 28.951171875, 30.34326171875, 31.7353515625, 33.12744140625, 34.51953125, 35.91162109375, 37.3037109375, 38.69580078125, 40.087890625, 41.47998046875, 42.8720703125, 44.26416015625, 45.65625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 2.0, 5.0, 10.0, 6.0, 20.0, 19.0, 30.0, 40.0, 72.0, 89.0, 141.0, 175.0, 251.0, 407.0, 628.0, 985.0, 1690.0, 3018.0, 5719.0, 11984.0, 27182.0, 71188.0, 240770.0, 462951.0, 137304.0, 46177.0, 18761.0, 8692.0, 4316.0, 2317.0, 1322.0, 791.0, 459.0, 324.0, 210.0, 161.0, 95.0, 67.0, 49.0, 29.0, 32.0, 19.0, 12.0, 7.0, 3.0, 10.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.40625, -16.849853515625, -16.29345703125, -15.737060546875, -15.1806640625, -14.624267578125, -14.06787109375, -13.511474609375, -12.955078125, -12.398681640625, -11.84228515625, -11.285888671875, -10.7294921875, -10.173095703125, -9.61669921875, -9.060302734375, -8.50390625, -7.947509765625, -7.39111328125, -6.834716796875, -6.2783203125, -5.721923828125, -5.16552734375, -4.609130859375, -4.052734375, -3.496337890625, -2.93994140625, -2.383544921875, -1.8271484375, -1.270751953125, -0.71435546875, -0.157958984375, 0.3984375, 0.954833984375, 1.51123046875, 2.067626953125, 2.6240234375, 3.180419921875, 3.73681640625, 4.293212890625, 4.849609375, 5.406005859375, 5.96240234375, 6.518798828125, 7.0751953125, 7.631591796875, 8.18798828125, 8.744384765625, 9.30078125, 9.857177734375, 10.41357421875, 10.969970703125, 11.5263671875, 12.082763671875, 12.63916015625, 13.195556640625, 13.751953125, 14.308349609375, 14.86474609375, 15.421142578125, 15.9775390625, 16.533935546875, 17.09033203125, 17.646728515625, 18.203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 13.0, 8.0, 14.0, 16.0, 15.0, 27.0, 25.0, 21.0, 27.0, 32.0, 50.0, 35.0, 29.0, 40.0, 39.0, 68.0, 1836.0, 228.0, 60.0, 40.0, 50.0, 39.0, 43.0, 32.0, 27.0, 41.0, 27.0, 23.0, 10.0, 20.0, 21.0, 15.0, 13.0, 6.0, 8.0, 12.0, 6.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-141.875, -137.564453125, -133.25390625, -128.943359375, -124.6328125, -120.322265625, -116.01171875, -111.701171875, -107.390625, -103.080078125, -98.76953125, -94.458984375, -90.1484375, -85.837890625, -81.52734375, -77.216796875, -72.90625, -68.595703125, -64.28515625, -59.974609375, -55.6640625, -51.353515625, -47.04296875, -42.732421875, -38.421875, -34.111328125, -29.80078125, -25.490234375, -21.1796875, -16.869140625, -12.55859375, -8.248046875, -3.9375, 0.373046875, 4.68359375, 8.994140625, 13.3046875, 17.615234375, 21.92578125, 26.236328125, 30.546875, 34.857421875, 39.16796875, 43.478515625, 47.7890625, 52.099609375, 56.41015625, 60.720703125, 65.03125, 69.341796875, 73.65234375, 77.962890625, 82.2734375, 86.583984375, 90.89453125, 95.205078125, 99.515625, 103.826171875, 108.13671875, 112.447265625, 116.7578125, 121.068359375, 125.37890625, 129.689453125, 134.0]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 11.0, 7.0, 12.0, 10.0, 14.0, 22.0, 24.0, 19.0, 34.0, 46.0, 72.0, 83.0, 117.0, 157.0, 240.0, 405.0, 953.0, 5032.0, 3018718.0, 115763.0, 2250.0, 631.0, 313.0, 225.0, 127.0, 124.0, 55.0, 36.0, 33.0, 30.0, 33.0, 15.0, 16.0, 17.0, 8.0, 13.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-203.125, -196.533203125, -189.94140625, -183.349609375, -176.7578125, -170.166015625, -163.57421875, -156.982421875, -150.390625, -143.798828125, -137.20703125, -130.615234375, -124.0234375, -117.431640625, -110.83984375, -104.248046875, -97.65625, -91.064453125, -84.47265625, -77.880859375, -71.2890625, -64.697265625, -58.10546875, -51.513671875, -44.921875, -38.330078125, -31.73828125, -25.146484375, -18.5546875, -11.962890625, -5.37109375, 1.220703125, 7.8125, 14.404296875, 20.99609375, 27.587890625, 34.1796875, 40.771484375, 47.36328125, 53.955078125, 60.546875, 67.138671875, 73.73046875, 80.322265625, 86.9140625, 93.505859375, 100.09765625, 106.689453125, 113.28125, 119.873046875, 126.46484375, 133.056640625, 139.6484375, 146.240234375, 152.83203125, 159.423828125, 166.015625, 172.607421875, 179.19921875, 185.791015625, 192.3828125, 198.974609375, 205.56640625, 212.158203125, 218.75]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 167.0, 853.0], "bins": [-3870.767578125, -3809.46533203125, -3748.1630859375, -3686.86083984375, -3625.558349609375, -3564.256103515625, -3502.953857421875, -3441.651611328125, -3380.349365234375, -3319.047119140625, -3257.744873046875, -3196.4423828125, -3135.14013671875, -3073.837890625, -3012.53564453125, -2951.2333984375, -2889.930908203125, -2828.628662109375, -2767.326416015625, -2706.02392578125, -2644.7216796875, -2583.41943359375, -2522.1171875, -2460.81494140625, -2399.5126953125, -2338.21044921875, -2276.908203125, -2215.60595703125, -2154.303466796875, -2093.001220703125, -2031.698974609375, -1970.396728515625, -1909.0943603515625, -1847.7921142578125, -1786.48974609375, -1725.1875, -1663.88525390625, -1602.5828857421875, -1541.2806396484375, -1479.978271484375, -1418.676025390625, -1357.373779296875, -1296.0714111328125, -1234.7691650390625, -1173.4669189453125, -1112.16455078125, -1050.8623046875, -989.5599975585938, -928.2577514648438, -866.9554443359375, -805.6531982421875, -744.3508911132812, -683.048583984375, -621.746337890625, -560.4440307617188, -499.1417236328125, -437.8394775390625, -376.5372009277344, -315.2348937988281, -253.9326171875, -192.6303253173828, -131.32803344726562, -70.0257568359375, -8.72344970703125, 52.57883071899414]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 8.0, 0.0, 4.0, 4.0, 2.0, 13.0, 12.0, 18.0, 13.0, 11.0, 9.0, 26.0, 23.0, 30.0, 39.0, 34.0, 41.0, 38.0, 30.0, 31.0, 51.0, 36.0, 40.0, 42.0, 53.0, 45.0, 32.0, 32.0, 36.0, 39.0, 28.0, 30.0, 27.0, 20.0, 19.0, 14.0, 11.0, 12.0, 6.0, 9.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0], "bins": [-498.8547058105469, -484.73089599609375, -470.6070861816406, -456.4832763671875, -442.3594665527344, -428.23565673828125, -414.1118469238281, -399.988037109375, -385.8642272949219, -371.74041748046875, -357.6166076660156, -343.4927978515625, -329.3689880371094, -315.24517822265625, -301.1213684082031, -286.99755859375, -272.8737487792969, -258.74993896484375, -244.62612915039062, -230.5023193359375, -216.37850952148438, -202.25469970703125, -188.13088989257812, -174.007080078125, -159.88327026367188, -145.75946044921875, -131.63565063476562, -117.5118408203125, -103.38803100585938, -89.26422119140625, -75.14041137695312, -61.0166015625, -46.892791748046875, -32.76898193359375, -18.645172119140625, -4.5213623046875, 9.602447509765625, 23.72625732421875, 37.850067138671875, 51.973876953125, 66.09768676757812, 80.22149658203125, 94.34530639648438, 108.4691162109375, 122.59292602539062, 136.71673583984375, 150.84054565429688, 164.96435546875, 179.08816528320312, 193.21197509765625, 207.33578491210938, 221.4595947265625, 235.58340454101562, 249.70721435546875, 263.8310241699219, 277.954833984375, 292.0786437988281, 306.20245361328125, 320.3262634277344, 334.4500732421875, 348.5738830566406, 362.69769287109375, 376.8215026855469, 390.9453125, 405.0691223144531]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 7.0, 9.0, 13.0, 12.0, 14.0, 20.0, 20.0, 26.0, 32.0, 27.0, 34.0, 33.0, 51.0, 47.0, 50.0, 52.0, 59.0, 54.0, 39.0, 41.0, 44.0, 40.0, 39.0, 34.0, 35.0, 19.0, 22.0, 29.0, 12.0, 15.0, 13.0, 6.0, 9.0, 9.0, 7.0, 6.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-42.28125, -40.9208984375, -39.560546875, -38.2001953125, -36.83984375, -35.4794921875, -34.119140625, -32.7587890625, -31.3984375, -30.0380859375, -28.677734375, -27.3173828125, -25.95703125, -24.5966796875, -23.236328125, -21.8759765625, -20.515625, -19.1552734375, -17.794921875, -16.4345703125, -15.07421875, -13.7138671875, -12.353515625, -10.9931640625, -9.6328125, -8.2724609375, -6.912109375, -5.5517578125, -4.19140625, -2.8310546875, -1.470703125, -0.1103515625, 1.25, 2.6103515625, 3.970703125, 5.3310546875, 6.69140625, 8.0517578125, 9.412109375, 10.7724609375, 12.1328125, 13.4931640625, 14.853515625, 16.2138671875, 17.57421875, 18.9345703125, 20.294921875, 21.6552734375, 23.015625, 24.3759765625, 25.736328125, 27.0966796875, 28.45703125, 29.8173828125, 31.177734375, 32.5380859375, 33.8984375, 35.2587890625, 36.619140625, 37.9794921875, 39.33984375, 40.7001953125, 42.060546875, 43.4208984375, 44.78125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 1.0, 15.0, 14.0, 21.0, 28.0, 49.0, 68.0, 97.0, 100.0, 188.0, 259.0, 433.0, 637.0, 1005.0, 1646.0, 2935.0, 5331.0, 10364.0, 21521.0, 104199.0, 3002057.0, 960778.0, 46089.0, 16595.0, 8570.0, 4484.0, 2530.0, 1487.0, 912.0, 617.0, 402.0, 253.0, 186.0, 104.0, 87.0, 59.0, 47.0, 38.0, 21.0, 14.0, 12.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-122.0, -118.16796875, -114.3359375, -110.50390625, -106.671875, -102.83984375, -99.0078125, -95.17578125, -91.34375, -87.51171875, -83.6796875, -79.84765625, -76.015625, -72.18359375, -68.3515625, -64.51953125, -60.6875, -56.85546875, -53.0234375, -49.19140625, -45.359375, -41.52734375, -37.6953125, -33.86328125, -30.03125, -26.19921875, -22.3671875, -18.53515625, -14.703125, -10.87109375, -7.0390625, -3.20703125, 0.625, 4.45703125, 8.2890625, 12.12109375, 15.953125, 19.78515625, 23.6171875, 27.44921875, 31.28125, 35.11328125, 38.9453125, 42.77734375, 46.609375, 50.44140625, 54.2734375, 58.10546875, 61.9375, 65.76953125, 69.6015625, 73.43359375, 77.265625, 81.09765625, 84.9296875, 88.76171875, 92.59375, 96.42578125, 100.2578125, 104.08984375, 107.921875, 111.75390625, 115.5859375, 119.41796875, 123.25]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 5.0, 9.0, 7.0, 12.0, 20.0, 11.0, 25.0, 21.0, 51.0, 62.0, 96.0, 122.0, 209.0, 393.0, 746.0, 899.0, 532.0, 282.0, 180.0, 98.0, 83.0, 48.0, 40.0, 23.0, 16.0, 14.0, 12.0, 10.0, 6.0, 13.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-140.75, -136.7587890625, -132.767578125, -128.7763671875, -124.78515625, -120.7939453125, -116.802734375, -112.8115234375, -108.8203125, -104.8291015625, -100.837890625, -96.8466796875, -92.85546875, -88.8642578125, -84.873046875, -80.8818359375, -76.890625, -72.8994140625, -68.908203125, -64.9169921875, -60.92578125, -56.9345703125, -52.943359375, -48.9521484375, -44.9609375, -40.9697265625, -36.978515625, -32.9873046875, -28.99609375, -25.0048828125, -21.013671875, -17.0224609375, -13.03125, -9.0400390625, -5.048828125, -1.0576171875, 2.93359375, 6.9248046875, 10.916015625, 14.9072265625, 18.8984375, 22.8896484375, 26.880859375, 30.8720703125, 34.86328125, 38.8544921875, 42.845703125, 46.8369140625, 50.828125, 54.8193359375, 58.810546875, 62.8017578125, 66.79296875, 70.7841796875, 74.775390625, 78.7666015625, 82.7578125, 86.7490234375, 90.740234375, 94.7314453125, 98.72265625, 102.7138671875, 106.705078125, 110.6962890625, 114.6875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 7.0, 16.0, 15.0, 12.0, 25.0, 43.0, 47.0, 101.0, 148.0, 307.0, 455.0, 952.0, 1955.0, 4450.0, 11342.0, 35397.0, 315060.0, 3723587.0, 69843.0, 18140.0, 6679.0, 2838.0, 1328.0, 631.0, 317.0, 225.0, 110.0, 71.0, 51.0, 23.0, 22.0, 18.0, 11.0, 9.0, 12.0, 10.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-306.5, -296.68359375, -286.8671875, -277.05078125, -267.234375, -257.41796875, -247.6015625, -237.78515625, -227.96875, -218.15234375, -208.3359375, -198.51953125, -188.703125, -178.88671875, -169.0703125, -159.25390625, -149.4375, -139.62109375, -129.8046875, -119.98828125, -110.171875, -100.35546875, -90.5390625, -80.72265625, -70.90625, -61.08984375, -51.2734375, -41.45703125, -31.640625, -21.82421875, -12.0078125, -2.19140625, 7.625, 17.44140625, 27.2578125, 37.07421875, 46.890625, 56.70703125, 66.5234375, 76.33984375, 86.15625, 95.97265625, 105.7890625, 115.60546875, 125.421875, 135.23828125, 145.0546875, 154.87109375, 164.6875, 174.50390625, 184.3203125, 194.13671875, 203.953125, 213.76953125, 223.5859375, 233.40234375, 243.21875, 253.03515625, 262.8515625, 272.66796875, 282.484375, 292.30078125, 302.1171875, 311.93359375, 321.75]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 7.0, 9.0, 29.0, 39.0, 59.0, 138.0, 306.0, 189.0, 95.0, 53.0, 32.0, 17.0, 7.0, 10.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-717.5640258789062, -690.7764892578125, -663.989013671875, -637.2014770507812, -610.4140014648438, -583.62646484375, -556.8389892578125, -530.0514526367188, -503.26397705078125, -476.4764709472656, -449.68896484375, -422.9014587402344, -396.11395263671875, -369.326416015625, -342.5389404296875, -315.75140380859375, -288.9638977050781, -262.1763916015625, -235.38888549804688, -208.60137939453125, -181.81387329101562, -155.02635192871094, -128.2388458251953, -101.45133972167969, -74.66383361816406, -47.87632751464844, -21.088817596435547, 5.698692321777344, 32.48619842529297, 59.273712158203125, 86.06121826171875, 112.84872436523438, 139.63623046875, 166.42373657226562, 193.21124267578125, 219.99874877929688, 246.7862548828125, 273.57379150390625, 300.36126708984375, 327.1488037109375, 353.936279296875, 380.7237854003906, 407.51129150390625, 434.2987976074219, 461.0863037109375, 487.87384033203125, 514.6613159179688, 541.4488525390625, 568.236328125, 595.0238647460938, 621.8113403320312, 648.598876953125, 675.3863525390625, 702.1738891601562, 728.9613647460938, 755.7489013671875, 782.5364379882812, 809.323974609375, 836.1114501953125, 862.8989868164062, 889.6864624023438, 916.4739990234375, 943.261474609375, 970.0490112304688, 996.8364868164062]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 5.0, 9.0, 8.0, 9.0, 14.0, 14.0, 14.0, 33.0, 26.0, 20.0, 16.0, 19.0, 26.0, 25.0, 35.0, 43.0, 57.0, 44.0, 42.0, 51.0, 39.0, 40.0, 50.0, 39.0, 33.0, 30.0, 35.0, 29.0, 31.0, 22.0, 25.0, 23.0, 14.0, 17.0, 14.0, 9.0, 5.0, 8.0, 3.0, 5.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.17828369140625, -315.122802734375, -304.0672912597656, -293.0118103027344, -281.956298828125, -270.90081787109375, -259.8453369140625, -248.7898406982422, -237.73434448242188, -226.67884826660156, -215.62335205078125, -204.56787109375, -193.5123748779297, -182.45687866210938, -171.40139770507812, -160.3459014892578, -149.2904052734375, -138.2349090576172, -127.1794204711914, -116.12393188476562, -105.06843566894531, -94.012939453125, -82.95745086669922, -71.90196228027344, -60.846466064453125, -49.79097366333008, -38.73548126220703, -27.679988861083984, -16.624496459960938, -5.569004058837891, 5.486488342285156, 16.541976928710938, 27.597442626953125, 38.65293502807617, 49.70842742919922, 60.763919830322266, 71.81941223144531, 82.87490844726562, 93.9303970336914, 104.98588562011719, 116.0413818359375, 127.09687805175781, 138.15237426757812, 149.20785522460938, 160.2633514404297, 171.31884765625, 182.37432861328125, 193.42982482910156, 204.48532104492188, 215.5408172607422, 226.5963134765625, 237.65179443359375, 248.70729064941406, 259.7627868652344, 270.8182678222656, 281.873779296875, 292.92926025390625, 303.9847412109375, 315.0402526855469, 326.0957336425781, 337.1512451171875, 348.20672607421875, 359.26220703125, 370.31768798828125, 381.3731994628906]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 9.0, 4.0, 11.0, 13.0, 18.0, 15.0, 24.0, 29.0, 33.0, 37.0, 41.0, 42.0, 58.0, 35.0, 64.0, 45.0, 51.0, 45.0, 54.0, 53.0, 40.0, 32.0, 44.0, 27.0, 23.0, 21.0, 19.0, 20.0, 17.0, 17.0, 6.0, 7.0, 6.0, 8.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.125, -41.65576171875, -40.1865234375, -38.71728515625, -37.248046875, -35.77880859375, -34.3095703125, -32.84033203125, -31.37109375, -29.90185546875, -28.4326171875, -26.96337890625, -25.494140625, -24.02490234375, -22.5556640625, -21.08642578125, -19.6171875, -18.14794921875, -16.6787109375, -15.20947265625, -13.740234375, -12.27099609375, -10.8017578125, -9.33251953125, -7.86328125, -6.39404296875, -4.9248046875, -3.45556640625, -1.986328125, -0.51708984375, 0.9521484375, 2.42138671875, 3.890625, 5.35986328125, 6.8291015625, 8.29833984375, 9.767578125, 11.23681640625, 12.7060546875, 14.17529296875, 15.64453125, 17.11376953125, 18.5830078125, 20.05224609375, 21.521484375, 22.99072265625, 24.4599609375, 25.92919921875, 27.3984375, 28.86767578125, 30.3369140625, 31.80615234375, 33.275390625, 34.74462890625, 36.2138671875, 37.68310546875, 39.15234375, 40.62158203125, 42.0908203125, 43.56005859375, 45.029296875, 46.49853515625, 47.9677734375, 49.43701171875, 50.90625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 9.0, 11.0, 13.0, 21.0, 30.0, 33.0, 47.0, 70.0, 72.0, 117.0, 158.0, 244.0, 271.0, 441.0, 607.0, 837.0, 1301.0, 1836.0, 2741.0, 4458.0, 7690.0, 16226.0, 44122.0, 186020.0, 573111.0, 138293.0, 35955.0, 14173.0, 7042.0, 4212.0, 2622.0, 1684.0, 1177.0, 833.0, 607.0, 407.0, 274.0, 206.0, 187.0, 111.0, 94.0, 46.0, 36.0, 38.0, 26.0, 12.0, 5.0, 7.0, 10.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.4296875, -12.02099609375, -11.6123046875, -11.20361328125, -10.794921875, -10.38623046875, -9.9775390625, -9.56884765625, -9.16015625, -8.75146484375, -8.3427734375, -7.93408203125, -7.525390625, -7.11669921875, -6.7080078125, -6.29931640625, -5.890625, -5.48193359375, -5.0732421875, -4.66455078125, -4.255859375, -3.84716796875, -3.4384765625, -3.02978515625, -2.62109375, -2.21240234375, -1.8037109375, -1.39501953125, -0.986328125, -0.57763671875, -0.1689453125, 0.23974609375, 0.6484375, 1.05712890625, 1.4658203125, 1.87451171875, 2.283203125, 2.69189453125, 3.1005859375, 3.50927734375, 3.91796875, 4.32666015625, 4.7353515625, 5.14404296875, 5.552734375, 5.96142578125, 6.3701171875, 6.77880859375, 7.1875, 7.59619140625, 8.0048828125, 8.41357421875, 8.822265625, 9.23095703125, 9.6396484375, 10.04833984375, 10.45703125, 10.86572265625, 11.2744140625, 11.68310546875, 12.091796875, 12.50048828125, 12.9091796875, 13.31787109375, 13.7265625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 18.0, 17.0, 17.0, 14.0, 24.0, 21.0, 25.0, 25.0, 24.0, 32.0, 39.0, 42.0, 40.0, 49.0, 46.0, 40.0, 1059.0, 37.0, 38.0, 43.0, 39.0, 46.0, 28.0, 20.0, 35.0, 31.0, 20.0, 21.0, 16.0, 19.0, 11.0, 7.0, 12.0, 11.0, 8.0, 4.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.125, -25.272705078125, -24.42041015625, -23.568115234375, -22.7158203125, -21.863525390625, -21.01123046875, -20.158935546875, -19.306640625, -18.454345703125, -17.60205078125, -16.749755859375, -15.8974609375, -15.045166015625, -14.19287109375, -13.340576171875, -12.48828125, -11.635986328125, -10.78369140625, -9.931396484375, -9.0791015625, -8.226806640625, -7.37451171875, -6.522216796875, -5.669921875, -4.817626953125, -3.96533203125, -3.113037109375, -2.2607421875, -1.408447265625, -0.55615234375, 0.296142578125, 1.1484375, 2.000732421875, 2.85302734375, 3.705322265625, 4.5576171875, 5.409912109375, 6.26220703125, 7.114501953125, 7.966796875, 8.819091796875, 9.67138671875, 10.523681640625, 11.3759765625, 12.228271484375, 13.08056640625, 13.932861328125, 14.78515625, 15.637451171875, 16.48974609375, 17.342041015625, 18.1943359375, 19.046630859375, 19.89892578125, 20.751220703125, 21.603515625, 22.455810546875, 23.30810546875, 24.160400390625, 25.0126953125, 25.864990234375, 26.71728515625, 27.569580078125, 28.421875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 9.0, 15.0, 20.0, 31.0, 34.0, 59.0, 76.0, 119.0, 206.0, 258.0, 379.0, 584.0, 951.0, 1541.0, 2471.0, 3943.0, 6681.0, 11895.0, 21792.0, 43180.0, 94139.0, 269078.0, 1309775.0, 179498.0, 72456.0, 35130.0, 18101.0, 9919.0, 5656.0, 3330.0, 2013.0, 1292.0, 880.0, 505.0, 350.0, 237.0, 185.0, 85.0, 85.0, 51.0, 38.0, 30.0, 11.0, 16.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.375, -4.23541259765625, -4.0958251953125, -3.95623779296875, -3.816650390625, -3.67706298828125, -3.5374755859375, -3.39788818359375, -3.25830078125, -3.11871337890625, -2.9791259765625, -2.83953857421875, -2.699951171875, -2.56036376953125, -2.4207763671875, -2.28118896484375, -2.1416015625, -2.00201416015625, -1.8624267578125, -1.72283935546875, -1.583251953125, -1.44366455078125, -1.3040771484375, -1.16448974609375, -1.02490234375, -0.88531494140625, -0.7457275390625, -0.60614013671875, -0.466552734375, -0.32696533203125, -0.1873779296875, -0.04779052734375, 0.091796875, 0.23138427734375, 0.3709716796875, 0.51055908203125, 0.650146484375, 0.78973388671875, 0.9293212890625, 1.06890869140625, 1.20849609375, 1.34808349609375, 1.4876708984375, 1.62725830078125, 1.766845703125, 1.90643310546875, 2.0460205078125, 2.18560791015625, 2.3251953125, 2.46478271484375, 2.6043701171875, 2.74395751953125, 2.883544921875, 3.02313232421875, 3.1627197265625, 3.30230712890625, 3.44189453125, 3.58148193359375, 3.7210693359375, 3.86065673828125, 4.000244140625, 4.13983154296875, 4.2794189453125, 4.41900634765625, 4.55859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 6.0, 9.0, 11.0, 13.0, 12.0, 16.0, 24.0, 30.0, 30.0, 42.0, 41.0, 63.0, 73.0, 71.0, 80.0, 72.0, 90.0, 56.0, 51.0, 43.0, 34.0, 30.0, 21.0, 10.0, 6.0, 8.0, 8.0, 8.0, 9.0, 3.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83154296875, -0.8021163940429688, -0.7726898193359375, -0.7432632446289062, -0.713836669921875, -0.6844100952148438, -0.6549835205078125, -0.6255569458007812, -0.59613037109375, -0.5667037963867188, -0.5372772216796875, -0.5078506469726562, -0.478424072265625, -0.44899749755859375, -0.4195709228515625, -0.39014434814453125, -0.3607177734375, -0.33129119873046875, -0.3018646240234375, -0.27243804931640625, -0.243011474609375, -0.21358489990234375, -0.1841583251953125, -0.15473175048828125, -0.12530517578125, -0.09587860107421875, -0.0664520263671875, -0.03702545166015625, -0.007598876953125, 0.02182769775390625, 0.0512542724609375, 0.08068084716796875, 0.110107421875, 0.13953399658203125, 0.1689605712890625, 0.19838714599609375, 0.227813720703125, 0.25724029541015625, 0.2866668701171875, 0.31609344482421875, 0.34552001953125, 0.37494659423828125, 0.4043731689453125, 0.43379974365234375, 0.463226318359375, 0.49265289306640625, 0.5220794677734375, 0.5515060424804688, 0.5809326171875, 0.6103591918945312, 0.6397857666015625, 0.6692123413085938, 0.698638916015625, 0.7280654907226562, 0.7574920654296875, 0.7869186401367188, 0.81634521484375, 0.8457717895507812, 0.8751983642578125, 0.9046249389648438, 0.934051513671875, 0.9634780883789062, 0.9929046630859375, 1.0223312377929688, 1.0517578125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 8.0, 2.0, 2.0, 11.0, 8.0, 6.0, 11.0, 8.0, 10.0, 21.0, 32.0, 39.0, 48.0, 72.0, 83.0, 140.0, 264.0, 1046913.0, 331.0, 162.0, 105.0, 56.0, 46.0, 33.0, 28.0, 27.0, 15.0, 11.0, 11.0, 12.0, 9.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.408447265625, -31.47314453125, -30.537841796875, -29.6025390625, -28.667236328125, -27.73193359375, -26.796630859375, -25.861328125, -24.926025390625, -23.99072265625, -23.055419921875, -22.1201171875, -21.184814453125, -20.24951171875, -19.314208984375, -18.37890625, -17.443603515625, -16.50830078125, -15.572998046875, -14.6376953125, -13.702392578125, -12.76708984375, -11.831787109375, -10.896484375, -9.961181640625, -9.02587890625, -8.090576171875, -7.1552734375, -6.219970703125, -5.28466796875, -4.349365234375, -3.4140625, -2.478759765625, -1.54345703125, -0.608154296875, 0.3271484375, 1.262451171875, 2.19775390625, 3.133056640625, 4.068359375, 5.003662109375, 5.93896484375, 6.874267578125, 7.8095703125, 8.744873046875, 9.68017578125, 10.615478515625, 11.55078125, 12.486083984375, 13.42138671875, 14.356689453125, 15.2919921875, 16.227294921875, 17.16259765625, 18.097900390625, 19.033203125, 19.968505859375, 20.90380859375, 21.839111328125, 22.7744140625, 23.709716796875, 24.64501953125, 25.580322265625, 26.515625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1021.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34220564365386963, 0.515373945236206, 1.3729535341262817, 2.2305331230163574, 3.0881128311157227, 3.945692539215088, 4.803271770477295, 5.66085147857666, 6.518431186676025, 7.376010894775391, 8.233590126037598, 9.091169357299805, 9.948749542236328, 10.806329727172852, 11.663908004760742, 12.521488189697266, 13.379067420959473, 14.23664665222168, 15.094226837158203, 15.95180606842041, 16.809385299682617, 17.66696548461914, 18.52454376220703, 19.382123947143555, 20.239704132080078, 21.0972843170166, 21.954862594604492, 22.812442779541016, 23.67002296447754, 24.527603149414062, 25.385181427001953, 26.242761611938477, 27.100341796875, 27.957921981811523, 28.815500259399414, 29.673080444335938, 30.53066062927246, 31.388240814208984, 32.245819091796875, 33.103397369384766, 33.96097946166992, 34.81855773925781, 35.67613983154297, 36.53371810913086, 37.39129638671875, 38.248878479003906, 39.1064567565918, 39.96403503417969, 40.821617126464844, 41.679195404052734, 42.53677749633789, 43.39435577392578, 44.25193405151367, 45.10951614379883, 45.96709442138672, 46.82467269897461, 47.6822509765625, 48.53982925415039, 49.39741134643555, 50.25498962402344, 51.11256790161133, 51.970149993896484, 52.827728271484375, 53.685306549072266, 54.54288864135742]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 8.0, 8.0, 11.0, 16.0, 14.0, 17.0, 25.0, 31.0, 18.0, 23.0, 31.0, 29.0, 35.0, 37.0, 40.0, 41.0, 32.0, 37.0, 44.0, 46.0, 34.0, 34.0, 36.0, 26.0, 36.0, 32.0, 33.0, 27.0, 27.0, 24.0, 26.0, 23.0, 15.0, 17.0, 9.0, 17.0, 9.0, 8.0, 3.0, 2.0, 6.0, 2.0, 2.0, 6.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2174978256225586, -2.1358795166015625, -2.0542612075805664, -1.9726428985595703, -1.8910247087478638, -1.8094063997268677, -1.7277880907058716, -1.646169900894165, -1.564551591873169, -1.4829332828521729, -1.4013149738311768, -1.3196966648101807, -1.2380784749984741, -1.156460165977478, -1.074841856956482, -0.9932236075401306, -0.9116052389144897, -0.8299869298934937, -0.7483686804771423, -0.6667503714561462, -0.5851321220397949, -0.5035138130187988, -0.42189550399780273, -0.3402772545814514, -0.2586589455604553, -0.17704066634178162, -0.09542237222194672, -0.013804078102111816, 0.06781420111656189, 0.1494324803352356, 0.2310507893562317, 0.312669038772583, 0.3942873477935791, 0.4759056270122528, 0.5575239062309265, 0.6391422152519226, 0.7207604646682739, 0.80237877368927, 0.8839970827102661, 0.9656153321266174, 1.0472335815429688, 1.1288518905639648, 1.210470199584961, 1.292088508605957, 1.3737066984176636, 1.4553250074386597, 1.5369433164596558, 1.6185615062713623, 1.700179934501648, 1.781798243522644, 1.8634165525436401, 1.9450347423553467, 2.0266530513763428, 2.108271360397339, 2.189889669418335, 2.271507978439331, 2.353126287460327, 2.4347445964813232, 2.5163629055023193, 2.5979812145233154, 2.6795995235443115, 2.7612175941467285, 2.8428359031677246, 2.9244542121887207, 3.006072521209717]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 9.0, 4.0, 11.0, 13.0, 18.0, 15.0, 24.0, 29.0, 33.0, 37.0, 41.0, 41.0, 59.0, 35.0, 64.0, 45.0, 51.0, 45.0, 54.0, 53.0, 40.0, 32.0, 44.0, 27.0, 23.0, 21.0, 19.0, 20.0, 17.0, 17.0, 6.0, 7.0, 6.0, 8.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.125, -41.65576171875, -40.1865234375, -38.71728515625, -37.248046875, -35.77880859375, -34.3095703125, -32.84033203125, -31.37109375, -29.90185546875, -28.4326171875, -26.96337890625, -25.494140625, -24.02490234375, -22.5556640625, -21.08642578125, -19.6171875, -18.14794921875, -16.6787109375, -15.20947265625, -13.740234375, -12.27099609375, -10.8017578125, -9.33251953125, -7.86328125, -6.39404296875, -4.9248046875, -3.45556640625, -1.986328125, -0.51708984375, 0.9521484375, 2.42138671875, 3.890625, 5.35986328125, 6.8291015625, 8.29833984375, 9.767578125, 11.23681640625, 12.7060546875, 14.17529296875, 15.64453125, 17.11376953125, 18.5830078125, 20.05224609375, 21.521484375, 22.99072265625, 24.4599609375, 25.92919921875, 27.3984375, 28.86767578125, 30.3369140625, 31.80615234375, 33.275390625, 34.74462890625, 36.2138671875, 37.68310546875, 39.15234375, 40.62158203125, 42.0908203125, 43.56005859375, 45.029296875, 46.49853515625, 47.9677734375, 49.43701171875, 50.90625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 9.0, 7.0, 16.0, 22.0, 33.0, 44.0, 84.0, 146.0, 272.0, 581.0, 1234.0, 2907.0, 6903.0, 18870.0, 60798.0, 286971.0, 526434.0, 98987.0, 27430.0, 9909.0, 3704.0, 1663.0, 733.0, 328.0, 173.0, 82.0, 52.0, 33.0, 38.0, 12.0, 12.0, 7.0, 7.0, 11.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.25, -19.53125, -18.8125, -18.09375, -17.375, -16.65625, -15.9375, -15.21875, -14.5, -13.78125, -13.0625, -12.34375, -11.625, -10.90625, -10.1875, -9.46875, -8.75, -8.03125, -7.3125, -6.59375, -5.875, -5.15625, -4.4375, -3.71875, -3.0, -2.28125, -1.5625, -0.84375, -0.125, 0.59375, 1.3125, 2.03125, 2.75, 3.46875, 4.1875, 4.90625, 5.625, 6.34375, 7.0625, 7.78125, 8.5, 9.21875, 9.9375, 10.65625, 11.375, 12.09375, 12.8125, 13.53125, 14.25, 14.96875, 15.6875, 16.40625, 17.125, 17.84375, 18.5625, 19.28125, 20.0, 20.71875, 21.4375, 22.15625, 22.875, 23.59375, 24.3125, 25.03125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 5.0, 6.0, 7.0, 5.0, 8.0, 13.0, 12.0, 13.0, 21.0, 19.0, 23.0, 23.0, 25.0, 15.0, 31.0, 19.0, 40.0, 34.0, 44.0, 25.0, 41.0, 74.0, 2000.0, 68.0, 44.0, 43.0, 38.0, 34.0, 32.0, 24.0, 36.0, 25.0, 26.0, 29.0, 14.0, 15.0, 17.0, 20.0, 7.0, 16.0, 10.0, 7.0, 6.0, 5.0, 10.0, 4.0, 4.0, 4.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-121.0625, -117.0927734375, -113.123046875, -109.1533203125, -105.18359375, -101.2138671875, -97.244140625, -93.2744140625, -89.3046875, -85.3349609375, -81.365234375, -77.3955078125, -73.42578125, -69.4560546875, -65.486328125, -61.5166015625, -57.546875, -53.5771484375, -49.607421875, -45.6376953125, -41.66796875, -37.6982421875, -33.728515625, -29.7587890625, -25.7890625, -21.8193359375, -17.849609375, -13.8798828125, -9.91015625, -5.9404296875, -1.970703125, 1.9990234375, 5.96875, 9.9384765625, 13.908203125, 17.8779296875, 21.84765625, 25.8173828125, 29.787109375, 33.7568359375, 37.7265625, 41.6962890625, 45.666015625, 49.6357421875, 53.60546875, 57.5751953125, 61.544921875, 65.5146484375, 69.484375, 73.4541015625, 77.423828125, 81.3935546875, 85.36328125, 89.3330078125, 93.302734375, 97.2724609375, 101.2421875, 105.2119140625, 109.181640625, 113.1513671875, 117.12109375, 121.0908203125, 125.060546875, 129.0302734375, 133.0]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 0.0, 4.0, 3.0, 5.0, 7.0, 8.0, 5.0, 7.0, 10.0, 15.0, 10.0, 19.0, 17.0, 19.0, 23.0, 35.0, 44.0, 53.0, 76.0, 86.0, 141.0, 194.0, 321.0, 514.0, 1320.0, 14334.0, 3116730.0, 9021.0, 1219.0, 435.0, 293.0, 198.0, 145.0, 75.0, 61.0, 41.0, 36.0, 40.0, 24.0, 19.0, 23.0, 14.0, 11.0, 15.0, 5.0, 5.0, 7.0, 5.0, 6.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-221.625, -214.998046875, -208.37109375, -201.744140625, -195.1171875, -188.490234375, -181.86328125, -175.236328125, -168.609375, -161.982421875, -155.35546875, -148.728515625, -142.1015625, -135.474609375, -128.84765625, -122.220703125, -115.59375, -108.966796875, -102.33984375, -95.712890625, -89.0859375, -82.458984375, -75.83203125, -69.205078125, -62.578125, -55.951171875, -49.32421875, -42.697265625, -36.0703125, -29.443359375, -22.81640625, -16.189453125, -9.5625, -2.935546875, 3.69140625, 10.318359375, 16.9453125, 23.572265625, 30.19921875, 36.826171875, 43.453125, 50.080078125, 56.70703125, 63.333984375, 69.9609375, 76.587890625, 83.21484375, 89.841796875, 96.46875, 103.095703125, 109.72265625, 116.349609375, 122.9765625, 129.603515625, 136.23046875, 142.857421875, 149.484375, 156.111328125, 162.73828125, 169.365234375, 175.9921875, 182.619140625, 189.24609375, 195.873046875, 202.5]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 23.0, 919.0, 76.0, 0.0, 2.0], "bins": [-1884.5546875, -1853.460693359375, -1822.36669921875, -1791.272705078125, -1760.1785888671875, -1729.0845947265625, -1697.9906005859375, -1666.8966064453125, -1635.8026123046875, -1604.7086181640625, -1573.6146240234375, -1542.5205078125, -1511.426513671875, -1480.33251953125, -1449.238525390625, -1418.14453125, -1387.0504150390625, -1355.9564208984375, -1324.8624267578125, -1293.768310546875, -1262.67431640625, -1231.580322265625, -1200.486328125, -1169.392333984375, -1138.29833984375, -1107.204345703125, -1076.1103515625, -1045.016357421875, -1013.9223022460938, -982.8282470703125, -951.7342529296875, -920.6402587890625, -889.5462036132812, -858.4522094726562, -827.358154296875, -796.26416015625, -765.170166015625, -734.0761108398438, -702.9821166992188, -671.8880615234375, -640.7940673828125, -609.7000732421875, -578.6060180664062, -547.5120239257812, -516.4180297851562, -485.323974609375, -454.22998046875, -423.1359558105469, -392.04193115234375, -360.9479064941406, -329.8539123535156, -298.7598876953125, -267.6658630371094, -236.5718536376953, -205.47784423828125, -174.38381958007812, -143.28982543945312, -112.19580841064453, -81.10179138183594, -50.007781982421875, -18.91376495361328, 12.180252075195312, 43.274261474609375, 74.3682861328125, 105.46229553222656]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 14.0, 14.0, 7.0, 13.0, 14.0, 13.0, 17.0, 18.0, 12.0, 16.0, 22.0, 26.0, 28.0, 33.0, 32.0, 29.0, 42.0, 49.0, 24.0, 33.0, 39.0, 39.0, 39.0, 28.0, 33.0, 40.0, 36.0, 40.0, 37.0, 18.0, 32.0, 22.0, 12.0, 17.0, 20.0, 16.0, 23.0, 7.0, 12.0, 6.0, 3.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-398.93206787109375, -385.97369384765625, -373.0153503417969, -360.0569763183594, -347.0986328125, -334.1402587890625, -321.1819152832031, -308.2235412597656, -295.26519775390625, -282.30682373046875, -269.3484802246094, -256.3901062011719, -243.4317626953125, -230.473388671875, -217.51504516601562, -204.55667114257812, -191.5983123779297, -178.63995361328125, -165.6815948486328, -152.72323608398438, -139.76487731933594, -126.80651092529297, -113.84815216064453, -100.8897933959961, -87.93143463134766, -74.97307586669922, -62.01471710205078, -49.05635452270508, -36.09799575805664, -23.139633178710938, -10.1812744140625, 2.7770843505859375, 15.735443115234375, 28.693801879882812, 41.65216064453125, 54.61052322387695, 67.56887817382812, 80.5272445678711, 93.48560333251953, 106.44396209716797, 119.4023208618164, 132.36068725585938, 145.3190460205078, 158.27740478515625, 171.2357635498047, 184.19412231445312, 197.15248107910156, 210.11083984375, 223.06919860839844, 236.02755737304688, 248.9859161376953, 261.94427490234375, 274.90264892578125, 287.8609924316406, 300.8193664550781, 313.7777099609375, 326.736083984375, 339.6944580078125, 352.6528015136719, 365.6111755371094, 378.56951904296875, 391.52789306640625, 404.4862365722656, 417.4446105957031, 430.4029541015625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 7.0, 5.0, 5.0, 17.0, 13.0, 15.0, 23.0, 24.0, 30.0, 35.0, 38.0, 37.0, 49.0, 47.0, 50.0, 59.0, 44.0, 47.0, 45.0, 59.0, 51.0, 37.0, 36.0, 37.0, 22.0, 20.0, 24.0, 19.0, 17.0, 21.0, 9.0, 9.0, 7.0, 6.0, 9.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.65625, -41.18798828125, -39.7197265625, -38.25146484375, -36.783203125, -35.31494140625, -33.8466796875, -32.37841796875, -30.91015625, -29.44189453125, -27.9736328125, -26.50537109375, -25.037109375, -23.56884765625, -22.1005859375, -20.63232421875, -19.1640625, -17.69580078125, -16.2275390625, -14.75927734375, -13.291015625, -11.82275390625, -10.3544921875, -8.88623046875, -7.41796875, -5.94970703125, -4.4814453125, -3.01318359375, -1.544921875, -0.07666015625, 1.3916015625, 2.85986328125, 4.328125, 5.79638671875, 7.2646484375, 8.73291015625, 10.201171875, 11.66943359375, 13.1376953125, 14.60595703125, 16.07421875, 17.54248046875, 19.0107421875, 20.47900390625, 21.947265625, 23.41552734375, 24.8837890625, 26.35205078125, 27.8203125, 29.28857421875, 30.7568359375, 32.22509765625, 33.693359375, 35.16162109375, 36.6298828125, 38.09814453125, 39.56640625, 41.03466796875, 42.5029296875, 43.97119140625, 45.439453125, 46.90771484375, 48.3759765625, 49.84423828125, 51.3125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 11.0, 7.0, 14.0, 22.0, 21.0, 36.0, 43.0, 62.0, 104.0, 125.0, 191.0, 273.0, 376.0, 538.0, 826.0, 1199.0, 1829.0, 2925.0, 4477.0, 7594.0, 13617.0, 37410.0, 389934.0, 3309270.0, 356255.0, 32184.0, 13382.0, 7507.0, 4684.0, 2942.0, 1950.0, 1353.0, 880.0, 620.0, 462.0, 322.0, 212.0, 200.0, 98.0, 92.0, 61.0, 46.0, 25.0, 15.0, 26.0, 15.0, 12.0, 7.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-97.9375, -94.7255859375, -91.513671875, -88.3017578125, -85.08984375, -81.8779296875, -78.666015625, -75.4541015625, -72.2421875, -69.0302734375, -65.818359375, -62.6064453125, -59.39453125, -56.1826171875, -52.970703125, -49.7587890625, -46.546875, -43.3349609375, -40.123046875, -36.9111328125, -33.69921875, -30.4873046875, -27.275390625, -24.0634765625, -20.8515625, -17.6396484375, -14.427734375, -11.2158203125, -8.00390625, -4.7919921875, -1.580078125, 1.6318359375, 4.84375, 8.0556640625, 11.267578125, 14.4794921875, 17.69140625, 20.9033203125, 24.115234375, 27.3271484375, 30.5390625, 33.7509765625, 36.962890625, 40.1748046875, 43.38671875, 46.5986328125, 49.810546875, 53.0224609375, 56.234375, 59.4462890625, 62.658203125, 65.8701171875, 69.08203125, 72.2939453125, 75.505859375, 78.7177734375, 81.9296875, 85.1416015625, 88.353515625, 91.5654296875, 94.77734375, 97.9892578125, 101.201171875, 104.4130859375, 107.625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 7.0, 9.0, 10.0, 14.0, 22.0, 40.0, 43.0, 49.0, 77.0, 152.0, 260.0, 493.0, 917.0, 831.0, 459.0, 250.0, 147.0, 73.0, 47.0, 47.0, 30.0, 20.0, 14.0, 15.0, 9.0, 8.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.875, -145.45703125, -141.0390625, -136.62109375, -132.203125, -127.78515625, -123.3671875, -118.94921875, -114.53125, -110.11328125, -105.6953125, -101.27734375, -96.859375, -92.44140625, -88.0234375, -83.60546875, -79.1875, -74.76953125, -70.3515625, -65.93359375, -61.515625, -57.09765625, -52.6796875, -48.26171875, -43.84375, -39.42578125, -35.0078125, -30.58984375, -26.171875, -21.75390625, -17.3359375, -12.91796875, -8.5, -4.08203125, 0.3359375, 4.75390625, 9.171875, 13.58984375, 18.0078125, 22.42578125, 26.84375, 31.26171875, 35.6796875, 40.09765625, 44.515625, 48.93359375, 53.3515625, 57.76953125, 62.1875, 66.60546875, 71.0234375, 75.44140625, 79.859375, 84.27734375, 88.6953125, 93.11328125, 97.53125, 101.94921875, 106.3671875, 110.78515625, 115.203125, 119.62109375, 124.0390625, 128.45703125, 132.875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 5.0, 4.0, 9.0, 6.0, 12.0, 16.0, 24.0, 27.0, 41.0, 56.0, 103.0, 130.0, 236.0, 424.0, 647.0, 1277.0, 2489.0, 5448.0, 13222.0, 40056.0, 361877.0, 3654445.0, 77703.0, 20607.0, 8040.0, 3448.0, 1657.0, 912.0, 488.0, 298.0, 200.0, 114.0, 55.0, 54.0, 44.0, 26.0, 12.0, 15.0, 6.0, 8.0, 12.0, 5.0, 8.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-253.75, -245.06640625, -236.3828125, -227.69921875, -219.015625, -210.33203125, -201.6484375, -192.96484375, -184.28125, -175.59765625, -166.9140625, -158.23046875, -149.546875, -140.86328125, -132.1796875, -123.49609375, -114.8125, -106.12890625, -97.4453125, -88.76171875, -80.078125, -71.39453125, -62.7109375, -54.02734375, -45.34375, -36.66015625, -27.9765625, -19.29296875, -10.609375, -1.92578125, 6.7578125, 15.44140625, 24.125, 32.80859375, 41.4921875, 50.17578125, 58.859375, 67.54296875, 76.2265625, 84.91015625, 93.59375, 102.27734375, 110.9609375, 119.64453125, 128.328125, 137.01171875, 145.6953125, 154.37890625, 163.0625, 171.74609375, 180.4296875, 189.11328125, 197.796875, 206.48046875, 215.1640625, 223.84765625, 232.53125, 241.21484375, 249.8984375, 258.58203125, 267.265625, 275.94921875, 284.6328125, 293.31640625, 302.0]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 8.0, 8.0, 20.0, 21.0, 28.0, 62.0, 96.0, 205.0, 224.0, 115.0, 69.0, 43.0, 22.0, 20.0, 15.0, 13.0, 8.0, 9.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-502.72283935546875, -481.8905334472656, -461.0582275390625, -440.2259216308594, -419.39361572265625, -398.56134033203125, -377.7290344238281, -356.896728515625, -336.0644226074219, -315.23211669921875, -294.3998107910156, -273.5675048828125, -252.73521423339844, -231.9029083251953, -211.07061767578125, -190.23831176757812, -169.406005859375, -148.57369995117188, -127.74140167236328, -106.90910339355469, -86.07679748535156, -65.24449157714844, -44.412193298339844, -23.57989501953125, -2.747589111328125, 18.084712982177734, 38.917015075683594, 59.74931716918945, 80.58161926269531, 101.41392517089844, 122.24622344970703, 143.07852172851562, 163.91082763671875, 184.74313354492188, 205.575439453125, 226.40773010253906, 247.2400360107422, 268.07232666015625, 288.9046325683594, 309.7369384765625, 330.5692443847656, 351.40155029296875, 372.2338562011719, 393.066162109375, 413.8984375, 434.73077392578125, 455.56304931640625, 476.3953552246094, 497.2276611328125, 518.0599365234375, 538.8922729492188, 559.7245483398438, 580.556884765625, 601.38916015625, 622.2214965820312, 643.0537719726562, 663.8861083984375, 684.7183837890625, 705.5507202148438, 726.3829956054688, 747.21533203125, 768.047607421875, 788.8799438476562, 809.7122192382812, 830.5444946289062]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 4.0, 5.0, 9.0, 6.0, 13.0, 17.0, 22.0, 24.0, 22.0, 28.0, 26.0, 19.0, 29.0, 24.0, 34.0, 32.0, 36.0, 31.0, 48.0, 42.0, 35.0, 32.0, 39.0, 31.0, 35.0, 41.0, 35.0, 33.0, 16.0, 19.0, 24.0, 26.0, 23.0, 16.0, 16.0, 19.0, 17.0, 10.0, 10.0, 7.0, 9.0, 3.0, 3.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-324.1053466796875, -314.41790771484375, -304.7304382324219, -295.0429992675781, -285.35552978515625, -275.6680908203125, -265.9806213378906, -256.2931823730469, -246.60572814941406, -236.91827392578125, -227.23081970214844, -217.54336547851562, -207.85592651367188, -198.16845703125, -188.48101806640625, -178.79356384277344, -169.10610961914062, -159.4186553955078, -149.731201171875, -140.0437469482422, -130.35629272460938, -120.6688461303711, -110.98139953613281, -101.2939453125, -91.60649108886719, -81.91903686523438, -72.23158264160156, -62.54413604736328, -52.85668182373047, -43.169227600097656, -33.48177719116211, -23.794326782226562, -14.106903076171875, -4.419450759887695, 5.268001556396484, 14.955453872680664, 24.642906188964844, 34.330360412597656, 44.0178108215332, 53.70526123046875, 63.39271545410156, 73.08016967773438, 82.76762390136719, 92.45507049560547, 102.14252471923828, 111.8299789428711, 121.51742553710938, 131.2048797607422, 140.892333984375, 150.5797882080078, 160.26724243164062, 169.95469665527344, 179.64215087890625, 189.32958984375, 199.0170440673828, 208.70449829101562, 218.39195251464844, 228.07940673828125, 237.76686096191406, 247.45431518554688, 257.1417541503906, 266.8292236328125, 276.51666259765625, 286.2041015625, 295.8915710449219]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 6.0, 3.0, 7.0, 3.0, 6.0, 11.0, 9.0, 21.0, 14.0, 17.0, 23.0, 25.0, 34.0, 26.0, 36.0, 34.0, 41.0, 56.0, 45.0, 48.0, 48.0, 45.0, 55.0, 46.0, 41.0, 38.0, 38.0, 33.0, 30.0, 23.0, 23.0, 16.0, 19.0, 9.0, 17.0, 12.0, 5.0, 6.0, 10.0, 7.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.15625, -39.7314453125, -38.306640625, -36.8818359375, -35.45703125, -34.0322265625, -32.607421875, -31.1826171875, -29.7578125, -28.3330078125, -26.908203125, -25.4833984375, -24.05859375, -22.6337890625, -21.208984375, -19.7841796875, -18.359375, -16.9345703125, -15.509765625, -14.0849609375, -12.66015625, -11.2353515625, -9.810546875, -8.3857421875, -6.9609375, -5.5361328125, -4.111328125, -2.6865234375, -1.26171875, 0.1630859375, 1.587890625, 3.0126953125, 4.4375, 5.8623046875, 7.287109375, 8.7119140625, 10.13671875, 11.5615234375, 12.986328125, 14.4111328125, 15.8359375, 17.2607421875, 18.685546875, 20.1103515625, 21.53515625, 22.9599609375, 24.384765625, 25.8095703125, 27.234375, 28.6591796875, 30.083984375, 31.5087890625, 32.93359375, 34.3583984375, 35.783203125, 37.2080078125, 38.6328125, 40.0576171875, 41.482421875, 42.9072265625, 44.33203125, 45.7568359375, 47.181640625, 48.6064453125, 50.03125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 5.0, 8.0, 11.0, 15.0, 30.0, 33.0, 41.0, 72.0, 108.0, 159.0, 234.0, 332.0, 468.0, 778.0, 1184.0, 1883.0, 3253.0, 6366.0, 15482.0, 53985.0, 330350.0, 522274.0, 74928.0, 19543.0, 7458.0, 3613.0, 2162.0, 1267.0, 842.0, 527.0, 379.0, 240.0, 170.0, 111.0, 69.0, 59.0, 35.0, 27.0, 16.0, 16.0, 5.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.625, -16.1375732421875, -15.650146484375, -15.1627197265625, -14.67529296875, -14.1878662109375, -13.700439453125, -13.2130126953125, -12.7255859375, -12.2381591796875, -11.750732421875, -11.2633056640625, -10.77587890625, -10.2884521484375, -9.801025390625, -9.3135986328125, -8.826171875, -8.3387451171875, -7.851318359375, -7.3638916015625, -6.87646484375, -6.3890380859375, -5.901611328125, -5.4141845703125, -4.9267578125, -4.4393310546875, -3.951904296875, -3.4644775390625, -2.97705078125, -2.4896240234375, -2.002197265625, -1.5147705078125, -1.02734375, -0.5399169921875, -0.052490234375, 0.4349365234375, 0.92236328125, 1.4097900390625, 1.897216796875, 2.3846435546875, 2.8720703125, 3.3594970703125, 3.846923828125, 4.3343505859375, 4.82177734375, 5.3092041015625, 5.796630859375, 6.2840576171875, 6.771484375, 7.2589111328125, 7.746337890625, 8.2337646484375, 8.72119140625, 9.2086181640625, 9.696044921875, 10.1834716796875, 10.6708984375, 11.1583251953125, 11.645751953125, 12.1331787109375, 12.62060546875, 13.1080322265625, 13.595458984375, 14.0828857421875, 14.5703125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 10.0, 12.0, 11.0, 18.0, 21.0, 20.0, 16.0, 27.0, 38.0, 32.0, 40.0, 36.0, 29.0, 40.0, 34.0, 43.0, 33.0, 1064.0, 39.0, 41.0, 34.0, 35.0, 50.0, 32.0, 47.0, 32.0, 29.0, 27.0, 22.0, 20.0, 15.0, 15.0, 9.0, 9.0, 8.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.421875, -27.5126953125, -26.603515625, -25.6943359375, -24.78515625, -23.8759765625, -22.966796875, -22.0576171875, -21.1484375, -20.2392578125, -19.330078125, -18.4208984375, -17.51171875, -16.6025390625, -15.693359375, -14.7841796875, -13.875, -12.9658203125, -12.056640625, -11.1474609375, -10.23828125, -9.3291015625, -8.419921875, -7.5107421875, -6.6015625, -5.6923828125, -4.783203125, -3.8740234375, -2.96484375, -2.0556640625, -1.146484375, -0.2373046875, 0.671875, 1.5810546875, 2.490234375, 3.3994140625, 4.30859375, 5.2177734375, 6.126953125, 7.0361328125, 7.9453125, 8.8544921875, 9.763671875, 10.6728515625, 11.58203125, 12.4912109375, 13.400390625, 14.3095703125, 15.21875, 16.1279296875, 17.037109375, 17.9462890625, 18.85546875, 19.7646484375, 20.673828125, 21.5830078125, 22.4921875, 23.4013671875, 24.310546875, 25.2197265625, 26.12890625, 27.0380859375, 27.947265625, 28.8564453125, 29.765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 8.0, 4.0, 15.0, 17.0, 21.0, 51.0, 56.0, 96.0, 123.0, 184.0, 315.0, 435.0, 708.0, 1086.0, 1823.0, 3189.0, 5712.0, 11119.0, 24128.0, 58953.0, 163388.0, 1417802.0, 260006.0, 83226.0, 32915.0, 14837.0, 7086.0, 3867.0, 2248.0, 1326.0, 819.0, 534.0, 340.0, 205.0, 158.0, 110.0, 73.0, 37.0, 31.0, 26.0, 17.0, 12.0, 11.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.4453125, -5.2734375, -5.1015625, -4.9296875, -4.7578125, -4.5859375, -4.4140625, -4.2421875, -4.0703125, -3.8984375, -3.7265625, -3.5546875, -3.3828125, -3.2109375, -3.0390625, -2.8671875, -2.6953125, -2.5234375, -2.3515625, -2.1796875, -2.0078125, -1.8359375, -1.6640625, -1.4921875, -1.3203125, -1.1484375, -0.9765625, -0.8046875, -0.6328125, -0.4609375, -0.2890625, -0.1171875, 0.0546875, 0.2265625, 0.3984375, 0.5703125, 0.7421875, 0.9140625, 1.0859375, 1.2578125, 1.4296875, 1.6015625, 1.7734375, 1.9453125, 2.1171875, 2.2890625, 2.4609375, 2.6328125, 2.8046875, 2.9765625, 3.1484375, 3.3203125, 3.4921875, 3.6640625, 3.8359375, 4.0078125, 4.1796875, 4.3515625, 4.5234375, 4.6953125, 4.8671875, 5.0390625, 5.2109375, 5.3828125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 3.0, 8.0, 6.0, 6.0, 9.0, 13.0, 7.0, 13.0, 13.0, 18.0, 26.0, 25.0, 21.0, 34.0, 51.0, 68.0, 120.0, 153.0, 103.0, 41.0, 39.0, 36.0, 24.0, 19.0, 24.0, 11.0, 22.0, 14.0, 7.0, 9.0, 5.0, 7.0, 9.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5758209228515625, -0.557403564453125, -0.5389862060546875, -0.52056884765625, -0.5021514892578125, -0.483734130859375, -0.4653167724609375, -0.4468994140625, -0.4284820556640625, -0.410064697265625, -0.3916473388671875, -0.37322998046875, -0.3548126220703125, -0.336395263671875, -0.3179779052734375, -0.299560546875, -0.2811431884765625, -0.262725830078125, -0.2443084716796875, -0.22589111328125, -0.2074737548828125, -0.189056396484375, -0.1706390380859375, -0.1522216796875, -0.1338043212890625, -0.115386962890625, -0.0969696044921875, -0.07855224609375, -0.0601348876953125, -0.041717529296875, -0.0233001708984375, -0.0048828125, 0.0135345458984375, 0.031951904296875, 0.0503692626953125, 0.06878662109375, 0.0872039794921875, 0.105621337890625, 0.1240386962890625, 0.1424560546875, 0.1608734130859375, 0.179290771484375, 0.1977081298828125, 0.21612548828125, 0.2345428466796875, 0.252960205078125, 0.2713775634765625, 0.289794921875, 0.3082122802734375, 0.326629638671875, 0.3450469970703125, 0.36346435546875, 0.3818817138671875, 0.400299072265625, 0.4187164306640625, 0.4371337890625, 0.4555511474609375, 0.473968505859375, 0.4923858642578125, 0.51080322265625, 0.5292205810546875, 0.547637939453125, 0.5660552978515625, 0.58447265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 3.0, 5.0, 7.0, 10.0, 7.0, 4.0, 8.0, 8.0, 18.0, 13.0, 16.0, 23.0, 22.0, 34.0, 52.0, 63.0, 99.0, 199.0, 1043114.0, 4290.0, 183.0, 84.0, 66.0, 37.0, 32.0, 32.0, 18.0, 13.0, 12.0, 8.0, 15.0, 9.0, 8.0, 5.0, 7.0, 2.0, 10.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.071533203125, -17.48681640625, -16.902099609375, -16.3173828125, -15.732666015625, -15.14794921875, -14.563232421875, -13.978515625, -13.393798828125, -12.80908203125, -12.224365234375, -11.6396484375, -11.054931640625, -10.47021484375, -9.885498046875, -9.30078125, -8.716064453125, -8.13134765625, -7.546630859375, -6.9619140625, -6.377197265625, -5.79248046875, -5.207763671875, -4.623046875, -4.038330078125, -3.45361328125, -2.868896484375, -2.2841796875, -1.699462890625, -1.11474609375, -0.530029296875, 0.0546875, 0.639404296875, 1.22412109375, 1.808837890625, 2.3935546875, 2.978271484375, 3.56298828125, 4.147705078125, 4.732421875, 5.317138671875, 5.90185546875, 6.486572265625, 7.0712890625, 7.656005859375, 8.24072265625, 8.825439453125, 9.41015625, 9.994873046875, 10.57958984375, 11.164306640625, 11.7490234375, 12.333740234375, 12.91845703125, 13.503173828125, 14.087890625, 14.672607421875, 15.25732421875, 15.842041015625, 16.4267578125, 17.011474609375, 17.59619140625, 18.180908203125, 18.765625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1019.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28519344329833984, 0.21804159879684448, 0.7212766408920288, 1.2245116233825684, 1.7277467250823975, 2.2309818267822266, 2.7342166900634766, 3.2374517917633057, 3.7406868934631348, 4.243921756744385, 4.747157096862793, 5.250391960144043, 5.753626823425293, 6.256862163543701, 6.760097026824951, 7.263332366943359, 7.766567230224609, 8.26980209350586, 8.77303695678711, 9.27627182006836, 9.779507637023926, 10.282742500305176, 10.785977363586426, 11.289212226867676, 11.792448043823242, 12.295682907104492, 12.798917770385742, 13.302152633666992, 13.805388450622559, 14.308623313903809, 14.811858177185059, 15.315093040466309, 15.818326950073242, 16.321561813354492, 16.824796676635742, 17.328031539916992, 17.831266403198242, 18.334503173828125, 18.837738037109375, 19.340972900390625, 19.844207763671875, 20.347442626953125, 20.850677490234375, 21.353912353515625, 21.857147216796875, 22.360382080078125, 22.863616943359375, 23.366853713989258, 23.870086669921875, 24.373321533203125, 24.876556396484375, 25.379791259765625, 25.883026123046875, 26.386260986328125, 26.889495849609375, 27.392732620239258, 27.895967483520508, 28.399202346801758, 28.902437210083008, 29.405672073364258, 29.908906936645508, 30.41214370727539, 30.91537857055664, 31.41861343383789, 31.92184829711914]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 5.0, 3.0, 4.0, 9.0, 5.0, 9.0, 8.0, 18.0, 20.0, 14.0, 16.0, 13.0, 28.0, 31.0, 24.0, 19.0, 41.0, 30.0, 36.0, 36.0, 27.0, 25.0, 33.0, 37.0, 43.0, 41.0, 35.0, 31.0, 30.0, 34.0, 30.0, 34.0, 27.0, 23.0, 24.0, 16.0, 26.0, 30.0, 11.0, 13.0, 14.0, 3.0, 11.0, 7.0, 8.0, 7.0, 5.0, 4.0, 2.0, 0.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2132807970046997, -1.1686363220214844, -1.1239919662475586, -1.0793474912643433, -1.0347031354904175, -0.9900586605072021, -0.9454142451286316, -0.900769829750061, -0.8561253547668457, -0.8114809393882751, -0.7668365240097046, -0.7221920490264893, -0.6775476336479187, -0.6329032182693481, -0.5882588028907776, -0.543614387512207, -0.4989699721336365, -0.4543255567550659, -0.409681111574173, -0.3650366961956024, -0.3203922510147095, -0.2757478356361389, -0.23110342025756836, -0.18645897507667542, -0.14181455969810486, -0.09717012941837311, -0.052525706589221954, -0.0078812837600708, 0.03676314651966095, 0.0814075767993927, 0.12605199217796326, 0.1706964373588562, 0.21534085273742676, 0.2599852681159973, 0.30462971329689026, 0.3492741286754608, 0.39391857385635376, 0.4385629892349243, 0.4832074046134949, 0.5278518199920654, 0.5724962949752808, 0.6171407103538513, 0.6617851257324219, 0.7064296007156372, 0.7510740160942078, 0.7957184314727783, 0.8403628468513489, 0.8850072622299194, 0.92965167760849, 0.9742960929870605, 1.0189405679702759, 1.0635849237442017, 1.108229398727417, 1.1528737545013428, 1.197518229484558, 1.2421627044677734, 1.2868070602416992, 1.3314515352249146, 1.3760958909988403, 1.4207403659820557, 1.4653847217559814, 1.5100291967391968, 1.554673671722412, 1.599318027496338, 1.6439625024795532]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 6.0, 3.0, 7.0, 3.0, 6.0, 11.0, 9.0, 21.0, 14.0, 17.0, 23.0, 25.0, 34.0, 26.0, 36.0, 34.0, 41.0, 55.0, 46.0, 48.0, 48.0, 45.0, 55.0, 46.0, 41.0, 38.0, 38.0, 33.0, 30.0, 23.0, 23.0, 16.0, 19.0, 9.0, 17.0, 12.0, 5.0, 6.0, 10.0, 7.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.15625, -39.7314453125, -38.306640625, -36.8818359375, -35.45703125, -34.0322265625, -32.607421875, -31.1826171875, -29.7578125, -28.3330078125, -26.908203125, -25.4833984375, -24.05859375, -22.6337890625, -21.208984375, -19.7841796875, -18.359375, -16.9345703125, -15.509765625, -14.0849609375, -12.66015625, -11.2353515625, -9.810546875, -8.3857421875, -6.9609375, -5.5361328125, -4.111328125, -2.6865234375, -1.26171875, 0.1630859375, 1.587890625, 3.0126953125, 4.4375, 5.8623046875, 7.287109375, 8.7119140625, 10.13671875, 11.5615234375, 12.986328125, 14.4111328125, 15.8359375, 17.2607421875, 18.685546875, 20.1103515625, 21.53515625, 22.9599609375, 24.384765625, 25.8095703125, 27.234375, 28.6591796875, 30.083984375, 31.5087890625, 32.93359375, 34.3583984375, 35.783203125, 37.2080078125, 38.6328125, 40.0576171875, 41.482421875, 42.9072265625, 44.33203125, 45.7568359375, 47.181640625, 48.6064453125, 50.03125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 10.0, 9.0, 22.0, 31.0, 23.0, 41.0, 50.0, 79.0, 122.0, 141.0, 196.0, 250.0, 358.0, 549.0, 704.0, 1061.0, 1611.0, 2588.0, 5088.0, 20042.0, 549453.0, 435437.0, 17986.0, 4935.0, 2542.0, 1633.0, 993.0, 748.0, 518.0, 354.0, 242.0, 190.0, 146.0, 111.0, 80.0, 55.0, 39.0, 25.0, 24.0, 20.0, 17.0, 8.0, 7.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-80.5625, -78.19140625, -75.8203125, -73.44921875, -71.078125, -68.70703125, -66.3359375, -63.96484375, -61.59375, -59.22265625, -56.8515625, -54.48046875, -52.109375, -49.73828125, -47.3671875, -44.99609375, -42.625, -40.25390625, -37.8828125, -35.51171875, -33.140625, -30.76953125, -28.3984375, -26.02734375, -23.65625, -21.28515625, -18.9140625, -16.54296875, -14.171875, -11.80078125, -9.4296875, -7.05859375, -4.6875, -2.31640625, 0.0546875, 2.42578125, 4.796875, 7.16796875, 9.5390625, 11.91015625, 14.28125, 16.65234375, 19.0234375, 21.39453125, 23.765625, 26.13671875, 28.5078125, 30.87890625, 33.25, 35.62109375, 37.9921875, 40.36328125, 42.734375, 45.10546875, 47.4765625, 49.84765625, 52.21875, 54.58984375, 56.9609375, 59.33203125, 61.703125, 64.07421875, 66.4453125, 68.81640625, 71.1875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 16.0, 10.0, 11.0, 20.0, 24.0, 15.0, 25.0, 19.0, 17.0, 31.0, 26.0, 24.0, 43.0, 33.0, 33.0, 30.0, 39.0, 58.0, 193.0, 1884.0, 70.0, 29.0, 31.0, 37.0, 48.0, 43.0, 30.0, 29.0, 22.0, 22.0, 18.0, 13.0, 18.0, 18.0, 16.0, 10.0, 2.0, 7.0, 10.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.9375, -123.7060546875, -119.474609375, -115.2431640625, -111.01171875, -106.7802734375, -102.548828125, -98.3173828125, -94.0859375, -89.8544921875, -85.623046875, -81.3916015625, -77.16015625, -72.9287109375, -68.697265625, -64.4658203125, -60.234375, -56.0029296875, -51.771484375, -47.5400390625, -43.30859375, -39.0771484375, -34.845703125, -30.6142578125, -26.3828125, -22.1513671875, -17.919921875, -13.6884765625, -9.45703125, -5.2255859375, -0.994140625, 3.2373046875, 7.46875, 11.7001953125, 15.931640625, 20.1630859375, 24.39453125, 28.6259765625, 32.857421875, 37.0888671875, 41.3203125, 45.5517578125, 49.783203125, 54.0146484375, 58.24609375, 62.4775390625, 66.708984375, 70.9404296875, 75.171875, 79.4033203125, 83.634765625, 87.8662109375, 92.09765625, 96.3291015625, 100.560546875, 104.7919921875, 109.0234375, 113.2548828125, 117.486328125, 121.7177734375, 125.94921875, 130.1806640625, 134.412109375, 138.6435546875, 142.875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 4.0, 10.0, 7.0, 5.0, 17.0, 22.0, 27.0, 30.0, 51.0, 53.0, 98.0, 185.0, 330.0, 730.0, 1636.0, 4461.0, 16418.0, 3093897.0, 19484.0, 4690.0, 1700.0, 804.0, 376.0, 221.0, 131.0, 71.0, 52.0, 42.0, 33.0, 35.0, 21.0, 10.0, 18.0, 5.0, 2.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.375, -240.318359375, -231.26171875, -222.205078125, -213.1484375, -204.091796875, -195.03515625, -185.978515625, -176.921875, -167.865234375, -158.80859375, -149.751953125, -140.6953125, -131.638671875, -122.58203125, -113.525390625, -104.46875, -95.412109375, -86.35546875, -77.298828125, -68.2421875, -59.185546875, -50.12890625, -41.072265625, -32.015625, -22.958984375, -13.90234375, -4.845703125, 4.2109375, 13.267578125, 22.32421875, 31.380859375, 40.4375, 49.494140625, 58.55078125, 67.607421875, 76.6640625, 85.720703125, 94.77734375, 103.833984375, 112.890625, 121.947265625, 131.00390625, 140.060546875, 149.1171875, 158.173828125, 167.23046875, 176.287109375, 185.34375, 194.400390625, 203.45703125, 212.513671875, 221.5703125, 230.626953125, 239.68359375, 248.740234375, 257.796875, 266.853515625, 275.91015625, 284.966796875, 294.0234375, 303.080078125, 312.13671875, 321.193359375, 330.25]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 29.0, 633.0, 347.0, 11.0], "bins": [-2950.283203125, -2902.640625, -2854.998046875, -2807.35546875, -2759.712646484375, -2712.070068359375, -2664.427490234375, -2616.784912109375, -2569.142333984375, -2521.499755859375, -2473.857177734375, -2426.214599609375, -2378.57177734375, -2330.92919921875, -2283.28662109375, -2235.64404296875, -2188.00146484375, -2140.35888671875, -2092.71630859375, -2045.0736083984375, -1997.4310302734375, -1949.7884521484375, -1902.145751953125, -1854.503173828125, -1806.8604736328125, -1759.2178955078125, -1711.5751953125, -1663.9326171875, -1616.2900390625, -1568.6474609375, -1521.0047607421875, -1473.3621826171875, -1425.7197265625, -1378.0771484375, -1330.4344482421875, -1282.7918701171875, -1235.1492919921875, -1187.5067138671875, -1139.864013671875, -1092.221435546875, -1044.578857421875, -996.9362182617188, -949.2936401367188, -901.6510009765625, -854.0084228515625, -806.3657836914062, -758.72314453125, -711.08056640625, -663.4379272460938, -615.7952880859375, -568.1527099609375, -520.5100708007812, -472.86749267578125, -425.224853515625, -377.5822448730469, -329.93963623046875, -282.2970275878906, -234.6544189453125, -187.01181030273438, -139.3691864013672, -91.72657775878906, -44.08396911621094, 3.55865478515625, 51.201263427734375, 98.84387969970703]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 4.0, 5.0, 12.0, 9.0, 20.0, 19.0, 23.0, 19.0, 33.0, 27.0, 38.0, 30.0, 38.0, 37.0, 36.0, 40.0, 34.0, 39.0, 55.0, 48.0, 46.0, 39.0, 43.0, 48.0, 38.0, 46.0, 23.0, 28.0, 22.0, 23.0, 14.0, 13.0, 11.0, 11.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-507.0089416503906, -491.6144104003906, -476.2198791503906, -460.82537841796875, -445.43084716796875, -430.03631591796875, -414.64178466796875, -399.24725341796875, -383.8527526855469, -368.4582214355469, -353.0636901855469, -337.669189453125, -322.274658203125, -306.880126953125, -291.485595703125, -276.091064453125, -260.696533203125, -245.302001953125, -229.90748596191406, -214.51295471191406, -199.11843872070312, -183.72390747070312, -168.32937622070312, -152.9348602294922, -137.54034423828125, -122.14582061767578, -106.75129699707031, -91.35676574707031, -75.96224975585938, -60.567718505859375, -45.173194885253906, -29.778671264648438, -14.3841552734375, 1.0103693008422852, 16.40489387512207, 31.799419403076172, 47.19394302368164, 62.588470458984375, 77.98299407958984, 93.37751770019531, 108.77204132080078, 124.16656494140625, 139.56109619140625, 154.9556121826172, 170.3501434326172, 185.74465942382812, 201.13919067382812, 216.53372192382812, 231.92823791503906, 247.32276916503906, 262.71728515625, 278.11181640625, 293.50634765625, 308.90087890625, 324.2953796386719, 339.6899108886719, 355.0844421386719, 370.4789733886719, 385.8735046386719, 401.26800537109375, 416.66253662109375, 432.05706787109375, 447.45159912109375, 462.84613037109375, 478.2406311035156]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 2.0, 5.0, 9.0, 7.0, 18.0, 19.0, 15.0, 23.0, 19.0, 23.0, 39.0, 28.0, 46.0, 31.0, 48.0, 49.0, 41.0, 59.0, 44.0, 60.0, 41.0, 35.0, 40.0, 36.0, 42.0, 32.0, 23.0, 27.0, 18.0, 16.0, 16.0, 16.0, 15.0, 6.0, 4.0, 7.0, 10.0, 7.0, 5.0, 3.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.4375, -39.9765625, -38.515625, -37.0546875, -35.59375, -34.1328125, -32.671875, -31.2109375, -29.75, -28.2890625, -26.828125, -25.3671875, -23.90625, -22.4453125, -20.984375, -19.5234375, -18.0625, -16.6015625, -15.140625, -13.6796875, -12.21875, -10.7578125, -9.296875, -7.8359375, -6.375, -4.9140625, -3.453125, -1.9921875, -0.53125, 0.9296875, 2.390625, 3.8515625, 5.3125, 6.7734375, 8.234375, 9.6953125, 11.15625, 12.6171875, 14.078125, 15.5390625, 17.0, 18.4609375, 19.921875, 21.3828125, 22.84375, 24.3046875, 25.765625, 27.2265625, 28.6875, 30.1484375, 31.609375, 33.0703125, 34.53125, 35.9921875, 37.453125, 38.9140625, 40.375, 41.8359375, 43.296875, 44.7578125, 46.21875, 47.6796875, 49.140625, 50.6015625, 52.0625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 5.0, 4.0, 12.0, 18.0, 11.0, 22.0, 36.0, 48.0, 70.0, 100.0, 118.0, 153.0, 210.0, 289.0, 381.0, 501.0, 702.0, 984.0, 1375.0, 1711.0, 2548.0, 3537.0, 5037.0, 7798.0, 13361.0, 37158.0, 273932.0, 2604198.0, 1080139.0, 107831.0, 19370.0, 10031.0, 6383.0, 4462.0, 3149.0, 2176.0, 1692.0, 1118.0, 897.0, 698.0, 499.0, 381.0, 265.0, 208.0, 157.0, 119.0, 114.0, 82.0, 48.0, 34.0, 29.0, 20.0, 22.0, 13.0, 14.0, 8.0, 9.0, 4.0, 4.0, 1.0, 1.0], "bins": [-78.3125, -75.76953125, -73.2265625, -70.68359375, -68.140625, -65.59765625, -63.0546875, -60.51171875, -57.96875, -55.42578125, -52.8828125, -50.33984375, -47.796875, -45.25390625, -42.7109375, -40.16796875, -37.625, -35.08203125, -32.5390625, -29.99609375, -27.453125, -24.91015625, -22.3671875, -19.82421875, -17.28125, -14.73828125, -12.1953125, -9.65234375, -7.109375, -4.56640625, -2.0234375, 0.51953125, 3.0625, 5.60546875, 8.1484375, 10.69140625, 13.234375, 15.77734375, 18.3203125, 20.86328125, 23.40625, 25.94921875, 28.4921875, 31.03515625, 33.578125, 36.12109375, 38.6640625, 41.20703125, 43.75, 46.29296875, 48.8359375, 51.37890625, 53.921875, 56.46484375, 59.0078125, 61.55078125, 64.09375, 66.63671875, 69.1796875, 71.72265625, 74.265625, 76.80859375, 79.3515625, 81.89453125, 84.4375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 1.0, 7.0, 3.0, 9.0, 11.0, 14.0, 7.0, 11.0, 15.0, 25.0, 37.0, 47.0, 59.0, 104.0, 120.0, 246.0, 403.0, 720.0, 785.0, 568.0, 262.0, 177.0, 132.0, 72.0, 60.0, 33.0, 40.0, 21.0, 11.0, 8.0, 13.0, 9.0, 6.0, 6.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-127.75, -124.0224609375, -120.294921875, -116.5673828125, -112.83984375, -109.1123046875, -105.384765625, -101.6572265625, -97.9296875, -94.2021484375, -90.474609375, -86.7470703125, -83.01953125, -79.2919921875, -75.564453125, -71.8369140625, -68.109375, -64.3818359375, -60.654296875, -56.9267578125, -53.19921875, -49.4716796875, -45.744140625, -42.0166015625, -38.2890625, -34.5615234375, -30.833984375, -27.1064453125, -23.37890625, -19.6513671875, -15.923828125, -12.1962890625, -8.46875, -4.7412109375, -1.013671875, 2.7138671875, 6.44140625, 10.1689453125, 13.896484375, 17.6240234375, 21.3515625, 25.0791015625, 28.806640625, 32.5341796875, 36.26171875, 39.9892578125, 43.716796875, 47.4443359375, 51.171875, 54.8994140625, 58.626953125, 62.3544921875, 66.08203125, 69.8095703125, 73.537109375, 77.2646484375, 80.9921875, 84.7197265625, 88.447265625, 92.1748046875, 95.90234375, 99.6298828125, 103.357421875, 107.0849609375, 110.8125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 12.0, 10.0, 11.0, 11.0, 28.0, 35.0, 50.0, 57.0, 84.0, 182.0, 283.0, 541.0, 1093.0, 2418.0, 5485.0, 14331.0, 47760.0, 1405980.0, 2636025.0, 53302.0, 15593.0, 5872.0, 2486.0, 1194.0, 582.0, 322.0, 180.0, 99.0, 58.0, 43.0, 34.0, 18.0, 19.0, 11.0, 16.0, 6.0, 12.0, 7.0, 4.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-317.5, -308.171875, -298.84375, -289.515625, -280.1875, -270.859375, -261.53125, -252.203125, -242.875, -233.546875, -224.21875, -214.890625, -205.5625, -196.234375, -186.90625, -177.578125, -168.25, -158.921875, -149.59375, -140.265625, -130.9375, -121.609375, -112.28125, -102.953125, -93.625, -84.296875, -74.96875, -65.640625, -56.3125, -46.984375, -37.65625, -28.328125, -19.0, -9.671875, -0.34375, 8.984375, 18.3125, 27.640625, 36.96875, 46.296875, 55.625, 64.953125, 74.28125, 83.609375, 92.9375, 102.265625, 111.59375, 120.921875, 130.25, 139.578125, 148.90625, 158.234375, 167.5625, 176.890625, 186.21875, 195.546875, 204.875, 214.203125, 223.53125, 232.859375, 242.1875, 251.515625, 260.84375, 270.171875, 279.5]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 7.0, 5.0, 9.0, 3.0, 9.0, 8.0, 9.0, 16.0, 32.0, 44.0, 71.0, 102.0, 167.0, 173.0, 103.0, 77.0, 43.0, 28.0, 23.0, 20.0, 12.0, 9.0, 11.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-393.4310607910156, -377.6955871582031, -361.96014404296875, -346.22467041015625, -330.48919677734375, -314.7537536621094, -299.0182800292969, -283.2828369140625, -267.54736328125, -251.81190490722656, -236.07644653320312, -220.34097290039062, -204.6055145263672, -188.87005615234375, -173.13458251953125, -157.3991241455078, -141.66366577148438, -125.92820739746094, -110.19274139404297, -94.457275390625, -78.72181701660156, -62.986358642578125, -47.250892639160156, -31.515426635742188, -15.77996826171875, -0.044506072998046875, 15.690956115722656, 31.42641830444336, 47.16188049316406, 62.8973388671875, 78.63280487060547, 94.36827087402344, 110.103759765625, 125.83921813964844, 141.57467651367188, 157.31015014648438, 173.0456085205078, 188.78106689453125, 204.51654052734375, 220.2519989013672, 235.98745727539062, 251.72291564941406, 267.4583740234375, 283.19384765625, 298.9293212890625, 314.6647644042969, 330.4002380371094, 346.13568115234375, 361.87115478515625, 377.60662841796875, 393.3420715332031, 409.0775451660156, 424.81298828125, 440.5484619140625, 456.283935546875, 472.0194091796875, 487.7548522949219, 503.4903259277344, 519.2257690429688, 534.9612426757812, 550.6967163085938, 566.43212890625, 582.1676025390625, 597.903076171875, 613.6385498046875]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 9.0, 5.0, 8.0, 5.0, 8.0, 15.0, 16.0, 13.0, 16.0, 21.0, 23.0, 26.0, 34.0, 37.0, 36.0, 40.0, 36.0, 39.0, 39.0, 38.0, 40.0, 43.0, 42.0, 37.0, 44.0, 34.0, 36.0, 26.0, 28.0, 33.0, 34.0, 27.0, 19.0, 23.0, 12.0, 14.0, 13.0, 7.0, 9.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-350.2659606933594, -339.25714111328125, -328.2483215332031, -317.239501953125, -306.23065185546875, -295.2218322753906, -284.2130126953125, -273.2041931152344, -262.19537353515625, -251.18655395507812, -240.17771911621094, -229.1688995361328, -218.1600799560547, -207.1512451171875, -196.14242553710938, -185.13360595703125, -174.12477111816406, -163.11595153808594, -152.10711669921875, -141.09829711914062, -130.0894775390625, -119.08065032958984, -108.07182312011719, -97.06300354003906, -86.0541763305664, -75.04534912109375, -64.03652954101562, -53.02770233154297, -42.01887893676758, -31.010055541992188, -20.00122833251953, -8.992408752441406, 2.01641845703125, 13.025242805480957, 24.034067153930664, 35.04289245605469, 46.05171585083008, 57.06053924560547, 68.06936645507812, 79.07818603515625, 90.0870132446289, 101.09584045410156, 112.10466003417969, 123.11348724365234, 134.122314453125, 145.13113403320312, 156.13995361328125, 167.14877319335938, 178.15760803222656, 189.1664276123047, 200.17526245117188, 211.18408203125, 222.19290161132812, 233.20172119140625, 244.21055603027344, 255.21937561035156, 266.22821044921875, 277.2370300292969, 288.245849609375, 299.25469970703125, 310.2635192871094, 321.2723388671875, 332.2811584472656, 343.28997802734375, 354.2987976074219]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 2.0, 2.0, 6.0, 6.0, 11.0, 16.0, 10.0, 14.0, 21.0, 13.0, 25.0, 32.0, 34.0, 41.0, 31.0, 55.0, 51.0, 51.0, 44.0, 35.0, 51.0, 53.0, 41.0, 35.0, 29.0, 36.0, 46.0, 32.0, 22.0, 21.0, 20.0, 14.0, 16.0, 8.0, 6.0, 17.0, 11.0, 7.0, 6.0, 5.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-45.625, -44.19140625, -42.7578125, -41.32421875, -39.890625, -38.45703125, -37.0234375, -35.58984375, -34.15625, -32.72265625, -31.2890625, -29.85546875, -28.421875, -26.98828125, -25.5546875, -24.12109375, -22.6875, -21.25390625, -19.8203125, -18.38671875, -16.953125, -15.51953125, -14.0859375, -12.65234375, -11.21875, -9.78515625, -8.3515625, -6.91796875, -5.484375, -4.05078125, -2.6171875, -1.18359375, 0.25, 1.68359375, 3.1171875, 4.55078125, 5.984375, 7.41796875, 8.8515625, 10.28515625, 11.71875, 13.15234375, 14.5859375, 16.01953125, 17.453125, 18.88671875, 20.3203125, 21.75390625, 23.1875, 24.62109375, 26.0546875, 27.48828125, 28.921875, 30.35546875, 31.7890625, 33.22265625, 34.65625, 36.08984375, 37.5234375, 38.95703125, 40.390625, 41.82421875, 43.2578125, 44.69140625, 46.125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 9.0, 12.0, 19.0, 17.0, 45.0, 42.0, 57.0, 105.0, 146.0, 233.0, 295.0, 477.0, 682.0, 1023.0, 1591.0, 2606.0, 4349.0, 8575.0, 21662.0, 88365.0, 636567.0, 216233.0, 38029.0, 12547.0, 5854.0, 3163.0, 2009.0, 1290.0, 833.0, 568.0, 350.0, 225.0, 181.0, 109.0, 99.0, 60.0, 27.0, 32.0, 21.0, 16.0, 6.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.825439453125, -19.13525390625, -18.445068359375, -17.7548828125, -17.064697265625, -16.37451171875, -15.684326171875, -14.994140625, -14.303955078125, -13.61376953125, -12.923583984375, -12.2333984375, -11.543212890625, -10.85302734375, -10.162841796875, -9.47265625, -8.782470703125, -8.09228515625, -7.402099609375, -6.7119140625, -6.021728515625, -5.33154296875, -4.641357421875, -3.951171875, -3.260986328125, -2.57080078125, -1.880615234375, -1.1904296875, -0.500244140625, 0.18994140625, 0.880126953125, 1.5703125, 2.260498046875, 2.95068359375, 3.640869140625, 4.3310546875, 5.021240234375, 5.71142578125, 6.401611328125, 7.091796875, 7.781982421875, 8.47216796875, 9.162353515625, 9.8525390625, 10.542724609375, 11.23291015625, 11.923095703125, 12.61328125, 13.303466796875, 13.99365234375, 14.683837890625, 15.3740234375, 16.064208984375, 16.75439453125, 17.444580078125, 18.134765625, 18.824951171875, 19.51513671875, 20.205322265625, 20.8955078125, 21.585693359375, 22.27587890625, 22.966064453125, 23.65625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 4.0, 9.0, 11.0, 11.0, 15.0, 14.0, 20.0, 20.0, 24.0, 20.0, 26.0, 31.0, 23.0, 27.0, 37.0, 43.0, 29.0, 35.0, 46.0, 1067.0, 43.0, 52.0, 42.0, 42.0, 31.0, 24.0, 32.0, 38.0, 23.0, 27.0, 26.0, 15.0, 19.0, 19.0, 4.0, 12.0, 19.0, 10.0, 7.0, 7.0, 3.0, 4.0, 0.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-29.5625, -28.69140625, -27.8203125, -26.94921875, -26.078125, -25.20703125, -24.3359375, -23.46484375, -22.59375, -21.72265625, -20.8515625, -19.98046875, -19.109375, -18.23828125, -17.3671875, -16.49609375, -15.625, -14.75390625, -13.8828125, -13.01171875, -12.140625, -11.26953125, -10.3984375, -9.52734375, -8.65625, -7.78515625, -6.9140625, -6.04296875, -5.171875, -4.30078125, -3.4296875, -2.55859375, -1.6875, -0.81640625, 0.0546875, 0.92578125, 1.796875, 2.66796875, 3.5390625, 4.41015625, 5.28125, 6.15234375, 7.0234375, 7.89453125, 8.765625, 9.63671875, 10.5078125, 11.37890625, 12.25, 13.12109375, 13.9921875, 14.86328125, 15.734375, 16.60546875, 17.4765625, 18.34765625, 19.21875, 20.08984375, 20.9609375, 21.83203125, 22.703125, 23.57421875, 24.4453125, 25.31640625, 26.1875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 7.0, 17.0, 14.0, 19.0, 35.0, 48.0, 59.0, 106.0, 164.0, 273.0, 370.0, 674.0, 1134.0, 2055.0, 3603.0, 6621.0, 14289.0, 33856.0, 97855.0, 553942.0, 1206044.0, 107822.0, 36656.0, 15321.0, 7174.0, 3787.0, 2045.0, 1210.0, 715.0, 433.0, 294.0, 161.0, 122.0, 73.0, 44.0, 28.0, 18.0, 14.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.90679931640625, -6.6768798828125, -6.44696044921875, -6.217041015625, -5.98712158203125, -5.7572021484375, -5.52728271484375, -5.29736328125, -5.06744384765625, -4.8375244140625, -4.60760498046875, -4.377685546875, -4.14776611328125, -3.9178466796875, -3.68792724609375, -3.4580078125, -3.22808837890625, -2.9981689453125, -2.76824951171875, -2.538330078125, -2.30841064453125, -2.0784912109375, -1.84857177734375, -1.61865234375, -1.38873291015625, -1.1588134765625, -0.92889404296875, -0.698974609375, -0.46905517578125, -0.2391357421875, -0.00921630859375, 0.220703125, 0.45062255859375, 0.6805419921875, 0.91046142578125, 1.140380859375, 1.37030029296875, 1.6002197265625, 1.83013916015625, 2.06005859375, 2.28997802734375, 2.5198974609375, 2.74981689453125, 2.979736328125, 3.20965576171875, 3.4395751953125, 3.66949462890625, 3.8994140625, 4.12933349609375, 4.3592529296875, 4.58917236328125, 4.819091796875, 5.04901123046875, 5.2789306640625, 5.50885009765625, 5.73876953125, 5.96868896484375, 6.1986083984375, 6.42852783203125, 6.658447265625, 6.88836669921875, 7.1182861328125, 7.34820556640625, 7.578125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 4.0, 9.0, 14.0, 15.0, 21.0, 16.0, 27.0, 34.0, 47.0, 68.0, 184.0, 198.0, 75.0, 55.0, 27.0, 25.0, 14.0, 19.0, 9.0, 19.0, 12.0, 12.0, 9.0, 9.0, 9.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0986328125, -1.064361572265625, -1.03009033203125, -0.995819091796875, -0.9615478515625, -0.927276611328125, -0.89300537109375, -0.858734130859375, -0.824462890625, -0.790191650390625, -0.75592041015625, -0.721649169921875, -0.6873779296875, -0.653106689453125, -0.61883544921875, -0.584564208984375, -0.55029296875, -0.516021728515625, -0.48175048828125, -0.447479248046875, -0.4132080078125, -0.378936767578125, -0.34466552734375, -0.310394287109375, -0.276123046875, -0.241851806640625, -0.20758056640625, -0.173309326171875, -0.1390380859375, -0.104766845703125, -0.07049560546875, -0.036224365234375, -0.001953125, 0.032318115234375, 0.06658935546875, 0.100860595703125, 0.1351318359375, 0.169403076171875, 0.20367431640625, 0.237945556640625, 0.272216796875, 0.306488037109375, 0.34075927734375, 0.375030517578125, 0.4093017578125, 0.443572998046875, 0.47784423828125, 0.512115478515625, 0.54638671875, 0.580657958984375, 0.61492919921875, 0.649200439453125, 0.6834716796875, 0.717742919921875, 0.75201416015625, 0.786285400390625, 0.820556640625, 0.854827880859375, 0.88909912109375, 0.923370361328125, 0.9576416015625, 0.991912841796875, 1.02618408203125, 1.060455322265625, 1.0947265625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 9.0, 7.0, 15.0, 11.0, 19.0, 12.0, 22.0, 19.0, 37.0, 65.0, 110.0, 159.0, 1022565.0, 24972.0, 183.0, 68.0, 59.0, 43.0, 33.0, 17.0, 18.0, 14.0, 10.0, 6.0, 5.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.0, -33.90478515625, -32.8095703125, -31.71435546875, -30.619140625, -29.52392578125, -28.4287109375, -27.33349609375, -26.23828125, -25.14306640625, -24.0478515625, -22.95263671875, -21.857421875, -20.76220703125, -19.6669921875, -18.57177734375, -17.4765625, -16.38134765625, -15.2861328125, -14.19091796875, -13.095703125, -12.00048828125, -10.9052734375, -9.81005859375, -8.71484375, -7.61962890625, -6.5244140625, -5.42919921875, -4.333984375, -3.23876953125, -2.1435546875, -1.04833984375, 0.046875, 1.14208984375, 2.2373046875, 3.33251953125, 4.427734375, 5.52294921875, 6.6181640625, 7.71337890625, 8.80859375, 9.90380859375, 10.9990234375, 12.09423828125, 13.189453125, 14.28466796875, 15.3798828125, 16.47509765625, 17.5703125, 18.66552734375, 19.7607421875, 20.85595703125, 21.951171875, 23.04638671875, 24.1416015625, 25.23681640625, 26.33203125, 27.42724609375, 28.5224609375, 29.61767578125, 30.712890625, 31.80810546875, 32.9033203125, 33.99853515625, 35.09375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1019.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4909548759460449, 0.4196431040763855, 1.330241084098816, 2.2408390045166016, 3.1514370441436768, 4.062035083770752, 4.972632884979248, 5.883231163024902, 6.793828964233398, 7.7044267654418945, 8.61502456665039, 9.525623321533203, 10.4362211227417, 11.346818923950195, 12.257416725158691, 13.168014526367188, 14.07861328125, 14.989211082458496, 15.899808883666992, 16.810407638549805, 17.721004486083984, 18.631603240966797, 19.54220199584961, 20.45279884338379, 21.36339569091797, 22.27399444580078, 23.18459129333496, 24.095190048217773, 25.005786895751953, 25.916385650634766, 26.826984405517578, 27.737581253051758, 28.64818000793457, 29.558778762817383, 30.469375610351562, 31.379974365234375, 32.29057312011719, 33.201171875, 34.11176681518555, 35.02236557006836, 35.93296432495117, 36.843563079833984, 37.7541618347168, 38.664756774902344, 39.575355529785156, 40.48595428466797, 41.39655303955078, 42.307151794433594, 43.21774673461914, 44.12834548950195, 45.038944244384766, 45.94953918457031, 46.860137939453125, 47.77073669433594, 48.68133544921875, 49.59193420410156, 50.502532958984375, 51.41313171386719, 52.32373046875, 53.23432540893555, 54.14492416381836, 55.05552291870117, 55.966121673583984, 56.8767204284668, 57.787315368652344]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 7.0, 8.0, 10.0, 11.0, 16.0, 17.0, 18.0, 24.0, 31.0, 29.0, 25.0, 26.0, 37.0, 32.0, 36.0, 32.0, 37.0, 28.0, 38.0, 24.0, 33.0, 47.0, 34.0, 48.0, 37.0, 40.0, 40.0, 24.0, 25.0, 20.0, 21.0, 23.0, 19.0, 16.0, 11.0, 13.0, 8.0, 4.0, 7.0, 4.0, 8.0, 5.0, 3.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4653775691986084, -2.3763115406036377, -2.287245273590088, -2.198179244995117, -2.1091132164001465, -2.020047187805176, -1.930980920791626, -1.8419148921966553, -1.752848744392395, -1.6637825965881348, -1.574716567993164, -1.4856504201889038, -1.3965842723846436, -1.3075182437896729, -1.2184520959854126, -1.1293859481811523, -1.0403199195861816, -0.9512538313865662, -0.8621877431869507, -0.7731215953826904, -0.684055507183075, -0.5949894189834595, -0.5059232711791992, -0.41685718297958374, -0.32779109477996826, -0.2387249916791916, -0.14965888857841492, -0.06059277057647705, 0.028473317623138428, 0.1175394058227539, 0.20660555362701416, 0.29567164182662964, 0.384737491607666, 0.4738035798072815, 0.562869668006897, 0.6519358158111572, 0.7410019040107727, 0.8300679922103882, 0.9191341400146484, 1.0082001686096191, 1.0972663164138794, 1.1863324642181396, 1.2753984928131104, 1.3644646406173706, 1.4535307884216309, 1.5425968170166016, 1.6316629648208618, 1.720729112625122, 1.8097951412200928, 1.898861289024353, 1.9879273176193237, 2.076993465423584, 2.1660594940185547, 2.2551255226135254, 2.344191789627075, 2.433257818222046, 2.5223240852355957, 2.6113901138305664, 2.700456380844116, 2.789522409439087, 2.8785884380340576, 2.9676547050476074, 3.056720733642578, 3.145786762237549, 3.2348527908325195]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 2.0, 2.0, 6.0, 6.0, 11.0, 16.0, 10.0, 13.0, 22.0, 13.0, 25.0, 31.0, 35.0, 40.0, 32.0, 54.0, 50.0, 52.0, 45.0, 35.0, 50.0, 52.0, 43.0, 35.0, 29.0, 35.0, 47.0, 32.0, 22.0, 21.0, 20.0, 14.0, 17.0, 7.0, 6.0, 17.0, 11.0, 7.0, 6.0, 5.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-45.65625, -44.22216796875, -42.7880859375, -41.35400390625, -39.919921875, -38.48583984375, -37.0517578125, -35.61767578125, -34.18359375, -32.74951171875, -31.3154296875, -29.88134765625, -28.447265625, -27.01318359375, -25.5791015625, -24.14501953125, -22.7109375, -21.27685546875, -19.8427734375, -18.40869140625, -16.974609375, -15.54052734375, -14.1064453125, -12.67236328125, -11.23828125, -9.80419921875, -8.3701171875, -6.93603515625, -5.501953125, -4.06787109375, -2.6337890625, -1.19970703125, 0.234375, 1.66845703125, 3.1025390625, 4.53662109375, 5.970703125, 7.40478515625, 8.8388671875, 10.27294921875, 11.70703125, 13.14111328125, 14.5751953125, 16.00927734375, 17.443359375, 18.87744140625, 20.3115234375, 21.74560546875, 23.1796875, 24.61376953125, 26.0478515625, 27.48193359375, 28.916015625, 30.35009765625, 31.7841796875, 33.21826171875, 34.65234375, 36.08642578125, 37.5205078125, 38.95458984375, 40.388671875, 41.82275390625, 43.2568359375, 44.69091796875, 46.125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 7.0, 13.0, 6.0, 14.0, 10.0, 11.0, 27.0, 26.0, 36.0, 49.0, 67.0, 95.0, 145.0, 223.0, 351.0, 607.0, 1313.0, 2557.0, 6024.0, 15537.0, 47509.0, 188545.0, 549225.0, 167659.0, 43141.0, 14325.0, 5835.0, 2423.0, 1100.0, 604.0, 343.0, 201.0, 133.0, 101.0, 56.0, 50.0, 41.0, 31.0, 25.0, 14.0, 13.0, 19.0, 12.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-23.59375, -22.866943359375, -22.14013671875, -21.413330078125, -20.6865234375, -19.959716796875, -19.23291015625, -18.506103515625, -17.779296875, -17.052490234375, -16.32568359375, -15.598876953125, -14.8720703125, -14.145263671875, -13.41845703125, -12.691650390625, -11.96484375, -11.238037109375, -10.51123046875, -9.784423828125, -9.0576171875, -8.330810546875, -7.60400390625, -6.877197265625, -6.150390625, -5.423583984375, -4.69677734375, -3.969970703125, -3.2431640625, -2.516357421875, -1.78955078125, -1.062744140625, -0.3359375, 0.390869140625, 1.11767578125, 1.844482421875, 2.5712890625, 3.298095703125, 4.02490234375, 4.751708984375, 5.478515625, 6.205322265625, 6.93212890625, 7.658935546875, 8.3857421875, 9.112548828125, 9.83935546875, 10.566162109375, 11.29296875, 12.019775390625, 12.74658203125, 13.473388671875, 14.2001953125, 14.927001953125, 15.65380859375, 16.380615234375, 17.107421875, 17.834228515625, 18.56103515625, 19.287841796875, 20.0146484375, 20.741455078125, 21.46826171875, 22.195068359375, 22.921875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 8.0, 7.0, 9.0, 13.0, 9.0, 12.0, 9.0, 14.0, 15.0, 14.0, 26.0, 35.0, 22.0, 37.0, 38.0, 27.0, 37.0, 40.0, 44.0, 54.0, 74.0, 1867.0, 170.0, 58.0, 41.0, 34.0, 39.0, 29.0, 40.0, 26.0, 29.0, 28.0, 23.0, 20.0, 8.0, 13.0, 16.0, 11.0, 15.0, 13.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-135.625, -131.48046875, -127.3359375, -123.19140625, -119.046875, -114.90234375, -110.7578125, -106.61328125, -102.46875, -98.32421875, -94.1796875, -90.03515625, -85.890625, -81.74609375, -77.6015625, -73.45703125, -69.3125, -65.16796875, -61.0234375, -56.87890625, -52.734375, -48.58984375, -44.4453125, -40.30078125, -36.15625, -32.01171875, -27.8671875, -23.72265625, -19.578125, -15.43359375, -11.2890625, -7.14453125, -3.0, 1.14453125, 5.2890625, 9.43359375, 13.578125, 17.72265625, 21.8671875, 26.01171875, 30.15625, 34.30078125, 38.4453125, 42.58984375, 46.734375, 50.87890625, 55.0234375, 59.16796875, 63.3125, 67.45703125, 71.6015625, 75.74609375, 79.890625, 84.03515625, 88.1796875, 92.32421875, 96.46875, 100.61328125, 104.7578125, 108.90234375, 113.046875, 117.19140625, 121.3359375, 125.48046875, 129.625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 14.0, 13.0, 12.0, 18.0, 23.0, 16.0, 20.0, 33.0, 55.0, 84.0, 75.0, 109.0, 136.0, 181.0, 346.0, 732.0, 3885.0, 2430475.0, 704096.0, 3389.0, 764.0, 339.0, 199.0, 132.0, 93.0, 92.0, 87.0, 58.0, 49.0, 24.0, 23.0, 22.0, 13.0, 14.0, 12.0, 10.0, 13.0, 8.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-256.5, -248.21875, -239.9375, -231.65625, -223.375, -215.09375, -206.8125, -198.53125, -190.25, -181.96875, -173.6875, -165.40625, -157.125, -148.84375, -140.5625, -132.28125, -124.0, -115.71875, -107.4375, -99.15625, -90.875, -82.59375, -74.3125, -66.03125, -57.75, -49.46875, -41.1875, -32.90625, -24.625, -16.34375, -8.0625, 0.21875, 8.5, 16.78125, 25.0625, 33.34375, 41.625, 49.90625, 58.1875, 66.46875, 74.75, 83.03125, 91.3125, 99.59375, 107.875, 116.15625, 124.4375, 132.71875, 141.0, 149.28125, 157.5625, 165.84375, 174.125, 182.40625, 190.6875, 198.96875, 207.25, 215.53125, 223.8125, 232.09375, 240.375, 248.65625, 256.9375, 265.21875, 273.5]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 75.0, 774.0, 162.0, 9.0], "bins": [-1643.2232666015625, -1616.5428466796875, -1589.8623046875, -1563.181884765625, -1536.50146484375, -1509.8209228515625, -1483.1405029296875, -1456.4600830078125, -1429.779541015625, -1403.09912109375, -1376.4185791015625, -1349.7381591796875, -1323.0577392578125, -1296.377197265625, -1269.69677734375, -1243.016357421875, -1216.3359375, -1189.655517578125, -1162.9749755859375, -1136.2945556640625, -1109.6141357421875, -1082.93359375, -1056.253173828125, -1029.57275390625, -1002.8922119140625, -976.2117309570312, -949.5313110351562, -922.850830078125, -896.1703491210938, -869.4898681640625, -842.8094482421875, -816.1289672851562, -789.4484252929688, -762.7679443359375, -736.0875244140625, -709.4070434570312, -682.7265625, -656.046142578125, -629.3656616210938, -602.6851806640625, -576.0047607421875, -549.3242797851562, -522.6438598632812, -495.96337890625, -469.28289794921875, -442.6024475097656, -415.9219970703125, -389.24151611328125, -362.56103515625, -335.8805847167969, -309.2001037597656, -282.5196533203125, -255.8391876220703, -229.15872192382812, -202.478271484375, -175.7978057861328, -149.11734008789062, -122.43687438964844, -95.75641632080078, -69.07595825195312, -42.39549255371094, -15.71502685546875, 10.965423583984375, 37.64588928222656, 64.32635498046875]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 5.0, 8.0, 8.0, 8.0, 17.0, 16.0, 18.0, 15.0, 25.0, 23.0, 30.0, 24.0, 33.0, 40.0, 33.0, 47.0, 42.0, 62.0, 42.0, 51.0, 36.0, 45.0, 45.0, 55.0, 22.0, 39.0, 28.0, 35.0, 23.0, 20.0, 20.0, 20.0, 10.0, 8.0, 15.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-367.45843505859375, -354.465576171875, -341.47271728515625, -328.4798278808594, -315.4869689941406, -302.4941101074219, -289.501220703125, -276.50836181640625, -263.5155029296875, -250.52264404296875, -237.52976989746094, -224.53689575195312, -211.54403686523438, -198.55117797851562, -185.5583038330078, -172.5654296875, -159.57257080078125, -146.5797119140625, -133.5868377685547, -120.5939712524414, -107.60110473632812, -94.60823822021484, -81.61537170410156, -68.62250518798828, -55.629638671875, -42.63677215576172, -29.643905639648438, -16.651039123535156, -3.658172607421875, 9.334693908691406, 22.327560424804688, 35.32042694091797, 48.31329345703125, 61.30615997314453, 74.29902648925781, 87.2918930053711, 100.28475952148438, 113.27762603759766, 126.27049255371094, 139.26336669921875, 152.2562255859375, 165.24908447265625, 178.24195861816406, 191.23483276367188, 204.22769165039062, 217.22055053710938, 230.2134246826172, 243.206298828125, 256.19915771484375, 269.1920166015625, 282.18487548828125, 295.1777648925781, 308.1706237792969, 321.1634826660156, 334.1563720703125, 347.14923095703125, 360.14208984375, 373.13494873046875, 386.1278076171875, 399.1206970214844, 412.1135559082031, 425.1064147949219, 438.09930419921875, 451.0921630859375, 464.08502197265625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 3.0, 5.0, 8.0, 7.0, 13.0, 9.0, 12.0, 17.0, 20.0, 18.0, 28.0, 24.0, 42.0, 38.0, 46.0, 52.0, 42.0, 53.0, 39.0, 41.0, 50.0, 48.0, 44.0, 35.0, 23.0, 50.0, 35.0, 26.0, 21.0, 22.0, 21.0, 19.0, 10.0, 6.0, 8.0, 14.0, 14.0, 8.0, 3.0, 3.0, 6.0, 2.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-44.84375, -43.419921875, -41.99609375, -40.572265625, -39.1484375, -37.724609375, -36.30078125, -34.876953125, -33.453125, -32.029296875, -30.60546875, -29.181640625, -27.7578125, -26.333984375, -24.91015625, -23.486328125, -22.0625, -20.638671875, -19.21484375, -17.791015625, -16.3671875, -14.943359375, -13.51953125, -12.095703125, -10.671875, -9.248046875, -7.82421875, -6.400390625, -4.9765625, -3.552734375, -2.12890625, -0.705078125, 0.71875, 2.142578125, 3.56640625, 4.990234375, 6.4140625, 7.837890625, 9.26171875, 10.685546875, 12.109375, 13.533203125, 14.95703125, 16.380859375, 17.8046875, 19.228515625, 20.65234375, 22.076171875, 23.5, 24.923828125, 26.34765625, 27.771484375, 29.1953125, 30.619140625, 32.04296875, 33.466796875, 34.890625, 36.314453125, 37.73828125, 39.162109375, 40.5859375, 42.009765625, 43.43359375, 44.857421875, 46.28125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 12.0, 18.0, 27.0, 51.0, 76.0, 142.0, 244.0, 432.0, 794.0, 1621.0, 3413.0, 7902.0, 22609.0, 533535.0, 3550957.0, 49267.0, 12948.0, 5300.0, 2422.0, 1107.0, 618.0, 302.0, 177.0, 103.0, 50.0, 39.0, 31.0, 13.0, 10.0, 13.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-192.875, -186.494140625, -180.11328125, -173.732421875, -167.3515625, -160.970703125, -154.58984375, -148.208984375, -141.828125, -135.447265625, -129.06640625, -122.685546875, -116.3046875, -109.923828125, -103.54296875, -97.162109375, -90.78125, -84.400390625, -78.01953125, -71.638671875, -65.2578125, -58.876953125, -52.49609375, -46.115234375, -39.734375, -33.353515625, -26.97265625, -20.591796875, -14.2109375, -7.830078125, -1.44921875, 4.931640625, 11.3125, 17.693359375, 24.07421875, 30.455078125, 36.8359375, 43.216796875, 49.59765625, 55.978515625, 62.359375, 68.740234375, 75.12109375, 81.501953125, 87.8828125, 94.263671875, 100.64453125, 107.025390625, 113.40625, 119.787109375, 126.16796875, 132.548828125, 138.9296875, 145.310546875, 151.69140625, 158.072265625, 164.453125, 170.833984375, 177.21484375, 183.595703125, 189.9765625, 196.357421875, 202.73828125, 209.119140625, 215.5]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 9.0, 10.0, 7.0, 11.0, 16.0, 15.0, 25.0, 29.0, 47.0, 85.0, 131.0, 297.0, 581.0, 1059.0, 844.0, 393.0, 194.0, 101.0, 68.0, 36.0, 29.0, 17.0, 18.0, 12.0, 7.0, 4.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-178.625, -174.0166015625, -169.408203125, -164.7998046875, -160.19140625, -155.5830078125, -150.974609375, -146.3662109375, -141.7578125, -137.1494140625, -132.541015625, -127.9326171875, -123.32421875, -118.7158203125, -114.107421875, -109.4990234375, -104.890625, -100.2822265625, -95.673828125, -91.0654296875, -86.45703125, -81.8486328125, -77.240234375, -72.6318359375, -68.0234375, -63.4150390625, -58.806640625, -54.1982421875, -49.58984375, -44.9814453125, -40.373046875, -35.7646484375, -31.15625, -26.5478515625, -21.939453125, -17.3310546875, -12.72265625, -8.1142578125, -3.505859375, 1.1025390625, 5.7109375, 10.3193359375, 14.927734375, 19.5361328125, 24.14453125, 28.7529296875, 33.361328125, 37.9697265625, 42.578125, 47.1865234375, 51.794921875, 56.4033203125, 61.01171875, 65.6201171875, 70.228515625, 74.8369140625, 79.4453125, 84.0537109375, 88.662109375, 93.2705078125, 97.87890625, 102.4873046875, 107.095703125, 111.7041015625, 116.3125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 5.0, 13.0, 17.0, 22.0, 21.0, 34.0, 50.0, 75.0, 115.0, 214.0, 447.0, 983.0, 2125.0, 5760.0, 18489.0, 94836.0, 3918236.0, 121286.0, 20627.0, 6464.0, 2351.0, 917.0, 498.0, 235.0, 156.0, 83.0, 53.0, 49.0, 31.0, 24.0, 12.0, 8.0, 7.0, 6.0, 5.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-292.75, -281.72265625, -270.6953125, -259.66796875, -248.640625, -237.61328125, -226.5859375, -215.55859375, -204.53125, -193.50390625, -182.4765625, -171.44921875, -160.421875, -149.39453125, -138.3671875, -127.33984375, -116.3125, -105.28515625, -94.2578125, -83.23046875, -72.203125, -61.17578125, -50.1484375, -39.12109375, -28.09375, -17.06640625, -6.0390625, 4.98828125, 16.015625, 27.04296875, 38.0703125, 49.09765625, 60.125, 71.15234375, 82.1796875, 93.20703125, 104.234375, 115.26171875, 126.2890625, 137.31640625, 148.34375, 159.37109375, 170.3984375, 181.42578125, 192.453125, 203.48046875, 214.5078125, 225.53515625, 236.5625, 247.58984375, 258.6171875, 269.64453125, 280.671875, 291.69921875, 302.7265625, 313.75390625, 324.78125, 335.80859375, 346.8359375, 357.86328125, 368.890625, 379.91796875, 390.9453125, 401.97265625, 413.0]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 13.0, 14.0, 29.0, 34.0, 42.0, 86.0, 146.0, 219.0, 188.0, 91.0, 60.0, 25.0, 18.0, 9.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-602.813232421875, -578.3146362304688, -553.8159790039062, -529.3173828125, -504.8187255859375, -480.32012939453125, -455.8215026855469, -431.3228759765625, -406.8242492675781, -382.32562255859375, -357.8269958496094, -333.328369140625, -308.82977294921875, -284.33111572265625, -259.83251953125, -235.33389282226562, -210.83526611328125, -186.33663940429688, -161.8380126953125, -137.3394012451172, -112.84077453613281, -88.34214782714844, -63.843536376953125, -39.34490966796875, -14.846282958984375, 9.652339935302734, 34.150962829589844, 58.64958190917969, 83.14820861816406, 107.64683532714844, 132.14544677734375, 156.64407348632812, 181.1427001953125, 205.64132690429688, 230.13995361328125, 254.63856506347656, 279.13720703125, 303.63580322265625, 328.1344299316406, 352.633056640625, 377.1316833496094, 401.63031005859375, 426.1289367675781, 450.6275634765625, 475.12615966796875, 499.62481689453125, 524.1234130859375, 548.6220703125, 573.1206665039062, 597.6192626953125, 622.117919921875, 646.6165161132812, 671.1151733398438, 695.61376953125, 720.1124267578125, 744.6110229492188, 769.109619140625, 793.6082153320312, 818.1068725585938, 842.60546875, 867.1041259765625, 891.6027221679688, 916.101318359375, 940.5999755859375, 965.0986328125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 14.0, 12.0, 15.0, 15.0, 17.0, 28.0, 14.0, 22.0, 45.0, 37.0, 31.0, 33.0, 51.0, 52.0, 34.0, 46.0, 40.0, 30.0, 44.0, 52.0, 41.0, 37.0, 46.0, 38.0, 40.0, 31.0, 30.0, 19.0, 24.0, 12.0, 8.0, 11.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-343.0869445800781, -331.10101318359375, -319.1151123046875, -307.1291809082031, -295.14324951171875, -283.1573181152344, -271.17138671875, -259.18548583984375, -247.19955444335938, -235.213623046875, -223.2277069091797, -211.24179077148438, -199.255859375, -187.26992797851562, -175.2840118408203, -163.298095703125, -151.31216430664062, -139.32623291015625, -127.34031677246094, -115.3543930053711, -103.36846923828125, -91.3825454711914, -79.39662170410156, -67.41069793701172, -55.424774169921875, -43.43885040283203, -31.452926635742188, -19.467002868652344, -7.4810791015625, 4.504844665527344, 16.490768432617188, 28.47669219970703, 40.462615966796875, 52.44853973388672, 64.43446350097656, 76.4203872680664, 88.40631103515625, 100.3922348022461, 112.37815856933594, 124.36408233642578, 136.35000610351562, 148.3359375, 160.3218536376953, 172.30776977539062, 184.293701171875, 196.27963256835938, 208.2655487060547, 220.25146484375, 232.23739624023438, 244.22332763671875, 256.209228515625, 268.1951599121094, 280.18109130859375, 292.1670227050781, 304.1529541015625, 316.13885498046875, 328.1247863769531, 340.1107177734375, 352.09661865234375, 364.0825500488281, 376.0684814453125, 388.0544128417969, 400.04034423828125, 412.0262451171875, 424.0121765136719]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 11.0, 14.0, 21.0, 15.0, 21.0, 27.0, 16.0, 28.0, 34.0, 35.0, 35.0, 58.0, 39.0, 55.0, 45.0, 50.0, 61.0, 46.0, 42.0, 36.0, 43.0, 40.0, 27.0, 26.0, 23.0, 23.0, 16.0, 13.0, 14.0, 10.0, 10.0, 12.0, 9.0, 7.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-46.53125, -45.04833984375, -43.5654296875, -42.08251953125, -40.599609375, -39.11669921875, -37.6337890625, -36.15087890625, -34.66796875, -33.18505859375, -31.7021484375, -30.21923828125, -28.736328125, -27.25341796875, -25.7705078125, -24.28759765625, -22.8046875, -21.32177734375, -19.8388671875, -18.35595703125, -16.873046875, -15.39013671875, -13.9072265625, -12.42431640625, -10.94140625, -9.45849609375, -7.9755859375, -6.49267578125, -5.009765625, -3.52685546875, -2.0439453125, -0.56103515625, 0.921875, 2.40478515625, 3.8876953125, 5.37060546875, 6.853515625, 8.33642578125, 9.8193359375, 11.30224609375, 12.78515625, 14.26806640625, 15.7509765625, 17.23388671875, 18.716796875, 20.19970703125, 21.6826171875, 23.16552734375, 24.6484375, 26.13134765625, 27.6142578125, 29.09716796875, 30.580078125, 32.06298828125, 33.5458984375, 35.02880859375, 36.51171875, 37.99462890625, 39.4775390625, 40.96044921875, 42.443359375, 43.92626953125, 45.4091796875, 46.89208984375, 48.375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 3.0, 7.0, 12.0, 14.0, 12.0, 20.0, 37.0, 51.0, 63.0, 83.0, 119.0, 158.0, 211.0, 292.0, 434.0, 609.0, 861.0, 1400.0, 2559.0, 5935.0, 20107.0, 103970.0, 708431.0, 160341.0, 27381.0, 7521.0, 3071.0, 1634.0, 967.0, 639.0, 450.0, 305.0, 238.0, 157.0, 144.0, 79.0, 65.0, 47.0, 33.0, 26.0, 24.0, 16.0, 10.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-20.03125, -19.452392578125, -18.87353515625, -18.294677734375, -17.7158203125, -17.136962890625, -16.55810546875, -15.979248046875, -15.400390625, -14.821533203125, -14.24267578125, -13.663818359375, -13.0849609375, -12.506103515625, -11.92724609375, -11.348388671875, -10.76953125, -10.190673828125, -9.61181640625, -9.032958984375, -8.4541015625, -7.875244140625, -7.29638671875, -6.717529296875, -6.138671875, -5.559814453125, -4.98095703125, -4.402099609375, -3.8232421875, -3.244384765625, -2.66552734375, -2.086669921875, -1.5078125, -0.928955078125, -0.35009765625, 0.228759765625, 0.8076171875, 1.386474609375, 1.96533203125, 2.544189453125, 3.123046875, 3.701904296875, 4.28076171875, 4.859619140625, 5.4384765625, 6.017333984375, 6.59619140625, 7.175048828125, 7.75390625, 8.332763671875, 8.91162109375, 9.490478515625, 10.0693359375, 10.648193359375, 11.22705078125, 11.805908203125, 12.384765625, 12.963623046875, 13.54248046875, 14.121337890625, 14.7001953125, 15.279052734375, 15.85791015625, 16.436767578125, 17.015625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 4.0, 7.0, 8.0, 6.0, 10.0, 10.0, 16.0, 18.0, 30.0, 13.0, 19.0, 34.0, 25.0, 26.0, 25.0, 32.0, 29.0, 35.0, 54.0, 47.0, 37.0, 1055.0, 42.0, 45.0, 45.0, 33.0, 42.0, 28.0, 31.0, 36.0, 25.0, 15.0, 19.0, 14.0, 17.0, 19.0, 9.0, 11.0, 13.0, 9.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.796875, -23.91943359375, -23.0419921875, -22.16455078125, -21.287109375, -20.40966796875, -19.5322265625, -18.65478515625, -17.77734375, -16.89990234375, -16.0224609375, -15.14501953125, -14.267578125, -13.39013671875, -12.5126953125, -11.63525390625, -10.7578125, -9.88037109375, -9.0029296875, -8.12548828125, -7.248046875, -6.37060546875, -5.4931640625, -4.61572265625, -3.73828125, -2.86083984375, -1.9833984375, -1.10595703125, -0.228515625, 0.64892578125, 1.5263671875, 2.40380859375, 3.28125, 4.15869140625, 5.0361328125, 5.91357421875, 6.791015625, 7.66845703125, 8.5458984375, 9.42333984375, 10.30078125, 11.17822265625, 12.0556640625, 12.93310546875, 13.810546875, 14.68798828125, 15.5654296875, 16.44287109375, 17.3203125, 18.19775390625, 19.0751953125, 19.95263671875, 20.830078125, 21.70751953125, 22.5849609375, 23.46240234375, 24.33984375, 25.21728515625, 26.0947265625, 26.97216796875, 27.849609375, 28.72705078125, 29.6044921875, 30.48193359375, 31.359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 20.0, 29.0, 29.0, 44.0, 60.0, 58.0, 102.0, 142.0, 179.0, 267.0, 378.0, 625.0, 940.0, 1476.0, 2473.0, 4506.0, 8457.0, 17865.0, 40836.0, 103329.0, 397564.0, 1297408.0, 128425.0, 48629.0, 20763.0, 9863.0, 5054.0, 2774.0, 1648.0, 1044.0, 617.0, 493.0, 297.0, 223.0, 147.0, 85.0, 81.0, 48.0, 39.0, 27.0, 17.0, 12.0, 13.0, 12.0, 2.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.53515625, -4.38934326171875, -4.2435302734375, -4.09771728515625, -3.951904296875, -3.80609130859375, -3.6602783203125, -3.51446533203125, -3.36865234375, -3.22283935546875, -3.0770263671875, -2.93121337890625, -2.785400390625, -2.63958740234375, -2.4937744140625, -2.34796142578125, -2.2021484375, -2.05633544921875, -1.9105224609375, -1.76470947265625, -1.618896484375, -1.47308349609375, -1.3272705078125, -1.18145751953125, -1.03564453125, -0.88983154296875, -0.7440185546875, -0.59820556640625, -0.452392578125, -0.30657958984375, -0.1607666015625, -0.01495361328125, 0.130859375, 0.27667236328125, 0.4224853515625, 0.56829833984375, 0.714111328125, 0.85992431640625, 1.0057373046875, 1.15155029296875, 1.29736328125, 1.44317626953125, 1.5889892578125, 1.73480224609375, 1.880615234375, 2.02642822265625, 2.1722412109375, 2.31805419921875, 2.4638671875, 2.60968017578125, 2.7554931640625, 2.90130615234375, 3.047119140625, 3.19293212890625, 3.3387451171875, 3.48455810546875, 3.63037109375, 3.77618408203125, 3.9219970703125, 4.06781005859375, 4.213623046875, 4.35943603515625, 4.5052490234375, 4.65106201171875, 4.796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 2.0, 7.0, 6.0, 10.0, 9.0, 17.0, 38.0, 43.0, 39.0, 89.0, 225.0, 212.0, 80.0, 51.0, 30.0, 26.0, 17.0, 19.0, 12.0, 8.0, 11.0, 3.0, 7.0, 2.0, 2.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.9453125, -0.9182662963867188, -0.8912200927734375, -0.8641738891601562, -0.837127685546875, -0.8100814819335938, -0.7830352783203125, -0.7559890747070312, -0.72894287109375, -0.7018966674804688, -0.6748504638671875, -0.6478042602539062, -0.620758056640625, -0.5937118530273438, -0.5666656494140625, -0.5396194458007812, -0.5125732421875, -0.48552703857421875, -0.4584808349609375, -0.43143463134765625, -0.404388427734375, -0.37734222412109375, -0.3502960205078125, -0.32324981689453125, -0.29620361328125, -0.26915740966796875, -0.2421112060546875, -0.21506500244140625, -0.188018798828125, -0.16097259521484375, -0.1339263916015625, -0.10688018798828125, -0.079833984375, -0.05278778076171875, -0.0257415771484375, 0.00130462646484375, 0.028350830078125, 0.05539703369140625, 0.0824432373046875, 0.10948944091796875, 0.13653564453125, 0.16358184814453125, 0.1906280517578125, 0.21767425537109375, 0.244720458984375, 0.27176666259765625, 0.2988128662109375, 0.32585906982421875, 0.3529052734375, 0.37995147705078125, 0.4069976806640625, 0.43404388427734375, 0.461090087890625, 0.48813629150390625, 0.5151824951171875, 0.5422286987304688, 0.56927490234375, 0.5963211059570312, 0.6233673095703125, 0.6504135131835938, 0.677459716796875, 0.7045059204101562, 0.7315521240234375, 0.7585983276367188, 0.78564453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 18.0, 24.0, 23.0, 54.0, 73.0, 157.0, 21887.0, 1025849.0, 157.0, 61.0, 65.0, 38.0, 20.0, 13.0, 11.0, 4.0, 5.0, 6.0, 4.0, 5.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.265625, -24.3955078125, -23.525390625, -22.6552734375, -21.78515625, -20.9150390625, -20.044921875, -19.1748046875, -18.3046875, -17.4345703125, -16.564453125, -15.6943359375, -14.82421875, -13.9541015625, -13.083984375, -12.2138671875, -11.34375, -10.4736328125, -9.603515625, -8.7333984375, -7.86328125, -6.9931640625, -6.123046875, -5.2529296875, -4.3828125, -3.5126953125, -2.642578125, -1.7724609375, -0.90234375, -0.0322265625, 0.837890625, 1.7080078125, 2.578125, 3.4482421875, 4.318359375, 5.1884765625, 6.05859375, 6.9287109375, 7.798828125, 8.6689453125, 9.5390625, 10.4091796875, 11.279296875, 12.1494140625, 13.01953125, 13.8896484375, 14.759765625, 15.6298828125, 16.5, 17.3701171875, 18.240234375, 19.1103515625, 19.98046875, 20.8505859375, 21.720703125, 22.5908203125, 23.4609375, 24.3310546875, 25.201171875, 26.0712890625, 26.94140625, 27.8115234375, 28.681640625, 29.5517578125, 30.421875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 613.0, 405.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7463743686676025, -0.3703273832798004, 0.005719602108001709, 0.38176655769348145, 0.757813572883606, 1.1338605880737305, 1.5099074840545654, 1.8859546184539795, 2.2620015144348145, 2.6380484104156494, 3.0140955448150635, 3.3901424407958984, 3.7661895751953125, 4.142236709594727, 4.518283367156982, 4.8943305015563965, 5.270377159118652, 5.646424293518066, 6.022470951080322, 6.398518085479736, 6.77456521987915, 7.150611877441406, 7.52665901184082, 7.902706146240234, 8.278753280639648, 8.654800415039062, 9.030847549438477, 9.40689468383789, 9.782940864562988, 10.158987998962402, 10.535035133361816, 10.91108226776123, 11.287129402160645, 11.663176536560059, 12.039223670959473, 12.41526985168457, 12.791316986083984, 13.167364120483398, 13.543411254882812, 13.919458389282227, 14.29550552368164, 14.671552658081055, 15.047599792480469, 15.423646926879883, 15.79969310760498, 16.17574119567871, 16.551788330078125, 16.927833557128906, 17.30388069152832, 17.679927825927734, 18.05597496032715, 18.432022094726562, 18.808069229125977, 19.18411636352539, 19.560161590576172, 19.93621063232422, 20.312257766723633, 20.688304901123047, 21.06435203552246, 21.440399169921875, 21.81644630432129, 22.192493438720703, 22.568538665771484, 22.94458770751953, 23.320632934570312]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 8.0, 8.0, 13.0, 15.0, 19.0, 17.0, 28.0, 19.0, 19.0, 26.0, 27.0, 38.0, 41.0, 34.0, 28.0, 47.0, 29.0, 33.0, 31.0, 47.0, 50.0, 49.0, 33.0, 38.0, 20.0, 37.0, 31.0, 26.0, 28.0, 12.0, 18.0, 21.0, 17.0, 16.0, 13.0, 11.0, 10.0, 7.0, 5.0, 3.0, 8.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2013076543807983, -1.1610857248306274, -1.120863914489746, -1.0806419849395752, -1.0404200553894043, -1.0001981258392334, -0.9599762558937073, -0.9197543859481812, -0.8795324563980103, -0.8393105268478394, -0.7990886569023132, -0.7588667869567871, -0.7186448574066162, -0.6784229278564453, -0.6382010579109192, -0.5979791879653931, -0.5577572584152222, -0.5175353288650513, -0.47731345891952515, -0.43709155917167664, -0.3968696594238281, -0.3566477596759796, -0.3164258599281311, -0.2762039601802826, -0.23598206043243408, -0.19576016068458557, -0.15553826093673706, -0.11531636118888855, -0.07509446144104004, -0.03487256169319153, 0.005349338054656982, 0.04557123780250549, 0.08579325675964355, 0.12601515650749207, 0.16623705625534058, 0.2064589560031891, 0.2466808557510376, 0.2869027554988861, 0.3271246552467346, 0.36734655499458313, 0.40756845474243164, 0.44779035449028015, 0.48801225423812866, 0.5282341241836548, 0.5684560537338257, 0.6086779832839966, 0.6488998532295227, 0.6891217231750488, 0.7293436527252197, 0.7695655822753906, 0.8097874522209167, 0.8500093221664429, 0.8902312517166138, 0.9304531812667847, 0.9706750512123108, 1.010896921157837, 1.0511188507080078, 1.0913407802581787, 1.1315627098083496, 1.171784520149231, 1.2120064496994019, 1.2522283792495728, 1.292450189590454, 1.332672119140625, 1.372894048690796]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 10.0, 15.0, 21.0, 15.0, 21.0, 27.0, 16.0, 28.0, 34.0, 35.0, 35.0, 58.0, 39.0, 55.0, 45.0, 50.0, 61.0, 46.0, 42.0, 36.0, 43.0, 40.0, 27.0, 26.0, 23.0, 23.0, 16.0, 13.0, 14.0, 10.0, 10.0, 12.0, 9.0, 7.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-46.53125, -45.04833984375, -43.5654296875, -42.08251953125, -40.599609375, -39.11669921875, -37.6337890625, -36.15087890625, -34.66796875, -33.18505859375, -31.7021484375, -30.21923828125, -28.736328125, -27.25341796875, -25.7705078125, -24.28759765625, -22.8046875, -21.32177734375, -19.8388671875, -18.35595703125, -16.873046875, -15.39013671875, -13.9072265625, -12.42431640625, -10.94140625, -9.45849609375, -7.9755859375, -6.49267578125, -5.009765625, -3.52685546875, -2.0439453125, -0.56103515625, 0.921875, 2.40478515625, 3.8876953125, 5.37060546875, 6.853515625, 8.33642578125, 9.8193359375, 11.30224609375, 12.78515625, 14.26806640625, 15.7509765625, 17.23388671875, 18.716796875, 20.19970703125, 21.6826171875, 23.16552734375, 24.6484375, 26.13134765625, 27.6142578125, 29.09716796875, 30.580078125, 32.06298828125, 33.5458984375, 35.02880859375, 36.51171875, 37.99462890625, 39.4775390625, 40.96044921875, 42.443359375, 43.92626953125, 45.4091796875, 46.89208984375, 48.375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 10.0, 9.0, 6.0, 16.0, 29.0, 30.0, 55.0, 41.0, 92.0, 119.0, 183.0, 275.0, 431.0, 654.0, 1131.0, 1862.0, 3487.0, 6686.0, 14390.0, 47747.0, 875243.0, 63597.0, 16082.0, 7277.0, 3760.0, 2076.0, 1167.0, 695.0, 478.0, 276.0, 194.0, 141.0, 97.0, 55.0, 42.0, 28.0, 20.0, 14.0, 13.0, 15.0, 11.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-113.4375, -110.0576171875, -106.677734375, -103.2978515625, -99.91796875, -96.5380859375, -93.158203125, -89.7783203125, -86.3984375, -83.0185546875, -79.638671875, -76.2587890625, -72.87890625, -69.4990234375, -66.119140625, -62.7392578125, -59.359375, -55.9794921875, -52.599609375, -49.2197265625, -45.83984375, -42.4599609375, -39.080078125, -35.7001953125, -32.3203125, -28.9404296875, -25.560546875, -22.1806640625, -18.80078125, -15.4208984375, -12.041015625, -8.6611328125, -5.28125, -1.9013671875, 1.478515625, 4.8583984375, 8.23828125, 11.6181640625, 14.998046875, 18.3779296875, 21.7578125, 25.1376953125, 28.517578125, 31.8974609375, 35.27734375, 38.6572265625, 42.037109375, 45.4169921875, 48.796875, 52.1767578125, 55.556640625, 58.9365234375, 62.31640625, 65.6962890625, 69.076171875, 72.4560546875, 75.8359375, 79.2158203125, 82.595703125, 85.9755859375, 89.35546875, 92.7353515625, 96.115234375, 99.4951171875, 102.875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 1.0, 8.0, 4.0, 4.0, 8.0, 12.0, 15.0, 14.0, 25.0, 20.0, 28.0, 23.0, 39.0, 28.0, 48.0, 43.0, 55.0, 43.0, 69.0, 96.0, 1815.0, 137.0, 66.0, 66.0, 47.0, 36.0, 38.0, 43.0, 24.0, 30.0, 21.0, 23.0, 17.0, 14.0, 13.0, 12.0, 10.0, 17.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-154.75, -150.166015625, -145.58203125, -140.998046875, -136.4140625, -131.830078125, -127.24609375, -122.662109375, -118.078125, -113.494140625, -108.91015625, -104.326171875, -99.7421875, -95.158203125, -90.57421875, -85.990234375, -81.40625, -76.822265625, -72.23828125, -67.654296875, -63.0703125, -58.486328125, -53.90234375, -49.318359375, -44.734375, -40.150390625, -35.56640625, -30.982421875, -26.3984375, -21.814453125, -17.23046875, -12.646484375, -8.0625, -3.478515625, 1.10546875, 5.689453125, 10.2734375, 14.857421875, 19.44140625, 24.025390625, 28.609375, 33.193359375, 37.77734375, 42.361328125, 46.9453125, 51.529296875, 56.11328125, 60.697265625, 65.28125, 69.865234375, 74.44921875, 79.033203125, 83.6171875, 88.201171875, 92.78515625, 97.369140625, 101.953125, 106.537109375, 111.12109375, 115.705078125, 120.2890625, 124.873046875, 129.45703125, 134.041015625, 138.625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 8.0, 12.0, 5.0, 15.0, 19.0, 28.0, 33.0, 43.0, 68.0, 108.0, 227.0, 629.0, 2419.0, 12444.0, 202910.0, 2902310.0, 19234.0, 3588.0, 897.0, 297.0, 124.0, 83.0, 47.0, 36.0, 26.0, 16.0, 12.0, 15.0, 11.0, 5.0, 5.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-447.5, -433.56640625, -419.6328125, -405.69921875, -391.765625, -377.83203125, -363.8984375, -349.96484375, -336.03125, -322.09765625, -308.1640625, -294.23046875, -280.296875, -266.36328125, -252.4296875, -238.49609375, -224.5625, -210.62890625, -196.6953125, -182.76171875, -168.828125, -154.89453125, -140.9609375, -127.02734375, -113.09375, -99.16015625, -85.2265625, -71.29296875, -57.359375, -43.42578125, -29.4921875, -15.55859375, -1.625, 12.30859375, 26.2421875, 40.17578125, 54.109375, 68.04296875, 81.9765625, 95.91015625, 109.84375, 123.77734375, 137.7109375, 151.64453125, 165.578125, 179.51171875, 193.4453125, 207.37890625, 221.3125, 235.24609375, 249.1796875, 263.11328125, 277.046875, 290.98046875, 304.9140625, 318.84765625, 332.78125, 346.71484375, 360.6484375, 374.58203125, 388.515625, 402.44921875, 416.3828125, 430.31640625, 444.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 17.0, 88.0, 455.0, 360.0, 76.0, 17.0, 4.0], "bins": [-2734.4541015625, -2688.796875, -2643.139404296875, -2597.482177734375, -2551.824951171875, -2506.16748046875, -2460.51025390625, -2414.85302734375, -2369.195556640625, -2323.538330078125, -2277.880859375, -2232.2236328125, -2186.56640625, -2140.908935546875, -2095.251708984375, -2049.594482421875, -2003.9371337890625, -1958.27978515625, -1912.62255859375, -1866.9652099609375, -1821.307861328125, -1775.650634765625, -1729.9932861328125, -1684.3359375, -1638.6787109375, -1593.0213623046875, -1547.3641357421875, -1501.706787109375, -1456.0494384765625, -1410.39208984375, -1364.73486328125, -1319.0775146484375, -1273.420166015625, -1227.7628173828125, -1182.1055908203125, -1136.4482421875, -1090.7908935546875, -1045.133544921875, -999.476318359375, -953.8189697265625, -908.1616821289062, -862.50439453125, -816.8470458984375, -771.1897583007812, -725.532470703125, -679.8751220703125, -634.2178344726562, -588.560546875, -542.9031982421875, -497.2458801269531, -451.58856201171875, -405.9312744140625, -360.2739562988281, -314.61663818359375, -268.9593505859375, -223.30203247070312, -177.6447296142578, -131.9874267578125, -86.33010864257812, -40.67280578613281, 4.9845123291015625, 50.64183044433594, 96.29911804199219, 141.95643615722656, 187.61375427246094]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 7.0, 3.0, 8.0, 10.0, 13.0, 11.0, 10.0, 19.0, 24.0, 24.0, 34.0, 29.0, 37.0, 43.0, 35.0, 43.0, 55.0, 58.0, 46.0, 55.0, 44.0, 47.0, 41.0, 37.0, 34.0, 37.0, 37.0, 33.0, 29.0, 21.0, 17.0, 12.0, 6.0, 12.0, 13.0, 4.0, 6.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-533.1029663085938, -517.2779541015625, -501.452880859375, -485.62786865234375, -469.8028259277344, -453.977783203125, -438.1527404785156, -422.32769775390625, -406.502685546875, -390.6776428222656, -374.85260009765625, -359.027587890625, -343.2025451660156, -327.37750244140625, -311.5524597167969, -295.7274169921875, -279.9023742675781, -264.07733154296875, -248.25230407714844, -232.42726135253906, -216.60223388671875, -200.77719116210938, -184.9521484375, -169.12710571289062, -153.3020782470703, -137.47703552246094, -121.65200805664062, -105.82696533203125, -90.0019302368164, -74.17689514160156, -58.35185241699219, -42.526817321777344, -26.701751708984375, -10.876714706420898, 4.948322296142578, 20.773361206054688, 36.59839630126953, 52.423431396484375, 68.24847412109375, 84.0735092163086, 99.89854431152344, 115.72357940673828, 131.54861450195312, 147.3736572265625, 163.19869995117188, 179.0237274169922, 194.84877014160156, 210.67379760742188, 226.49884033203125, 242.32388305664062, 258.14892578125, 273.97393798828125, 289.7989807128906, 305.6240234375, 321.4490661621094, 337.27410888671875, 353.09912109375, 368.9241638183594, 384.74920654296875, 400.57421875, 416.3992614746094, 432.22430419921875, 448.0493469238281, 463.8743896484375, 479.6994323730469]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 8.0, 5.0, 7.0, 12.0, 16.0, 16.0, 18.0, 18.0, 21.0, 14.0, 21.0, 27.0, 42.0, 46.0, 41.0, 43.0, 40.0, 57.0, 48.0, 56.0, 52.0, 39.0, 47.0, 39.0, 33.0, 24.0, 26.0, 29.0, 28.0, 20.0, 22.0, 13.0, 12.0, 10.0, 10.0, 7.0, 5.0, 9.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.15625, -46.59716796875, -45.0380859375, -43.47900390625, -41.919921875, -40.36083984375, -38.8017578125, -37.24267578125, -35.68359375, -34.12451171875, -32.5654296875, -31.00634765625, -29.447265625, -27.88818359375, -26.3291015625, -24.77001953125, -23.2109375, -21.65185546875, -20.0927734375, -18.53369140625, -16.974609375, -15.41552734375, -13.8564453125, -12.29736328125, -10.73828125, -9.17919921875, -7.6201171875, -6.06103515625, -4.501953125, -2.94287109375, -1.3837890625, 0.17529296875, 1.734375, 3.29345703125, 4.8525390625, 6.41162109375, 7.970703125, 9.52978515625, 11.0888671875, 12.64794921875, 14.20703125, 15.76611328125, 17.3251953125, 18.88427734375, 20.443359375, 22.00244140625, 23.5615234375, 25.12060546875, 26.6796875, 28.23876953125, 29.7978515625, 31.35693359375, 32.916015625, 34.47509765625, 36.0341796875, 37.59326171875, 39.15234375, 40.71142578125, 42.2705078125, 43.82958984375, 45.388671875, 46.94775390625, 48.5068359375, 50.06591796875, 51.625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 10.0, 13.0, 23.0, 19.0, 43.0, 56.0, 78.0, 92.0, 175.0, 281.0, 431.0, 687.0, 1123.0, 1962.0, 3420.0, 6595.0, 14468.0, 51786.0, 1587943.0, 2426542.0, 66099.0, 15745.0, 7358.0, 3899.0, 2123.0, 1204.0, 772.0, 455.0, 296.0, 185.0, 114.0, 84.0, 57.0, 30.0, 25.0, 25.0, 6.0, 11.0, 14.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-156.625, -152.025390625, -147.42578125, -142.826171875, -138.2265625, -133.626953125, -129.02734375, -124.427734375, -119.828125, -115.228515625, -110.62890625, -106.029296875, -101.4296875, -96.830078125, -92.23046875, -87.630859375, -83.03125, -78.431640625, -73.83203125, -69.232421875, -64.6328125, -60.033203125, -55.43359375, -50.833984375, -46.234375, -41.634765625, -37.03515625, -32.435546875, -27.8359375, -23.236328125, -18.63671875, -14.037109375, -9.4375, -4.837890625, -0.23828125, 4.361328125, 8.9609375, 13.560546875, 18.16015625, 22.759765625, 27.359375, 31.958984375, 36.55859375, 41.158203125, 45.7578125, 50.357421875, 54.95703125, 59.556640625, 64.15625, 68.755859375, 73.35546875, 77.955078125, 82.5546875, 87.154296875, 91.75390625, 96.353515625, 100.953125, 105.552734375, 110.15234375, 114.751953125, 119.3515625, 123.951171875, 128.55078125, 133.150390625, 137.75]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 11.0, 16.0, 20.0, 34.0, 36.0, 71.0, 140.0, 261.0, 704.0, 1349.0, 808.0, 284.0, 137.0, 80.0, 40.0, 29.0, 19.0, 6.0, 9.0, 6.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-259.25, -253.16015625, -247.0703125, -240.98046875, -234.890625, -228.80078125, -222.7109375, -216.62109375, -210.53125, -204.44140625, -198.3515625, -192.26171875, -186.171875, -180.08203125, -173.9921875, -167.90234375, -161.8125, -155.72265625, -149.6328125, -143.54296875, -137.453125, -131.36328125, -125.2734375, -119.18359375, -113.09375, -107.00390625, -100.9140625, -94.82421875, -88.734375, -82.64453125, -76.5546875, -70.46484375, -64.375, -58.28515625, -52.1953125, -46.10546875, -40.015625, -33.92578125, -27.8359375, -21.74609375, -15.65625, -9.56640625, -3.4765625, 2.61328125, 8.703125, 14.79296875, 20.8828125, 26.97265625, 33.0625, 39.15234375, 45.2421875, 51.33203125, 57.421875, 63.51171875, 69.6015625, 75.69140625, 81.78125, 87.87109375, 93.9609375, 100.05078125, 106.140625, 112.23046875, 118.3203125, 124.41015625, 130.5]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 9.0, 10.0, 12.0, 14.0, 21.0, 15.0, 28.0, 30.0, 40.0, 51.0, 83.0, 104.0, 151.0, 280.0, 516.0, 1159.0, 3071.0, 9541.0, 40129.0, 1737747.0, 2343235.0, 42357.0, 9685.0, 3232.0, 1247.0, 560.0, 297.0, 184.0, 122.0, 75.0, 58.0, 46.0, 38.0, 26.0, 25.0, 16.0, 14.0, 14.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-319.0, -308.71484375, -298.4296875, -288.14453125, -277.859375, -267.57421875, -257.2890625, -247.00390625, -236.71875, -226.43359375, -216.1484375, -205.86328125, -195.578125, -185.29296875, -175.0078125, -164.72265625, -154.4375, -144.15234375, -133.8671875, -123.58203125, -113.296875, -103.01171875, -92.7265625, -82.44140625, -72.15625, -61.87109375, -51.5859375, -41.30078125, -31.015625, -20.73046875, -10.4453125, -0.16015625, 10.125, 20.41015625, 30.6953125, 40.98046875, 51.265625, 61.55078125, 71.8359375, 82.12109375, 92.40625, 102.69140625, 112.9765625, 123.26171875, 133.546875, 143.83203125, 154.1171875, 164.40234375, 174.6875, 184.97265625, 195.2578125, 205.54296875, 215.828125, 226.11328125, 236.3984375, 246.68359375, 256.96875, 267.25390625, 277.5390625, 287.82421875, 298.109375, 308.39453125, 318.6796875, 328.96484375, 339.25]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 8.0, 11.0, 28.0, 26.0, 40.0, 71.0, 130.0, 194.0, 169.0, 111.0, 60.0, 44.0, 28.0, 17.0, 13.0, 19.0, 5.0, 1.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.8833312988281, -399.8243103027344, -379.7652587890625, -359.70623779296875, -339.647216796875, -319.58819580078125, -299.5291442871094, -279.4701232910156, -259.41107177734375, -239.35203552246094, -219.2930145263672, -199.23397827148438, -179.17495727539062, -159.1159210205078, -139.056884765625, -118.99786376953125, -98.9388427734375, -78.87981414794922, -58.82078170776367, -38.761749267578125, -18.702720642089844, 1.3563079833984375, 21.41534423828125, 41.474365234375, 61.53340148925781, 81.5924301147461, 101.65145874023438, 121.71049499511719, 141.76953125, 161.82855224609375, 181.88758850097656, 201.9466094970703, 222.005615234375, 242.0646514892578, 262.1236877441406, 282.1827087402344, 302.2417297363281, 322.30078125, 342.35980224609375, 362.4188232421875, 382.47784423828125, 402.536865234375, 422.5959167480469, 442.6549377441406, 462.7139587402344, 482.77301025390625, 502.83203125, 522.8910522460938, 542.9500732421875, 563.0090942382812, 583.068115234375, 603.127197265625, 623.1862182617188, 643.2452392578125, 663.3042602539062, 683.36328125, 703.42236328125, 723.4813842773438, 743.5404052734375, 763.5994873046875, 783.6585083007812, 803.717529296875, 823.7765502929688, 843.8355712890625, 863.8945922851562]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 9.0, 10.0, 9.0, 9.0, 17.0, 11.0, 19.0, 18.0, 16.0, 18.0, 25.0, 22.0, 28.0, 34.0, 31.0, 35.0, 21.0, 35.0, 36.0, 37.0, 30.0, 46.0, 33.0, 24.0, 38.0, 35.0, 36.0, 28.0, 25.0, 32.0, 24.0, 29.0, 21.0, 23.0, 19.0, 17.0, 13.0, 20.0, 6.0, 10.0, 7.0, 11.0, 8.0, 4.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-271.6313781738281, -262.5910339355469, -253.55068969726562, -244.51036071777344, -235.4700164794922, -226.42967224121094, -217.38934326171875, -208.3489990234375, -199.30865478515625, -190.268310546875, -181.22796630859375, -172.18763732910156, -163.1472930908203, -154.10694885253906, -145.06661987304688, -136.02627563476562, -126.98593139648438, -117.94558715820312, -108.9052505493164, -99.86491394042969, -90.82456970214844, -81.78422546386719, -72.74388885498047, -63.703548431396484, -54.6632080078125, -45.622867584228516, -36.58252716064453, -27.542186737060547, -18.501846313476562, -9.461505889892578, -0.42116546630859375, 8.61917495727539, 17.65948486328125, 26.699825286865234, 35.74016571044922, 44.7805061340332, 53.82084655761719, 62.86118698120117, 71.90152740478516, 80.94186401367188, 89.98220825195312, 99.02255249023438, 108.0628890991211, 117.10322570800781, 126.14356994628906, 135.1839141845703, 144.2242431640625, 153.26458740234375, 162.304931640625, 171.34527587890625, 180.3856201171875, 189.4259490966797, 198.46629333496094, 207.5066375732422, 216.54696655273438, 225.58731079101562, 234.62765502929688, 243.66799926757812, 252.70834350585938, 261.7486877441406, 270.78900146484375, 279.829345703125, 288.86968994140625, 297.9100341796875, 306.95037841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 5.0, 8.0, 19.0, 18.0, 17.0, 17.0, 25.0, 28.0, 23.0, 30.0, 31.0, 43.0, 43.0, 40.0, 53.0, 44.0, 55.0, 56.0, 50.0, 54.0, 38.0, 38.0, 27.0, 42.0, 27.0, 21.0, 14.0, 27.0, 18.0, 17.0, 9.0, 9.0, 11.0, 7.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5, -42.8916015625, -41.283203125, -39.6748046875, -38.06640625, -36.4580078125, -34.849609375, -33.2412109375, -31.6328125, -30.0244140625, -28.416015625, -26.8076171875, -25.19921875, -23.5908203125, -21.982421875, -20.3740234375, -18.765625, -17.1572265625, -15.548828125, -13.9404296875, -12.33203125, -10.7236328125, -9.115234375, -7.5068359375, -5.8984375, -4.2900390625, -2.681640625, -1.0732421875, 0.53515625, 2.1435546875, 3.751953125, 5.3603515625, 6.96875, 8.5771484375, 10.185546875, 11.7939453125, 13.40234375, 15.0107421875, 16.619140625, 18.2275390625, 19.8359375, 21.4443359375, 23.052734375, 24.6611328125, 26.26953125, 27.8779296875, 29.486328125, 31.0947265625, 32.703125, 34.3115234375, 35.919921875, 37.5283203125, 39.13671875, 40.7451171875, 42.353515625, 43.9619140625, 45.5703125, 47.1787109375, 48.787109375, 50.3955078125, 52.00390625, 53.6123046875, 55.220703125, 56.8291015625, 58.4375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 6.0, 19.0, 15.0, 22.0, 17.0, 31.0, 64.0, 81.0, 99.0, 169.0, 233.0, 455.0, 660.0, 1221.0, 2402.0, 5301.0, 13121.0, 40953.0, 174907.0, 594000.0, 155189.0, 37205.0, 12269.0, 4826.0, 2257.0, 1173.0, 684.0, 376.0, 247.0, 170.0, 106.0, 80.0, 54.0, 34.0, 32.0, 20.0, 16.0, 11.0, 10.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.71875, -13.28271484375, -12.8466796875, -12.41064453125, -11.974609375, -11.53857421875, -11.1025390625, -10.66650390625, -10.23046875, -9.79443359375, -9.3583984375, -8.92236328125, -8.486328125, -8.05029296875, -7.6142578125, -7.17822265625, -6.7421875, -6.30615234375, -5.8701171875, -5.43408203125, -4.998046875, -4.56201171875, -4.1259765625, -3.68994140625, -3.25390625, -2.81787109375, -2.3818359375, -1.94580078125, -1.509765625, -1.07373046875, -0.6376953125, -0.20166015625, 0.234375, 0.67041015625, 1.1064453125, 1.54248046875, 1.978515625, 2.41455078125, 2.8505859375, 3.28662109375, 3.72265625, 4.15869140625, 4.5947265625, 5.03076171875, 5.466796875, 5.90283203125, 6.3388671875, 6.77490234375, 7.2109375, 7.64697265625, 8.0830078125, 8.51904296875, 8.955078125, 9.39111328125, 9.8271484375, 10.26318359375, 10.69921875, 11.13525390625, 11.5712890625, 12.00732421875, 12.443359375, 12.87939453125, 13.3154296875, 13.75146484375, 14.1875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 13.0, 12.0, 8.0, 10.0, 12.0, 16.0, 21.0, 24.0, 25.0, 22.0, 32.0, 34.0, 32.0, 30.0, 38.0, 31.0, 32.0, 42.0, 42.0, 1058.0, 40.0, 37.0, 29.0, 38.0, 30.0, 41.0, 27.0, 28.0, 32.0, 30.0, 23.0, 12.0, 23.0, 16.0, 16.0, 8.0, 11.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-30.71875, -29.78564453125, -28.8525390625, -27.91943359375, -26.986328125, -26.05322265625, -25.1201171875, -24.18701171875, -23.25390625, -22.32080078125, -21.3876953125, -20.45458984375, -19.521484375, -18.58837890625, -17.6552734375, -16.72216796875, -15.7890625, -14.85595703125, -13.9228515625, -12.98974609375, -12.056640625, -11.12353515625, -10.1904296875, -9.25732421875, -8.32421875, -7.39111328125, -6.4580078125, -5.52490234375, -4.591796875, -3.65869140625, -2.7255859375, -1.79248046875, -0.859375, 0.07373046875, 1.0068359375, 1.93994140625, 2.873046875, 3.80615234375, 4.7392578125, 5.67236328125, 6.60546875, 7.53857421875, 8.4716796875, 9.40478515625, 10.337890625, 11.27099609375, 12.2041015625, 13.13720703125, 14.0703125, 15.00341796875, 15.9365234375, 16.86962890625, 17.802734375, 18.73583984375, 19.6689453125, 20.60205078125, 21.53515625, 22.46826171875, 23.4013671875, 24.33447265625, 25.267578125, 26.20068359375, 27.1337890625, 28.06689453125, 29.0]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 9.0, 8.0, 14.0, 23.0, 34.0, 35.0, 63.0, 90.0, 116.0, 193.0, 249.0, 338.0, 540.0, 773.0, 1236.0, 1899.0, 3018.0, 4752.0, 7770.0, 12928.0, 22229.0, 39487.0, 72856.0, 141735.0, 1104096.0, 406431.0, 124952.0, 64349.0, 35431.0, 20247.0, 11916.0, 7137.0, 4200.0, 2733.0, 1762.0, 1130.0, 741.0, 504.0, 360.0, 236.0, 150.0, 119.0, 64.0, 54.0, 44.0, 27.0, 16.0, 9.0, 19.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.216796875, -3.119049072265625, -3.02130126953125, -2.923553466796875, -2.8258056640625, -2.728057861328125, -2.63031005859375, -2.532562255859375, -2.434814453125, -2.337066650390625, -2.23931884765625, -2.141571044921875, -2.0438232421875, -1.946075439453125, -1.84832763671875, -1.750579833984375, -1.65283203125, -1.555084228515625, -1.45733642578125, -1.359588623046875, -1.2618408203125, -1.164093017578125, -1.06634521484375, -0.968597412109375, -0.870849609375, -0.773101806640625, -0.67535400390625, -0.577606201171875, -0.4798583984375, -0.382110595703125, -0.28436279296875, -0.186614990234375, -0.0888671875, 0.008880615234375, 0.10662841796875, 0.204376220703125, 0.3021240234375, 0.399871826171875, 0.49761962890625, 0.595367431640625, 0.693115234375, 0.790863037109375, 0.88861083984375, 0.986358642578125, 1.0841064453125, 1.181854248046875, 1.27960205078125, 1.377349853515625, 1.47509765625, 1.572845458984375, 1.67059326171875, 1.768341064453125, 1.8660888671875, 1.963836669921875, 2.06158447265625, 2.159332275390625, 2.257080078125, 2.354827880859375, 2.45257568359375, 2.550323486328125, 2.6480712890625, 2.745819091796875, 2.84356689453125, 2.941314697265625, 3.0390625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 4.0, 6.0, 5.0, 3.0, 10.0, 14.0, 14.0, 24.0, 25.0, 18.0, 29.0, 29.0, 43.0, 62.0, 83.0, 163.0, 114.0, 62.0, 60.0, 44.0, 29.0, 26.0, 23.0, 21.0, 12.0, 9.0, 9.0, 9.0, 11.0, 7.0, 5.0, 0.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.8662109375, -0.8425979614257812, -0.8189849853515625, -0.7953720092773438, -0.771759033203125, -0.7481460571289062, -0.7245330810546875, -0.7009201049804688, -0.67730712890625, -0.6536941528320312, -0.6300811767578125, -0.6064682006835938, -0.582855224609375, -0.5592422485351562, -0.5356292724609375, -0.5120162963867188, -0.4884033203125, -0.46479034423828125, -0.4411773681640625, -0.41756439208984375, -0.393951416015625, -0.37033843994140625, -0.3467254638671875, -0.32311248779296875, -0.29949951171875, -0.27588653564453125, -0.2522735595703125, -0.22866058349609375, -0.205047607421875, -0.18143463134765625, -0.1578216552734375, -0.13420867919921875, -0.110595703125, -0.08698272705078125, -0.0633697509765625, -0.03975677490234375, -0.016143798828125, 0.00746917724609375, 0.0310821533203125, 0.05469512939453125, 0.07830810546875, 0.10192108154296875, 0.1255340576171875, 0.14914703369140625, 0.172760009765625, 0.19637298583984375, 0.2199859619140625, 0.24359893798828125, 0.2672119140625, 0.29082489013671875, 0.3144378662109375, 0.33805084228515625, 0.361663818359375, 0.38527679443359375, 0.4088897705078125, 0.43250274658203125, 0.45611572265625, 0.47972869873046875, 0.5033416748046875, 0.5269546508789062, 0.550567626953125, 0.5741806030273438, 0.5977935791015625, 0.6214065551757812, 0.64501953125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 8.0, 8.0, 13.0, 15.0, 24.0, 23.0, 40.0, 45.0, 83.0, 101.0, 226.0, 1046862.0, 570.0, 156.0, 85.0, 57.0, 38.0, 23.0, 22.0, 25.0, 21.0, 15.0, 10.0, 8.0, 4.0, 5.0, 8.0, 2.0, 8.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.03125, -20.2744140625, -19.517578125, -18.7607421875, -18.00390625, -17.2470703125, -16.490234375, -15.7333984375, -14.9765625, -14.2197265625, -13.462890625, -12.7060546875, -11.94921875, -11.1923828125, -10.435546875, -9.6787109375, -8.921875, -8.1650390625, -7.408203125, -6.6513671875, -5.89453125, -5.1376953125, -4.380859375, -3.6240234375, -2.8671875, -2.1103515625, -1.353515625, -0.5966796875, 0.16015625, 0.9169921875, 1.673828125, 2.4306640625, 3.1875, 3.9443359375, 4.701171875, 5.4580078125, 6.21484375, 6.9716796875, 7.728515625, 8.4853515625, 9.2421875, 9.9990234375, 10.755859375, 11.5126953125, 12.26953125, 13.0263671875, 13.783203125, 14.5400390625, 15.296875, 16.0537109375, 16.810546875, 17.5673828125, 18.32421875, 19.0810546875, 19.837890625, 20.5947265625, 21.3515625, 22.1083984375, 22.865234375, 23.6220703125, 24.37890625, 25.1357421875, 25.892578125, 26.6494140625, 27.40625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [7.0, 1012.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46293744444847107, -0.1248236894607544, 0.21329006552696228, 0.5514037609100342, 0.8895175457000732, 1.2276313304901123, 1.5657449960708618, 1.9038587808609009, 2.2419726848602295, 2.5800864696502686, 2.9182002544403076, 3.2563138008117676, 3.5944275856018066, 3.9325413703918457, 4.270655155181885, 4.608768939971924, 4.946882724761963, 5.284996509552002, 5.623110294342041, 5.96122407913208, 6.299337863922119, 6.637451648712158, 6.975564956665039, 7.313678741455078, 7.651792526245117, 7.989906311035156, 8.328020095825195, 8.666133880615234, 9.004247665405273, 9.342361450195312, 9.680475234985352, 10.01858901977539, 10.356701850891113, 10.694815635681152, 11.032929420471191, 11.37104320526123, 11.70915699005127, 12.047270774841309, 12.385384559631348, 12.723498344421387, 13.061612129211426, 13.399725914001465, 13.737839698791504, 14.075953483581543, 14.414067268371582, 14.752181053161621, 15.09029483795166, 15.4284086227417, 15.766521453857422, 16.10463523864746, 16.4427490234375, 16.78086280822754, 17.118976593017578, 17.457090377807617, 17.795204162597656, 18.133317947387695, 18.471431732177734, 18.809545516967773, 19.147659301757812, 19.48577308654785, 19.82388687133789, 20.16200065612793, 20.50011444091797, 20.838228225708008, 21.176342010498047]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 6.0, 9.0, 20.0, 11.0, 10.0, 19.0, 21.0, 32.0, 47.0, 25.0, 30.0, 28.0, 42.0, 41.0, 37.0, 35.0, 42.0, 50.0, 39.0, 40.0, 38.0, 35.0, 39.0, 35.0, 23.0, 35.0, 20.0, 35.0, 24.0, 28.0, 17.0, 7.0, 20.0, 10.0, 9.0, 13.0, 6.0, 4.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9654772281646729, -1.9001182317733765, -1.83475923538208, -1.7694002389907837, -1.7040412425994873, -1.6386821269989014, -1.573323130607605, -1.5079641342163086, -1.4426051378250122, -1.3772461414337158, -1.3118871450424194, -1.246528148651123, -1.181169033050537, -1.1158101558685303, -1.0504510402679443, -0.985092043876648, -0.9197330474853516, -0.8543740510940552, -0.7890150547027588, -0.7236559987068176, -0.6582970023155212, -0.5929380059242249, -0.5275789499282837, -0.4622199535369873, -0.3968609571456909, -0.33150196075439453, -0.26614293456077576, -0.20078392326831818, -0.1354249119758606, -0.07006591558456421, -0.004706889390945435, 0.06065213680267334, 0.12601137161254883, 0.1913703829050064, 0.256729394197464, 0.32208842039108276, 0.38744741678237915, 0.45280641317367554, 0.5181654691696167, 0.5835244655609131, 0.6488834619522095, 0.7142424583435059, 0.7796014547348022, 0.8449605107307434, 0.9103195071220398, 0.9756785035133362, 1.0410375595092773, 1.1063965559005737, 1.1717555522918701, 1.2371145486831665, 1.302473545074463, 1.3678325414657593, 1.4331915378570557, 1.4985506534576416, 1.563909649848938, 1.6292686462402344, 1.6946276426315308, 1.7599866390228271, 1.8253456354141235, 1.89070463180542, 1.9560637474060059, 2.0214226245880127, 2.0867817401885986, 2.1521406173706055, 2.2174997329711914]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 5.0, 8.0, 19.0, 18.0, 18.0, 16.0, 25.0, 28.0, 23.0, 31.0, 30.0, 43.0, 43.0, 40.0, 53.0, 44.0, 55.0, 56.0, 50.0, 54.0, 38.0, 39.0, 26.0, 42.0, 27.0, 21.0, 14.0, 28.0, 17.0, 17.0, 10.0, 8.0, 11.0, 7.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.46875, -42.86083984375, -41.2529296875, -39.64501953125, -38.037109375, -36.42919921875, -34.8212890625, -33.21337890625, -31.60546875, -29.99755859375, -28.3896484375, -26.78173828125, -25.173828125, -23.56591796875, -21.9580078125, -20.35009765625, -18.7421875, -17.13427734375, -15.5263671875, -13.91845703125, -12.310546875, -10.70263671875, -9.0947265625, -7.48681640625, -5.87890625, -4.27099609375, -2.6630859375, -1.05517578125, 0.552734375, 2.16064453125, 3.7685546875, 5.37646484375, 6.984375, 8.59228515625, 10.2001953125, 11.80810546875, 13.416015625, 15.02392578125, 16.6318359375, 18.23974609375, 19.84765625, 21.45556640625, 23.0634765625, 24.67138671875, 26.279296875, 27.88720703125, 29.4951171875, 31.10302734375, 32.7109375, 34.31884765625, 35.9267578125, 37.53466796875, 39.142578125, 40.75048828125, 42.3583984375, 43.96630859375, 45.57421875, 47.18212890625, 48.7900390625, 50.39794921875, 52.005859375, 53.61376953125, 55.2216796875, 56.82958984375, 58.4375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 10.0, 13.0, 18.0, 19.0, 34.0, 40.0, 67.0, 84.0, 151.0, 221.0, 281.0, 425.0, 727.0, 1150.0, 1793.0, 2818.0, 4758.0, 8208.0, 15881.0, 36256.0, 157698.0, 673274.0, 87195.0, 27122.0, 12634.0, 6956.0, 3958.0, 2414.0, 1526.0, 947.0, 621.0, 407.0, 263.0, 183.0, 126.0, 85.0, 52.0, 45.0, 32.0, 21.0, 15.0, 6.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.90625, -58.83056640625, -56.7548828125, -54.67919921875, -52.603515625, -50.52783203125, -48.4521484375, -46.37646484375, -44.30078125, -42.22509765625, -40.1494140625, -38.07373046875, -35.998046875, -33.92236328125, -31.8466796875, -29.77099609375, -27.6953125, -25.61962890625, -23.5439453125, -21.46826171875, -19.392578125, -17.31689453125, -15.2412109375, -13.16552734375, -11.08984375, -9.01416015625, -6.9384765625, -4.86279296875, -2.787109375, -0.71142578125, 1.3642578125, 3.43994140625, 5.515625, 7.59130859375, 9.6669921875, 11.74267578125, 13.818359375, 15.89404296875, 17.9697265625, 20.04541015625, 22.12109375, 24.19677734375, 26.2724609375, 28.34814453125, 30.423828125, 32.49951171875, 34.5751953125, 36.65087890625, 38.7265625, 40.80224609375, 42.8779296875, 44.95361328125, 47.029296875, 49.10498046875, 51.1806640625, 53.25634765625, 55.33203125, 57.40771484375, 59.4833984375, 61.55908203125, 63.634765625, 65.71044921875, 67.7861328125, 69.86181640625, 71.9375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 12.0, 7.0, 11.0, 17.0, 13.0, 19.0, 28.0, 24.0, 32.0, 43.0, 43.0, 55.0, 61.0, 72.0, 99.0, 213.0, 1709.0, 107.0, 74.0, 76.0, 51.0, 50.0, 50.0, 26.0, 22.0, 30.0, 16.0, 18.0, 14.0, 14.0, 9.0, 6.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.0, -150.0390625, -144.078125, -138.1171875, -132.15625, -126.1953125, -120.234375, -114.2734375, -108.3125, -102.3515625, -96.390625, -90.4296875, -84.46875, -78.5078125, -72.546875, -66.5859375, -60.625, -54.6640625, -48.703125, -42.7421875, -36.78125, -30.8203125, -24.859375, -18.8984375, -12.9375, -6.9765625, -1.015625, 4.9453125, 10.90625, 16.8671875, 22.828125, 28.7890625, 34.75, 40.7109375, 46.671875, 52.6328125, 58.59375, 64.5546875, 70.515625, 76.4765625, 82.4375, 88.3984375, 94.359375, 100.3203125, 106.28125, 112.2421875, 118.203125, 124.1640625, 130.125, 136.0859375, 142.046875, 148.0078125, 153.96875, 159.9296875, 165.890625, 171.8515625, 177.8125, 183.7734375, 189.734375, 195.6953125, 201.65625, 207.6171875, 213.578125, 219.5390625, 225.5]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 10.0, 10.0, 24.0, 24.0, 30.0, 28.0, 53.0, 89.0, 119.0, 212.0, 368.0, 1117.0, 5204.0, 47509.0, 2996302.0, 84454.0, 7490.0, 1485.0, 482.0, 216.0, 136.0, 102.0, 59.0, 37.0, 34.0, 32.0, 18.0, 18.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-486.5, -472.01953125, -457.5390625, -443.05859375, -428.578125, -414.09765625, -399.6171875, -385.13671875, -370.65625, -356.17578125, -341.6953125, -327.21484375, -312.734375, -298.25390625, -283.7734375, -269.29296875, -254.8125, -240.33203125, -225.8515625, -211.37109375, -196.890625, -182.41015625, -167.9296875, -153.44921875, -138.96875, -124.48828125, -110.0078125, -95.52734375, -81.046875, -66.56640625, -52.0859375, -37.60546875, -23.125, -8.64453125, 5.8359375, 20.31640625, 34.796875, 49.27734375, 63.7578125, 78.23828125, 92.71875, 107.19921875, 121.6796875, 136.16015625, 150.640625, 165.12109375, 179.6015625, 194.08203125, 208.5625, 223.04296875, 237.5234375, 252.00390625, 266.484375, 280.96484375, 295.4453125, 309.92578125, 324.40625, 338.88671875, 353.3671875, 367.84765625, 382.328125, 396.80859375, 411.2890625, 425.76953125, 440.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.0, 905.0, 41.0], "bins": [-8190.32373046875, -8059.06640625, -7927.80908203125, -7796.5517578125, -7665.29443359375, -7534.037109375, -7402.77978515625, -7271.5224609375, -7140.26513671875, -7009.0078125, -6877.75048828125, -6746.4931640625, -6615.23583984375, -6483.978515625, -6352.72119140625, -6221.4638671875, -6090.20703125, -5958.94970703125, -5827.6923828125, -5696.43505859375, -5565.177734375, -5433.92041015625, -5302.6630859375, -5171.40576171875, -5040.1484375, -4908.89111328125, -4777.6337890625, -4646.37646484375, -4515.119140625, -4383.86181640625, -4252.6044921875, -4121.34716796875, -3990.08935546875, -3858.83203125, -3727.57470703125, -3596.3173828125, -3465.06005859375, -3333.802734375, -3202.54541015625, -3071.2880859375, -2940.031005859375, -2808.773681640625, -2677.516357421875, -2546.259033203125, -2415.001708984375, -2283.744384765625, -2152.4873046875, -2021.2298583984375, -1889.9725341796875, -1758.7152099609375, -1627.4578857421875, -1496.20068359375, -1364.943359375, -1233.68603515625, -1102.4287109375, -971.17138671875, -839.9140625, -708.65673828125, -577.3994140625, -446.14215087890625, -314.88482666015625, -183.62750244140625, -52.3702392578125, 78.8870849609375, 210.1444091796875]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 9.0, 4.0, 12.0, 9.0, 15.0, 12.0, 14.0, 17.0, 18.0, 22.0, 31.0, 31.0, 33.0, 34.0, 37.0, 33.0, 35.0, 41.0, 32.0, 42.0, 28.0, 49.0, 37.0, 36.0, 31.0, 36.0, 30.0, 25.0, 38.0, 20.0, 22.0, 23.0, 24.0, 20.0, 10.0, 13.0, 14.0, 10.0, 8.0, 10.0, 6.0, 3.0, 8.0, 4.0, 8.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-363.2686767578125, -351.8797912597656, -340.49090576171875, -329.1020202636719, -317.713134765625, -306.32421875, -294.9353332519531, -283.54644775390625, -272.1575622558594, -260.7686767578125, -249.37979125976562, -237.9908905029297, -226.6020050048828, -215.21311950683594, -203.82421875, -192.43533325195312, -181.04644775390625, -169.65756225585938, -158.2686767578125, -146.87977600097656, -135.4908905029297, -124.10200500488281, -112.7131118774414, -101.32421875, -89.93533325195312, -78.54644775390625, -67.15755462646484, -55.7686653137207, -44.37977600097656, -32.99088668823242, -21.60199737548828, -10.213104248046875, 1.17578125, 12.56467056274414, 23.95355987548828, 35.34244918823242, 46.73133850097656, 58.1202278137207, 69.50911712646484, 80.89801025390625, 92.28689575195312, 103.67578125, 115.0646743774414, 126.45356750488281, 137.8424530029297, 149.23133850097656, 160.6202392578125, 172.00912475585938, 183.39801025390625, 194.78689575195312, 206.17578125, 217.56468200683594, 228.9535675048828, 240.3424530029297, 251.73135375976562, 263.1202392578125, 274.5091247558594, 285.89801025390625, 297.2868957519531, 308.67578125, 320.064697265625, 331.4535827636719, 342.84246826171875, 354.2313537597656, 365.6202392578125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 2.0, 4.0, 5.0, 7.0, 10.0, 9.0, 10.0, 13.0, 25.0, 22.0, 27.0, 19.0, 28.0, 37.0, 31.0, 43.0, 28.0, 45.0, 58.0, 44.0, 41.0, 53.0, 56.0, 35.0, 42.0, 38.0, 33.0, 34.0, 30.0, 25.0, 14.0, 19.0, 10.0, 18.0, 10.0, 15.0, 11.0, 7.0, 9.0, 5.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.59375, -43.9951171875, -42.396484375, -40.7978515625, -39.19921875, -37.6005859375, -36.001953125, -34.4033203125, -32.8046875, -31.2060546875, -29.607421875, -28.0087890625, -26.41015625, -24.8115234375, -23.212890625, -21.6142578125, -20.015625, -18.4169921875, -16.818359375, -15.2197265625, -13.62109375, -12.0224609375, -10.423828125, -8.8251953125, -7.2265625, -5.6279296875, -4.029296875, -2.4306640625, -0.83203125, 0.7666015625, 2.365234375, 3.9638671875, 5.5625, 7.1611328125, 8.759765625, 10.3583984375, 11.95703125, 13.5556640625, 15.154296875, 16.7529296875, 18.3515625, 19.9501953125, 21.548828125, 23.1474609375, 24.74609375, 26.3447265625, 27.943359375, 29.5419921875, 31.140625, 32.7392578125, 34.337890625, 35.9365234375, 37.53515625, 39.1337890625, 40.732421875, 42.3310546875, 43.9296875, 45.5283203125, 47.126953125, 48.7255859375, 50.32421875, 51.9228515625, 53.521484375, 55.1201171875, 56.71875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 6.0, 8.0, 8.0, 8.0, 15.0, 14.0, 23.0, 30.0, 53.0, 72.0, 120.0, 219.0, 344.0, 604.0, 1127.0, 2278.0, 5163.0, 13063.0, 71325.0, 3426351.0, 633047.0, 24821.0, 8179.0, 3495.0, 1745.0, 838.0, 523.0, 312.0, 148.0, 107.0, 57.0, 42.0, 32.0, 20.0, 19.0, 5.0, 11.0, 5.0, 8.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.25, -173.228515625, -167.20703125, -161.185546875, -155.1640625, -149.142578125, -143.12109375, -137.099609375, -131.078125, -125.056640625, -119.03515625, -113.013671875, -106.9921875, -100.970703125, -94.94921875, -88.927734375, -82.90625, -76.884765625, -70.86328125, -64.841796875, -58.8203125, -52.798828125, -46.77734375, -40.755859375, -34.734375, -28.712890625, -22.69140625, -16.669921875, -10.6484375, -4.626953125, 1.39453125, 7.416015625, 13.4375, 19.458984375, 25.48046875, 31.501953125, 37.5234375, 43.544921875, 49.56640625, 55.587890625, 61.609375, 67.630859375, 73.65234375, 79.673828125, 85.6953125, 91.716796875, 97.73828125, 103.759765625, 109.78125, 115.802734375, 121.82421875, 127.845703125, 133.8671875, 139.888671875, 145.91015625, 151.931640625, 157.953125, 163.974609375, 169.99609375, 176.017578125, 182.0390625, 188.060546875, 194.08203125, 200.103515625, 206.125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 10.0, 17.0, 19.0, 34.0, 71.0, 142.0, 346.0, 885.0, 1442.0, 585.0, 260.0, 97.0, 56.0, 36.0, 24.0, 16.0, 9.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.0, -203.509765625, -197.01953125, -190.529296875, -184.0390625, -177.548828125, -171.05859375, -164.568359375, -158.078125, -151.587890625, -145.09765625, -138.607421875, -132.1171875, -125.626953125, -119.13671875, -112.646484375, -106.15625, -99.666015625, -93.17578125, -86.685546875, -80.1953125, -73.705078125, -67.21484375, -60.724609375, -54.234375, -47.744140625, -41.25390625, -34.763671875, -28.2734375, -21.783203125, -15.29296875, -8.802734375, -2.3125, 4.177734375, 10.66796875, 17.158203125, 23.6484375, 30.138671875, 36.62890625, 43.119140625, 49.609375, 56.099609375, 62.58984375, 69.080078125, 75.5703125, 82.060546875, 88.55078125, 95.041015625, 101.53125, 108.021484375, 114.51171875, 121.001953125, 127.4921875, 133.982421875, 140.47265625, 146.962890625, 153.453125, 159.943359375, 166.43359375, 172.923828125, 179.4140625, 185.904296875, 192.39453125, 198.884765625, 205.375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 4.0, 7.0, 5.0, 14.0, 12.0, 24.0, 33.0, 44.0, 59.0, 80.0, 113.0, 188.0, 280.0, 592.0, 1375.0, 3984.0, 17229.0, 271074.0, 3845174.0, 42543.0, 7278.0, 2158.0, 851.0, 393.0, 272.0, 146.0, 98.0, 72.0, 43.0, 37.0, 18.0, 27.0, 14.0, 15.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-391.5, -378.546875, -365.59375, -352.640625, -339.6875, -326.734375, -313.78125, -300.828125, -287.875, -274.921875, -261.96875, -249.015625, -236.0625, -223.109375, -210.15625, -197.203125, -184.25, -171.296875, -158.34375, -145.390625, -132.4375, -119.484375, -106.53125, -93.578125, -80.625, -67.671875, -54.71875, -41.765625, -28.8125, -15.859375, -2.90625, 10.046875, 23.0, 35.953125, 48.90625, 61.859375, 74.8125, 87.765625, 100.71875, 113.671875, 126.625, 139.578125, 152.53125, 165.484375, 178.4375, 191.390625, 204.34375, 217.296875, 230.25, 243.203125, 256.15625, 269.109375, 282.0625, 295.015625, 307.96875, 320.921875, 333.875, 346.828125, 359.78125, 372.734375, 385.6875, 398.640625, 411.59375, 424.546875, 437.5]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 5.0, 8.0, 16.0, 19.0, 16.0, 36.0, 64.0, 75.0, 125.0, 143.0, 120.0, 117.0, 73.0, 54.0, 38.0, 21.0, 16.0, 12.0, 4.0, 10.0, 7.0, 2.0, 5.0, 0.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-459.1439208984375, -443.13702392578125, -427.130126953125, -411.1232604980469, -395.1163635253906, -379.1094665527344, -363.10260009765625, -347.095703125, -331.08880615234375, -315.0819091796875, -299.07501220703125, -283.0681457519531, -267.0612487792969, -251.05435180664062, -235.04747009277344, -219.04058837890625, -203.03369140625, -187.02679443359375, -171.01991271972656, -155.01303100585938, -139.00613403320312, -122.9992446899414, -106.99235534667969, -90.98546600341797, -74.97857666015625, -58.97168731689453, -42.96479797363281, -26.957908630371094, -10.951019287109375, 5.055870056152344, 21.062759399414062, 37.06964874267578, 53.07647705078125, 69.08336639404297, 85.09025573730469, 101.0971450805664, 117.10403442382812, 133.11093139648438, 149.11781311035156, 165.12469482421875, 181.131591796875, 197.13848876953125, 213.14537048339844, 229.15225219726562, 245.15914916992188, 261.1660461425781, 277.17291259765625, 293.1798095703125, 309.18670654296875, 325.193603515625, 341.20050048828125, 357.2073669433594, 373.2142639160156, 389.2211608886719, 405.22802734375, 421.23492431640625, 437.2418212890625, 453.24871826171875, 469.255615234375, 485.2624816894531, 501.2693786621094, 517.2762451171875, 533.2831420898438, 549.2900390625, 565.2969360351562]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 4.0, 12.0, 8.0, 12.0, 5.0, 14.0, 13.0, 19.0, 22.0, 23.0, 26.0, 25.0, 32.0, 27.0, 33.0, 37.0, 42.0, 55.0, 40.0, 49.0, 47.0, 49.0, 50.0, 37.0, 41.0, 39.0, 33.0, 32.0, 33.0, 25.0, 21.0, 19.0, 17.0, 10.0, 9.0, 17.0, 8.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.869384765625, -339.45782470703125, -328.0462951660156, -316.6347351074219, -305.22320556640625, -293.8116455078125, -282.40008544921875, -270.9885559082031, -259.5770263671875, -248.1654815673828, -236.75393676757812, -225.34237670898438, -213.93084716796875, -202.519287109375, -191.1077423095703, -179.69619750976562, -168.28463745117188, -156.8730926513672, -145.4615478515625, -134.04998779296875, -122.6384506225586, -111.2269058227539, -99.81535339355469, -88.40380859375, -76.99226379394531, -65.58071899414062, -54.16917037963867, -42.75762176513672, -31.34607696533203, -19.934532165527344, -8.522979736328125, 2.8885650634765625, 14.30010986328125, 25.71165657043457, 37.12320327758789, 48.534751892089844, 59.94629669189453, 71.35784149169922, 82.76939392089844, 94.18093872070312, 105.59248352050781, 117.0040283203125, 128.4155731201172, 139.82711791992188, 151.23867797851562, 162.65020751953125, 174.061767578125, 185.4733123779297, 196.88485717773438, 208.29640197753906, 219.70794677734375, 231.1195068359375, 242.53103637695312, 253.94259643554688, 265.3541259765625, 276.76568603515625, 288.17724609375, 299.58880615234375, 311.0003356933594, 322.4118957519531, 333.82342529296875, 345.2349853515625, 356.64654541015625, 368.0580749511719, 379.4696044921875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 12.0, 18.0, 11.0, 11.0, 10.0, 14.0, 30.0, 25.0, 20.0, 37.0, 38.0, 44.0, 47.0, 48.0, 46.0, 47.0, 43.0, 54.0, 50.0, 41.0, 48.0, 40.0, 36.0, 29.0, 32.0, 19.0, 21.0, 23.0, 12.0, 14.0, 14.0, 15.0, 8.0, 7.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.8125, -44.0888671875, -42.365234375, -40.6416015625, -38.91796875, -37.1943359375, -35.470703125, -33.7470703125, -32.0234375, -30.2998046875, -28.576171875, -26.8525390625, -25.12890625, -23.4052734375, -21.681640625, -19.9580078125, -18.234375, -16.5107421875, -14.787109375, -13.0634765625, -11.33984375, -9.6162109375, -7.892578125, -6.1689453125, -4.4453125, -2.7216796875, -0.998046875, 0.7255859375, 2.44921875, 4.1728515625, 5.896484375, 7.6201171875, 9.34375, 11.0673828125, 12.791015625, 14.5146484375, 16.23828125, 17.9619140625, 19.685546875, 21.4091796875, 23.1328125, 24.8564453125, 26.580078125, 28.3037109375, 30.02734375, 31.7509765625, 33.474609375, 35.1982421875, 36.921875, 38.6455078125, 40.369140625, 42.0927734375, 43.81640625, 45.5400390625, 47.263671875, 48.9873046875, 50.7109375, 52.4345703125, 54.158203125, 55.8818359375, 57.60546875, 59.3291015625, 61.052734375, 62.7763671875, 64.5]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 7.0, 18.0, 23.0, 22.0, 28.0, 37.0, 40.0, 64.0, 95.0, 141.0, 167.0, 276.0, 422.0, 702.0, 1003.0, 1743.0, 3440.0, 7990.0, 23805.0, 96224.0, 541140.0, 288118.0, 55234.0, 15476.0, 5761.0, 2565.0, 1458.0, 795.0, 538.0, 384.0, 217.0, 161.0, 161.0, 102.0, 61.0, 45.0, 26.0, 21.0, 15.0, 9.0, 10.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-18.984375, -18.4390869140625, -17.893798828125, -17.3485107421875, -16.80322265625, -16.2579345703125, -15.712646484375, -15.1673583984375, -14.6220703125, -14.0767822265625, -13.531494140625, -12.9862060546875, -12.44091796875, -11.8956298828125, -11.350341796875, -10.8050537109375, -10.259765625, -9.7144775390625, -9.169189453125, -8.6239013671875, -8.07861328125, -7.5333251953125, -6.988037109375, -6.4427490234375, -5.8974609375, -5.3521728515625, -4.806884765625, -4.2615966796875, -3.71630859375, -3.1710205078125, -2.625732421875, -2.0804443359375, -1.53515625, -0.9898681640625, -0.444580078125, 0.1007080078125, 0.64599609375, 1.1912841796875, 1.736572265625, 2.2818603515625, 2.8271484375, 3.3724365234375, 3.917724609375, 4.4630126953125, 5.00830078125, 5.5535888671875, 6.098876953125, 6.6441650390625, 7.189453125, 7.7347412109375, 8.280029296875, 8.8253173828125, 9.37060546875, 9.9158935546875, 10.461181640625, 11.0064697265625, 11.5517578125, 12.0970458984375, 12.642333984375, 13.1876220703125, 13.73291015625, 14.2781982421875, 14.823486328125, 15.3687744140625, 15.9140625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 2.0, 7.0, 9.0, 6.0, 7.0, 9.0, 16.0, 13.0, 15.0, 25.0, 25.0, 23.0, 34.0, 41.0, 27.0, 39.0, 40.0, 53.0, 49.0, 33.0, 1082.0, 41.0, 52.0, 43.0, 44.0, 30.0, 42.0, 26.0, 27.0, 22.0, 24.0, 20.0, 24.0, 13.0, 15.0, 16.0, 9.0, 10.0, 3.0, 3.0, 2.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.64111328125, -35.4697265625, -34.29833984375, -33.126953125, -31.95556640625, -30.7841796875, -29.61279296875, -28.44140625, -27.27001953125, -26.0986328125, -24.92724609375, -23.755859375, -22.58447265625, -21.4130859375, -20.24169921875, -19.0703125, -17.89892578125, -16.7275390625, -15.55615234375, -14.384765625, -13.21337890625, -12.0419921875, -10.87060546875, -9.69921875, -8.52783203125, -7.3564453125, -6.18505859375, -5.013671875, -3.84228515625, -2.6708984375, -1.49951171875, -0.328125, 0.84326171875, 2.0146484375, 3.18603515625, 4.357421875, 5.52880859375, 6.7001953125, 7.87158203125, 9.04296875, 10.21435546875, 11.3857421875, 12.55712890625, 13.728515625, 14.89990234375, 16.0712890625, 17.24267578125, 18.4140625, 19.58544921875, 20.7568359375, 21.92822265625, 23.099609375, 24.27099609375, 25.4423828125, 26.61376953125, 27.78515625, 28.95654296875, 30.1279296875, 31.29931640625, 32.470703125, 33.64208984375, 34.8134765625, 35.98486328125, 37.15625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 13.0, 14.0, 25.0, 29.0, 43.0, 71.0, 110.0, 147.0, 219.0, 349.0, 515.0, 850.0, 1478.0, 2437.0, 4478.0, 8231.0, 16373.0, 33618.0, 74385.0, 185385.0, 1358979.0, 238190.0, 90542.0, 39996.0, 18952.0, 9588.0, 5139.0, 2792.0, 1546.0, 965.0, 545.0, 399.0, 226.0, 169.0, 113.0, 58.0, 45.0, 28.0, 22.0, 19.0, 10.0, 10.0, 5.0, 7.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.60546875, -4.45977783203125, -4.3140869140625, -4.16839599609375, -4.022705078125, -3.87701416015625, -3.7313232421875, -3.58563232421875, -3.43994140625, -3.29425048828125, -3.1485595703125, -3.00286865234375, -2.857177734375, -2.71148681640625, -2.5657958984375, -2.42010498046875, -2.2744140625, -2.12872314453125, -1.9830322265625, -1.83734130859375, -1.691650390625, -1.54595947265625, -1.4002685546875, -1.25457763671875, -1.10888671875, -0.96319580078125, -0.8175048828125, -0.67181396484375, -0.526123046875, -0.38043212890625, -0.2347412109375, -0.08905029296875, 0.056640625, 0.20233154296875, 0.3480224609375, 0.49371337890625, 0.639404296875, 0.78509521484375, 0.9307861328125, 1.07647705078125, 1.22216796875, 1.36785888671875, 1.5135498046875, 1.65924072265625, 1.804931640625, 1.95062255859375, 2.0963134765625, 2.24200439453125, 2.3876953125, 2.53338623046875, 2.6790771484375, 2.82476806640625, 2.970458984375, 3.11614990234375, 3.2618408203125, 3.40753173828125, 3.55322265625, 3.69891357421875, 3.8446044921875, 3.99029541015625, 4.135986328125, 4.28167724609375, 4.4273681640625, 4.57305908203125, 4.71875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 8.0, 7.0, 5.0, 13.0, 12.0, 25.0, 30.0, 36.0, 57.0, 61.0, 85.0, 144.0, 188.0, 82.0, 54.0, 45.0, 42.0, 19.0, 21.0, 9.0, 13.0, 8.0, 9.0, 7.0, 4.0, 1.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98095703125, -0.9494552612304688, -0.9179534912109375, -0.8864517211914062, -0.854949951171875, -0.8234481811523438, -0.7919464111328125, -0.7604446411132812, -0.72894287109375, -0.6974411010742188, -0.6659393310546875, -0.6344375610351562, -0.602935791015625, -0.5714340209960938, -0.5399322509765625, -0.5084304809570312, -0.4769287109375, -0.44542694091796875, -0.4139251708984375, -0.38242340087890625, -0.350921630859375, -0.31941986083984375, -0.2879180908203125, -0.25641632080078125, -0.22491455078125, -0.19341278076171875, -0.1619110107421875, -0.13040924072265625, -0.098907470703125, -0.06740570068359375, -0.0359039306640625, -0.00440216064453125, 0.027099609375, 0.05860137939453125, 0.0901031494140625, 0.12160491943359375, 0.153106689453125, 0.18460845947265625, 0.2161102294921875, 0.24761199951171875, 0.27911376953125, 0.31061553955078125, 0.3421173095703125, 0.37361907958984375, 0.405120849609375, 0.43662261962890625, 0.4681243896484375, 0.49962615966796875, 0.5311279296875, 0.5626296997070312, 0.5941314697265625, 0.6256332397460938, 0.657135009765625, 0.6886367797851562, 0.7201385498046875, 0.7516403198242188, 0.78314208984375, 0.8146438598632812, 0.8461456298828125, 0.8776473999023438, 0.909149169921875, 0.9406509399414062, 0.9721527099609375, 1.0036544799804688, 1.03515625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 2.0, 5.0, 6.0, 8.0, 9.0, 12.0, 11.0, 25.0, 19.0, 49.0, 58.0, 98.0, 199.0, 1046968.0, 618.0, 159.0, 95.0, 56.0, 40.0, 31.0, 26.0, 12.0, 13.0, 4.0, 6.0, 12.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.3125, -33.26611328125, -32.2197265625, -31.17333984375, -30.126953125, -29.08056640625, -28.0341796875, -26.98779296875, -25.94140625, -24.89501953125, -23.8486328125, -22.80224609375, -21.755859375, -20.70947265625, -19.6630859375, -18.61669921875, -17.5703125, -16.52392578125, -15.4775390625, -14.43115234375, -13.384765625, -12.33837890625, -11.2919921875, -10.24560546875, -9.19921875, -8.15283203125, -7.1064453125, -6.06005859375, -5.013671875, -3.96728515625, -2.9208984375, -1.87451171875, -0.828125, 0.21826171875, 1.2646484375, 2.31103515625, 3.357421875, 4.40380859375, 5.4501953125, 6.49658203125, 7.54296875, 8.58935546875, 9.6357421875, 10.68212890625, 11.728515625, 12.77490234375, 13.8212890625, 14.86767578125, 15.9140625, 16.96044921875, 18.0068359375, 19.05322265625, 20.099609375, 21.14599609375, 22.1923828125, 23.23876953125, 24.28515625, 25.33154296875, 26.3779296875, 27.42431640625, 28.470703125, 29.51708984375, 30.5634765625, 31.60986328125, 32.65625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 1015.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7138117551803589, -0.24255841970443726, 0.22869491577148438, 0.6999481916427612, 1.1712015867233276, 1.642454981803894, 2.113708019256592, 2.584961414337158, 3.0562148094177246, 3.527468204498291, 3.9987215995788574, 4.469974517822266, 4.941227912902832, 5.412481307983398, 5.883734703063965, 6.354988098144531, 6.826241493225098, 7.297494888305664, 7.7687482833862305, 8.240001678466797, 8.711255073547363, 9.18250846862793, 9.65376091003418, 10.125015258789062, 10.596268653869629, 11.067522048950195, 11.538775444030762, 12.010028839111328, 12.481282234191895, 12.952535629272461, 13.423788070678711, 13.895042419433594, 14.366294860839844, 14.83754825592041, 15.308801651000977, 15.780055046081543, 16.25130844116211, 16.72256088256836, 17.193815231323242, 17.665067672729492, 18.136322021484375, 18.607574462890625, 19.078828811645508, 19.550081253051758, 20.02133560180664, 20.49258804321289, 20.963842391967773, 21.435094833374023, 21.906349182128906, 22.377601623535156, 22.84885597229004, 23.32010841369629, 23.791362762451172, 24.262615203857422, 24.733869552612305, 25.205121994018555, 25.676374435424805, 26.147626876831055, 26.618881225585938, 27.090133666992188, 27.56138801574707, 28.03264045715332, 28.503894805908203, 28.975147247314453, 29.446401596069336]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 9.0, 8.0, 7.0, 10.0, 19.0, 10.0, 17.0, 26.0, 19.0, 27.0, 30.0, 28.0, 39.0, 26.0, 33.0, 25.0, 46.0, 36.0, 51.0, 37.0, 39.0, 38.0, 39.0, 30.0, 31.0, 30.0, 40.0, 34.0, 29.0, 35.0, 24.0, 20.0, 16.0, 11.0, 5.0, 11.0, 20.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0322227478027344, -1.9668182134628296, -1.9014136791229248, -1.8360092639923096, -1.7706047296524048, -1.7052001953125, -1.6397957801818848, -1.57439124584198, -1.5089867115020752, -1.4435821771621704, -1.3781776428222656, -1.3127732276916504, -1.2473686933517456, -1.1819641590118408, -1.1165597438812256, -1.0511552095413208, -0.985750675201416, -0.9203461408615112, -0.8549416661262512, -0.7895371913909912, -0.7241326570510864, -0.6587281227111816, -0.5933236479759216, -0.5279191732406616, -0.46251463890075684, -0.39711013436317444, -0.33170562982559204, -0.26630112528800964, -0.20089662075042725, -0.13549211621284485, -0.07008761167526245, -0.004683107137680054, 0.060721397399902344, 0.12612590193748474, 0.19153040647506714, 0.25693491101264954, 0.32233941555023193, 0.38774392008781433, 0.45314842462539673, 0.5185528993606567, 0.5839574337005615, 0.6493619680404663, 0.7147664427757263, 0.7801709175109863, 0.8455754518508911, 0.9109799861907959, 0.9763844609260559, 1.041788935661316, 1.1071934700012207, 1.1725980043411255, 1.2380025386810303, 1.3034069538116455, 1.3688114881515503, 1.434216022491455, 1.4996204376220703, 1.565024971961975, 1.6304295063018799, 1.6958340406417847, 1.7612385749816895, 1.8266429901123047, 1.8920475244522095, 1.9574520587921143, 2.0228564739227295, 2.088261127471924, 2.153665542602539]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 12.0, 18.0, 11.0, 11.0, 10.0, 14.0, 30.0, 25.0, 20.0, 37.0, 39.0, 43.0, 47.0, 48.0, 46.0, 47.0, 43.0, 54.0, 49.0, 42.0, 48.0, 40.0, 36.0, 29.0, 32.0, 19.0, 21.0, 23.0, 12.0, 14.0, 14.0, 15.0, 8.0, 7.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.8125, -44.0888671875, -42.365234375, -40.6416015625, -38.91796875, -37.1943359375, -35.470703125, -33.7470703125, -32.0234375, -30.2998046875, -28.576171875, -26.8525390625, -25.12890625, -23.4052734375, -21.681640625, -19.9580078125, -18.234375, -16.5107421875, -14.787109375, -13.0634765625, -11.33984375, -9.6162109375, -7.892578125, -6.1689453125, -4.4453125, -2.7216796875, -0.998046875, 0.7255859375, 2.44921875, 4.1728515625, 5.896484375, 7.6201171875, 9.34375, 11.0673828125, 12.791015625, 14.5146484375, 16.23828125, 17.9619140625, 19.685546875, 21.4091796875, 23.1328125, 24.8564453125, 26.580078125, 28.3037109375, 30.02734375, 31.7509765625, 33.474609375, 35.1982421875, 36.921875, 38.6455078125, 40.369140625, 42.0927734375, 43.81640625, 45.5400390625, 47.263671875, 48.9873046875, 50.7109375, 52.4345703125, 54.158203125, 55.8818359375, 57.60546875, 59.3291015625, 61.052734375, 62.7763671875, 64.5]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 11.0, 13.0, 28.0, 23.0, 26.0, 44.0, 66.0, 118.0, 166.0, 232.0, 396.0, 590.0, 930.0, 1596.0, 3101.0, 7632.0, 30350.0, 762044.0, 212255.0, 17192.0, 5630.0, 2487.0, 1250.0, 841.0, 491.0, 328.0, 235.0, 149.0, 101.0, 58.0, 43.0, 23.0, 21.0, 13.0, 15.0, 11.0, 13.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-96.0, -92.88671875, -89.7734375, -86.66015625, -83.546875, -80.43359375, -77.3203125, -74.20703125, -71.09375, -67.98046875, -64.8671875, -61.75390625, -58.640625, -55.52734375, -52.4140625, -49.30078125, -46.1875, -43.07421875, -39.9609375, -36.84765625, -33.734375, -30.62109375, -27.5078125, -24.39453125, -21.28125, -18.16796875, -15.0546875, -11.94140625, -8.828125, -5.71484375, -2.6015625, 0.51171875, 3.625, 6.73828125, 9.8515625, 12.96484375, 16.078125, 19.19140625, 22.3046875, 25.41796875, 28.53125, 31.64453125, 34.7578125, 37.87109375, 40.984375, 44.09765625, 47.2109375, 50.32421875, 53.4375, 56.55078125, 59.6640625, 62.77734375, 65.890625, 69.00390625, 72.1171875, 75.23046875, 78.34375, 81.45703125, 84.5703125, 87.68359375, 90.796875, 93.91015625, 97.0234375, 100.13671875, 103.25]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 14.0, 11.0, 16.0, 14.0, 21.0, 24.0, 25.0, 25.0, 35.0, 44.0, 31.0, 60.0, 60.0, 63.0, 115.0, 1808.0, 150.0, 76.0, 68.0, 42.0, 46.0, 58.0, 39.0, 25.0, 29.0, 32.0, 24.0, 15.0, 15.0, 14.0, 10.0, 8.0, 6.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-214.75, -208.88671875, -203.0234375, -197.16015625, -191.296875, -185.43359375, -179.5703125, -173.70703125, -167.84375, -161.98046875, -156.1171875, -150.25390625, -144.390625, -138.52734375, -132.6640625, -126.80078125, -120.9375, -115.07421875, -109.2109375, -103.34765625, -97.484375, -91.62109375, -85.7578125, -79.89453125, -74.03125, -68.16796875, -62.3046875, -56.44140625, -50.578125, -44.71484375, -38.8515625, -32.98828125, -27.125, -21.26171875, -15.3984375, -9.53515625, -3.671875, 2.19140625, 8.0546875, 13.91796875, 19.78125, 25.64453125, 31.5078125, 37.37109375, 43.234375, 49.09765625, 54.9609375, 60.82421875, 66.6875, 72.55078125, 78.4140625, 84.27734375, 90.140625, 96.00390625, 101.8671875, 107.73046875, 113.59375, 119.45703125, 125.3203125, 131.18359375, 137.046875, 142.91015625, 148.7734375, 154.63671875, 160.5]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 1.0, 6.0, 6.0, 8.0, 15.0, 17.0, 21.0, 23.0, 32.0, 42.0, 70.0, 110.0, 178.0, 293.0, 651.0, 1800.0, 7665.0, 173711.0, 2942835.0, 13852.0, 2559.0, 857.0, 373.0, 194.0, 121.0, 69.0, 48.0, 34.0, 28.0, 22.0, 21.0, 17.0, 10.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-390.5, -376.1171875, -361.734375, -347.3515625, -332.96875, -318.5859375, -304.203125, -289.8203125, -275.4375, -261.0546875, -246.671875, -232.2890625, -217.90625, -203.5234375, -189.140625, -174.7578125, -160.375, -145.9921875, -131.609375, -117.2265625, -102.84375, -88.4609375, -74.078125, -59.6953125, -45.3125, -30.9296875, -16.546875, -2.1640625, 12.21875, 26.6015625, 40.984375, 55.3671875, 69.75, 84.1328125, 98.515625, 112.8984375, 127.28125, 141.6640625, 156.046875, 170.4296875, 184.8125, 199.1953125, 213.578125, 227.9609375, 242.34375, 256.7265625, 271.109375, 285.4921875, 299.875, 314.2578125, 328.640625, 343.0234375, 357.40625, 371.7890625, 386.171875, 400.5546875, 414.9375, 429.3203125, 443.703125, 458.0859375, 472.46875, 486.8515625, 501.234375, 515.6171875, 530.0]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 926.0, 83.0, 1.0], "bins": [-10219.6171875, -10053.9287109375, -9888.2392578125, -9722.55078125, -9556.8623046875, -9391.1728515625, -9225.484375, -9059.794921875, -8894.1064453125, -8728.41796875, -8562.728515625, -8397.0400390625, -8231.3515625, -8065.662109375, -7899.9736328125, -7734.28466796875, -7568.595703125, -7402.90673828125, -7237.21826171875, -7071.529296875, -6905.84033203125, -6740.1513671875, -6574.462890625, -6408.77392578125, -6243.08544921875, -6077.396484375, -5911.7080078125, -5746.01904296875, -5580.330078125, -5414.64111328125, -5248.95263671875, -5083.263671875, -4917.5751953125, -4751.88623046875, -4586.19775390625, -4420.5087890625, -4254.81982421875, -4089.131103515625, -3923.4423828125, -3757.75341796875, -3592.064453125, -3426.375732421875, -3260.686767578125, -3094.998046875, -2929.30908203125, -2763.620361328125, -2597.931640625, -2432.24267578125, -2266.553955078125, -2100.865234375, -1935.17626953125, -1769.487548828125, -1603.798583984375, -1438.10986328125, -1272.4210205078125, -1106.732177734375, -941.0432739257812, -775.3544311523438, -609.6656494140625, -443.976806640625, -278.2879638671875, -112.59912109375, 53.08966064453125, 218.77850341796875, 384.46734619140625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 4.0, 9.0, 11.0, 13.0, 13.0, 16.0, 15.0, 20.0, 19.0, 18.0, 31.0, 25.0, 37.0, 38.0, 31.0, 45.0, 26.0, 49.0, 44.0, 45.0, 35.0, 31.0, 41.0, 34.0, 42.0, 32.0, 42.0, 24.0, 28.0, 25.0, 25.0, 20.0, 22.0, 16.0, 15.0, 12.0, 13.0, 4.0, 6.0, 5.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-561.266845703125, -545.1923217773438, -529.1177978515625, -513.0432739257812, -496.9687194824219, -480.8941955566406, -464.8196716308594, -448.7451477050781, -432.67059326171875, -416.5960693359375, -400.52154541015625, -384.447021484375, -368.3724670410156, -352.2979431152344, -336.2234191894531, -320.1488952636719, -304.0743713378906, -287.9998474121094, -271.9253234863281, -255.8507843017578, -239.7762451171875, -223.70172119140625, -207.627197265625, -191.55267333984375, -175.47813415527344, -159.4036102294922, -143.32907104492188, -127.25454711914062, -111.18001556396484, -95.10548400878906, -79.03096008300781, -62.95642852783203, -46.881927490234375, -30.807397842407227, -14.732868194580078, 1.3416595458984375, 17.41619110107422, 33.49072265625, 49.56524658203125, 65.63977813720703, 81.71430969238281, 97.7888412475586, 113.86337280273438, 129.93789672851562, 146.01242065429688, 162.0869598388672, 178.16148376464844, 194.23602294921875, 210.310546875, 226.38507080078125, 242.45960998535156, 258.53411865234375, 274.6086730957031, 290.6831970214844, 306.7577209472656, 322.8322448730469, 338.90679931640625, 354.9813232421875, 371.05584716796875, 387.13037109375, 403.2049255371094, 419.2794494628906, 435.3539733886719, 451.4284973144531, 467.5030212402344]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 9.0, 4.0, 11.0, 10.0, 10.0, 13.0, 15.0, 14.0, 26.0, 25.0, 26.0, 31.0, 37.0, 45.0, 47.0, 45.0, 54.0, 53.0, 46.0, 43.0, 51.0, 41.0, 45.0, 31.0, 40.0, 34.0, 31.0, 23.0, 25.0, 14.0, 13.0, 16.0, 18.0, 11.0, 7.0, 3.0, 12.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.71875, -48.875, -47.03125, -45.1875, -43.34375, -41.5, -39.65625, -37.8125, -35.96875, -34.125, -32.28125, -30.4375, -28.59375, -26.75, -24.90625, -23.0625, -21.21875, -19.375, -17.53125, -15.6875, -13.84375, -12.0, -10.15625, -8.3125, -6.46875, -4.625, -2.78125, -0.9375, 0.90625, 2.75, 4.59375, 6.4375, 8.28125, 10.125, 11.96875, 13.8125, 15.65625, 17.5, 19.34375, 21.1875, 23.03125, 24.875, 26.71875, 28.5625, 30.40625, 32.25, 34.09375, 35.9375, 37.78125, 39.625, 41.46875, 43.3125, 45.15625, 47.0, 48.84375, 50.6875, 52.53125, 54.375, 56.21875, 58.0625, 59.90625, 61.75, 63.59375, 65.4375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 13.0, 13.0, 23.0, 22.0, 41.0, 40.0, 47.0, 51.0, 84.0, 131.0, 256.0, 446.0, 799.0, 1409.0, 2968.0, 6583.0, 18766.0, 162901.0, 3649898.0, 311209.0, 23042.0, 8152.0, 3569.0, 1651.0, 860.0, 459.0, 256.0, 155.0, 110.0, 77.0, 62.0, 39.0, 43.0, 27.0, 16.0, 17.0, 7.0, 7.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.0, -168.119140625, -162.23828125, -156.357421875, -150.4765625, -144.595703125, -138.71484375, -132.833984375, -126.953125, -121.072265625, -115.19140625, -109.310546875, -103.4296875, -97.548828125, -91.66796875, -85.787109375, -79.90625, -74.025390625, -68.14453125, -62.263671875, -56.3828125, -50.501953125, -44.62109375, -38.740234375, -32.859375, -26.978515625, -21.09765625, -15.216796875, -9.3359375, -3.455078125, 2.42578125, 8.306640625, 14.1875, 20.068359375, 25.94921875, 31.830078125, 37.7109375, 43.591796875, 49.47265625, 55.353515625, 61.234375, 67.115234375, 72.99609375, 78.876953125, 84.7578125, 90.638671875, 96.51953125, 102.400390625, 108.28125, 114.162109375, 120.04296875, 125.923828125, 131.8046875, 137.685546875, 143.56640625, 149.447265625, 155.328125, 161.208984375, 167.08984375, 172.970703125, 178.8515625, 184.732421875, 190.61328125, 196.494140625, 202.375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 8.0, 9.0, 14.0, 21.0, 22.0, 25.0, 42.0, 73.0, 97.0, 201.0, 384.0, 993.0, 1115.0, 511.0, 225.0, 124.0, 72.0, 34.0, 24.0, 25.0, 14.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-172.25, -167.048828125, -161.84765625, -156.646484375, -151.4453125, -146.244140625, -141.04296875, -135.841796875, -130.640625, -125.439453125, -120.23828125, -115.037109375, -109.8359375, -104.634765625, -99.43359375, -94.232421875, -89.03125, -83.830078125, -78.62890625, -73.427734375, -68.2265625, -63.025390625, -57.82421875, -52.623046875, -47.421875, -42.220703125, -37.01953125, -31.818359375, -26.6171875, -21.416015625, -16.21484375, -11.013671875, -5.8125, -0.611328125, 4.58984375, 9.791015625, 14.9921875, 20.193359375, 25.39453125, 30.595703125, 35.796875, 40.998046875, 46.19921875, 51.400390625, 56.6015625, 61.802734375, 67.00390625, 72.205078125, 77.40625, 82.607421875, 87.80859375, 93.009765625, 98.2109375, 103.412109375, 108.61328125, 113.814453125, 119.015625, 124.216796875, 129.41796875, 134.619140625, 139.8203125, 145.021484375, 150.22265625, 155.423828125, 160.625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 13.0, 10.0, 11.0, 13.0, 22.0, 25.0, 48.0, 60.0, 95.0, 118.0, 204.0, 338.0, 659.0, 1305.0, 3613.0, 12240.0, 75915.0, 3881795.0, 189803.0, 19416.0, 4908.0, 1661.0, 752.0, 405.0, 254.0, 164.0, 99.0, 82.0, 57.0, 49.0, 40.0, 15.0, 12.0, 18.0, 15.0, 8.0, 5.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-378.0, -366.05859375, -354.1171875, -342.17578125, -330.234375, -318.29296875, -306.3515625, -294.41015625, -282.46875, -270.52734375, -258.5859375, -246.64453125, -234.703125, -222.76171875, -210.8203125, -198.87890625, -186.9375, -174.99609375, -163.0546875, -151.11328125, -139.171875, -127.23046875, -115.2890625, -103.34765625, -91.40625, -79.46484375, -67.5234375, -55.58203125, -43.640625, -31.69921875, -19.7578125, -7.81640625, 4.125, 16.06640625, 28.0078125, 39.94921875, 51.890625, 63.83203125, 75.7734375, 87.71484375, 99.65625, 111.59765625, 123.5390625, 135.48046875, 147.421875, 159.36328125, 171.3046875, 183.24609375, 195.1875, 207.12890625, 219.0703125, 231.01171875, 242.953125, 254.89453125, 266.8359375, 278.77734375, 290.71875, 302.66015625, 314.6015625, 326.54296875, 338.484375, 350.42578125, 362.3671875, 374.30859375, 386.25]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 10.0, 11.0, 17.0, 21.0, 48.0, 84.0, 145.0, 225.0, 209.0, 97.0, 58.0, 26.0, 28.0, 13.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-889.161376953125, -860.4528198242188, -831.7442626953125, -803.03564453125, -774.3270874023438, -745.6185302734375, -716.9099731445312, -688.201416015625, -659.4927978515625, -630.7842407226562, -602.07568359375, -573.3670654296875, -544.6585083007812, -515.949951171875, -487.24139404296875, -458.5328369140625, -429.82427978515625, -401.11572265625, -372.4071350097656, -343.6985778808594, -314.989990234375, -286.28143310546875, -257.5728759765625, -228.8643035888672, -200.15573120117188, -171.44715881347656, -142.73858642578125, -114.030029296875, -85.32145690917969, -56.612884521484375, -27.904327392578125, 0.8042449951171875, 29.51275634765625, 58.2213249206543, 86.92989349365234, 115.63845825195312, 144.34703063964844, 173.05560302734375, 201.76416015625, 230.4727325439453, 259.1813049316406, 287.8898620605469, 316.59844970703125, 345.3070068359375, 374.01556396484375, 402.7241516113281, 431.4327087402344, 460.14129638671875, 488.849853515625, 517.5584106445312, 546.2669677734375, 574.9755859375, 603.6841430664062, 632.3927001953125, 661.1012573242188, 689.809814453125, 718.5184326171875, 747.2269897460938, 775.935546875, 804.6441650390625, 833.3527221679688, 862.061279296875, 890.7698364257812, 919.4783935546875, 948.1869506835938]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 9.0, 8.0, 6.0, 7.0, 16.0, 14.0, 16.0, 19.0, 23.0, 13.0, 28.0, 28.0, 35.0, 43.0, 47.0, 40.0, 32.0, 39.0, 45.0, 38.0, 48.0, 44.0, 40.0, 47.0, 33.0, 39.0, 34.0, 33.0, 26.0, 23.0, 26.0, 20.0, 16.0, 13.0, 17.0, 11.0, 4.0, 8.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-343.57000732421875, -331.92864990234375, -320.2873229980469, -308.6459655761719, -297.0046081542969, -285.3632507324219, -273.721923828125, -262.08056640625, -250.439208984375, -238.79786682128906, -227.15650939941406, -215.51516723632812, -203.87380981445312, -192.2324676513672, -180.59112548828125, -168.94976806640625, -157.3084259033203, -145.66708374023438, -134.02572631835938, -122.38438415527344, -110.74302673339844, -99.1016845703125, -87.46033477783203, -75.81898498535156, -64.1776351928711, -52.536285400390625, -40.894935607910156, -29.253589630126953, -17.612239837646484, -5.970890045166016, 5.6704559326171875, 17.311805725097656, 28.953155517578125, 40.594505310058594, 52.23585510253906, 63.877201080322266, 75.5185546875, 87.15989685058594, 98.8012466430664, 110.44259643554688, 122.08394622802734, 133.7252960205078, 145.36663818359375, 157.00799560546875, 168.6493377685547, 180.2906951904297, 191.93203735351562, 203.57339477539062, 215.21473693847656, 226.8560791015625, 238.4974365234375, 250.13877868652344, 261.7801208496094, 273.4214782714844, 285.0628356933594, 296.70416259765625, 308.34552001953125, 319.98687744140625, 331.6282043457031, 343.2695617675781, 354.9109191894531, 366.5522766113281, 378.193603515625, 389.8349609375, 401.476318359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 7.0, 6.0, 12.0, 7.0, 14.0, 15.0, 21.0, 26.0, 17.0, 32.0, 26.0, 45.0, 35.0, 46.0, 34.0, 30.0, 54.0, 56.0, 39.0, 51.0, 38.0, 51.0, 41.0, 27.0, 40.0, 34.0, 29.0, 19.0, 20.0, 17.0, 18.0, 15.0, 15.0, 8.0, 11.0, 12.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.8125, -50.0302734375, -48.248046875, -46.4658203125, -44.68359375, -42.9013671875, -41.119140625, -39.3369140625, -37.5546875, -35.7724609375, -33.990234375, -32.2080078125, -30.42578125, -28.6435546875, -26.861328125, -25.0791015625, -23.296875, -21.5146484375, -19.732421875, -17.9501953125, -16.16796875, -14.3857421875, -12.603515625, -10.8212890625, -9.0390625, -7.2568359375, -5.474609375, -3.6923828125, -1.91015625, -0.1279296875, 1.654296875, 3.4365234375, 5.21875, 7.0009765625, 8.783203125, 10.5654296875, 12.34765625, 14.1298828125, 15.912109375, 17.6943359375, 19.4765625, 21.2587890625, 23.041015625, 24.8232421875, 26.60546875, 28.3876953125, 30.169921875, 31.9521484375, 33.734375, 35.5166015625, 37.298828125, 39.0810546875, 40.86328125, 42.6455078125, 44.427734375, 46.2099609375, 47.9921875, 49.7744140625, 51.556640625, 53.3388671875, 55.12109375, 56.9033203125, 58.685546875, 60.4677734375, 62.25]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 7.0, 19.0, 19.0, 23.0, 28.0, 47.0, 60.0, 87.0, 145.0, 183.0, 210.0, 346.0, 513.0, 743.0, 1141.0, 1869.0, 3227.0, 5603.0, 11050.0, 23022.0, 52237.0, 138704.0, 418007.0, 242274.0, 81129.0, 33514.0, 15529.0, 7929.0, 4255.0, 2298.0, 1418.0, 922.0, 596.0, 410.0, 280.0, 148.0, 165.0, 113.0, 63.0, 61.0, 40.0, 36.0, 22.0, 14.0, 16.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.890625, -10.5579833984375, -10.225341796875, -9.8927001953125, -9.56005859375, -9.2274169921875, -8.894775390625, -8.5621337890625, -8.2294921875, -7.8968505859375, -7.564208984375, -7.2315673828125, -6.89892578125, -6.5662841796875, -6.233642578125, -5.9010009765625, -5.568359375, -5.2357177734375, -4.903076171875, -4.5704345703125, -4.23779296875, -3.9051513671875, -3.572509765625, -3.2398681640625, -2.9072265625, -2.5745849609375, -2.241943359375, -1.9093017578125, -1.57666015625, -1.2440185546875, -0.911376953125, -0.5787353515625, -0.24609375, 0.0865478515625, 0.419189453125, 0.7518310546875, 1.08447265625, 1.4171142578125, 1.749755859375, 2.0823974609375, 2.4150390625, 2.7476806640625, 3.080322265625, 3.4129638671875, 3.74560546875, 4.0782470703125, 4.410888671875, 4.7435302734375, 5.076171875, 5.4088134765625, 5.741455078125, 6.0740966796875, 6.40673828125, 6.7393798828125, 7.072021484375, 7.4046630859375, 7.7373046875, 8.0699462890625, 8.402587890625, 8.7352294921875, 9.06787109375, 9.4005126953125, 9.733154296875, 10.0657958984375, 10.3984375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 6.0, 3.0, 10.0, 4.0, 13.0, 7.0, 17.0, 9.0, 20.0, 24.0, 19.0, 23.0, 17.0, 33.0, 29.0, 35.0, 33.0, 34.0, 23.0, 41.0, 38.0, 51.0, 1064.0, 33.0, 41.0, 45.0, 44.0, 37.0, 31.0, 27.0, 28.0, 27.0, 23.0, 17.0, 15.0, 16.0, 11.0, 16.0, 14.0, 10.0, 7.0, 5.0, 8.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-36.46875, -35.40185546875, -34.3349609375, -33.26806640625, -32.201171875, -31.13427734375, -30.0673828125, -29.00048828125, -27.93359375, -26.86669921875, -25.7998046875, -24.73291015625, -23.666015625, -22.59912109375, -21.5322265625, -20.46533203125, -19.3984375, -18.33154296875, -17.2646484375, -16.19775390625, -15.130859375, -14.06396484375, -12.9970703125, -11.93017578125, -10.86328125, -9.79638671875, -8.7294921875, -7.66259765625, -6.595703125, -5.52880859375, -4.4619140625, -3.39501953125, -2.328125, -1.26123046875, -0.1943359375, 0.87255859375, 1.939453125, 3.00634765625, 4.0732421875, 5.14013671875, 6.20703125, 7.27392578125, 8.3408203125, 9.40771484375, 10.474609375, 11.54150390625, 12.6083984375, 13.67529296875, 14.7421875, 15.80908203125, 16.8759765625, 17.94287109375, 19.009765625, 20.07666015625, 21.1435546875, 22.21044921875, 23.27734375, 24.34423828125, 25.4111328125, 26.47802734375, 27.544921875, 28.61181640625, 29.6787109375, 30.74560546875, 31.8125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 11.0, 7.0, 12.0, 27.0, 34.0, 38.0, 58.0, 82.0, 139.0, 201.0, 370.0, 660.0, 1277.0, 2552.0, 5305.0, 12103.0, 28194.0, 70867.0, 192746.0, 1458954.0, 198393.0, 73072.0, 28645.0, 12245.0, 5580.0, 2574.0, 1273.0, 703.0, 395.0, 218.0, 129.0, 82.0, 50.0, 39.0, 24.0, 24.0, 14.0, 12.0, 4.0, 6.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.50701904296875, -5.3265380859375, -5.14605712890625, -4.965576171875, -4.78509521484375, -4.6046142578125, -4.42413330078125, -4.24365234375, -4.06317138671875, -3.8826904296875, -3.70220947265625, -3.521728515625, -3.34124755859375, -3.1607666015625, -2.98028564453125, -2.7998046875, -2.61932373046875, -2.4388427734375, -2.25836181640625, -2.077880859375, -1.89739990234375, -1.7169189453125, -1.53643798828125, -1.35595703125, -1.17547607421875, -0.9949951171875, -0.81451416015625, -0.634033203125, -0.45355224609375, -0.2730712890625, -0.09259033203125, 0.087890625, 0.26837158203125, 0.4488525390625, 0.62933349609375, 0.809814453125, 0.99029541015625, 1.1707763671875, 1.35125732421875, 1.53173828125, 1.71221923828125, 1.8927001953125, 2.07318115234375, 2.253662109375, 2.43414306640625, 2.6146240234375, 2.79510498046875, 2.9755859375, 3.15606689453125, 3.3365478515625, 3.51702880859375, 3.697509765625, 3.87799072265625, 4.0584716796875, 4.23895263671875, 4.41943359375, 4.59991455078125, 4.7803955078125, 4.96087646484375, 5.141357421875, 5.32183837890625, 5.5023193359375, 5.68280029296875, 5.86328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 10.0, 6.0, 14.0, 12.0, 11.0, 23.0, 17.0, 32.0, 42.0, 54.0, 65.0, 92.0, 99.0, 120.0, 110.0, 65.0, 50.0, 40.0, 28.0, 23.0, 22.0, 12.0, 13.0, 10.0, 3.0, 10.0, 6.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6259765625, -0.609100341796875, -0.59222412109375, -0.575347900390625, -0.5584716796875, -0.541595458984375, -0.52471923828125, -0.507843017578125, -0.490966796875, -0.474090576171875, -0.45721435546875, -0.440338134765625, -0.4234619140625, -0.406585693359375, -0.38970947265625, -0.372833251953125, -0.35595703125, -0.339080810546875, -0.32220458984375, -0.305328369140625, -0.2884521484375, -0.271575927734375, -0.25469970703125, -0.237823486328125, -0.220947265625, -0.204071044921875, -0.18719482421875, -0.170318603515625, -0.1534423828125, -0.136566162109375, -0.11968994140625, -0.102813720703125, -0.0859375, -0.069061279296875, -0.05218505859375, -0.035308837890625, -0.0184326171875, -0.001556396484375, 0.01531982421875, 0.032196044921875, 0.049072265625, 0.065948486328125, 0.08282470703125, 0.099700927734375, 0.1165771484375, 0.133453369140625, 0.15032958984375, 0.167205810546875, 0.18408203125, 0.200958251953125, 0.21783447265625, 0.234710693359375, 0.2515869140625, 0.268463134765625, 0.28533935546875, 0.302215576171875, 0.319091796875, 0.335968017578125, 0.35284423828125, 0.369720458984375, 0.3865966796875, 0.403472900390625, 0.42034912109375, 0.437225341796875, 0.4541015625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 6.0, 9.0, 3.0, 8.0, 10.0, 16.0, 18.0, 25.0, 23.0, 42.0, 66.0, 97.0, 209.0, 1044303.0, 3204.0, 162.0, 97.0, 82.0, 36.0, 36.0, 22.0, 16.0, 13.0, 12.0, 11.0, 5.0, 10.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8671875, -14.3148193359375, -13.762451171875, -13.2100830078125, -12.65771484375, -12.1053466796875, -11.552978515625, -11.0006103515625, -10.4482421875, -9.8958740234375, -9.343505859375, -8.7911376953125, -8.23876953125, -7.6864013671875, -7.134033203125, -6.5816650390625, -6.029296875, -5.4769287109375, -4.924560546875, -4.3721923828125, -3.81982421875, -3.2674560546875, -2.715087890625, -2.1627197265625, -1.6103515625, -1.0579833984375, -0.505615234375, 0.0467529296875, 0.59912109375, 1.1514892578125, 1.703857421875, 2.2562255859375, 2.80859375, 3.3609619140625, 3.913330078125, 4.4656982421875, 5.01806640625, 5.5704345703125, 6.122802734375, 6.6751708984375, 7.2275390625, 7.7799072265625, 8.332275390625, 8.8846435546875, 9.43701171875, 9.9893798828125, 10.541748046875, 11.0941162109375, 11.646484375, 12.1988525390625, 12.751220703125, 13.3035888671875, 13.85595703125, 14.4083251953125, 14.960693359375, 15.5130615234375, 16.0654296875, 16.6177978515625, 17.170166015625, 17.7225341796875, 18.27490234375, 18.8272705078125, 19.379638671875, 19.9320068359375, 20.484375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 51.0, 960.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5375372171401978, -0.37334200739860535, -0.20914679765701294, -0.04495158791542053, 0.11924362182617188, 0.2834388017654419, 0.4476340413093567, 0.6118292808532715, 0.7760244607925415, 0.9402196407318115, 1.104414939880371, 1.2686101198196411, 1.4328052997589111, 1.5970004796981812, 1.7611956596374512, 1.9253909587860107, 2.0895862579345703, 2.25378155708313, 2.4179766178131104, 2.58217191696167, 2.7463669776916504, 2.91056227684021, 3.0747575759887695, 3.23895263671875, 3.4031476974487305, 3.56734299659729, 3.7315380573272705, 3.89573335647583, 4.0599284172058105, 4.224123954772949, 4.38831901550293, 4.55251407623291, 4.716709136962891, 4.880904197692871, 5.04509973526001, 5.20929479598999, 5.373489856719971, 5.537685394287109, 5.70188045501709, 5.86607551574707, 6.030270576477051, 6.194465637207031, 6.35866117477417, 6.52285623550415, 6.687051296234131, 6.8512468338012695, 7.01544189453125, 7.1796369552612305, 7.343832492828369, 7.50802755355835, 7.672223091125488, 7.836418151855469, 8.00061321258545, 8.16480827331543, 8.32900333404541, 8.493199348449707, 8.657394409179688, 8.821589469909668, 8.985784530639648, 9.149979591369629, 9.314175605773926, 9.478370666503906, 9.642565727233887, 9.806760787963867, 9.970955848693848]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 10.0, 8.0, 14.0, 16.0, 22.0, 14.0, 26.0, 27.0, 34.0, 34.0, 31.0, 36.0, 33.0, 36.0, 39.0, 39.0, 51.0, 34.0, 43.0, 44.0, 36.0, 31.0, 37.0, 42.0, 27.0, 33.0, 28.0, 23.0, 24.0, 18.0, 20.0, 14.0, 8.0, 7.0, 13.0, 9.0, 2.0, 10.0, 4.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.6692379117012024, -0.6474929451942444, -0.6257479190826416, -0.6040029525756836, -0.5822579264640808, -0.5605129599571228, -0.53876793384552, -0.517022967338562, -0.4952779710292816, -0.4735329747200012, -0.4517879784107208, -0.43004298210144043, -0.4082980155944824, -0.38655298948287964, -0.36480802297592163, -0.34306302666664124, -0.32131803035736084, -0.29957303404808044, -0.27782803773880005, -0.25608307123184204, -0.23433806002140045, -0.21259306371212006, -0.19084808230400085, -0.16910308599472046, -0.14735808968544006, -0.12561309337615967, -0.10386810451745987, -0.08212311565876007, -0.060378119349479675, -0.03863312304019928, -0.016888141632080078, 0.004856854677200317, 0.026601791381835938, 0.048346783965826035, 0.07009177654981613, 0.09183676540851593, 0.11358176171779633, 0.13532675802707672, 0.15707173943519592, 0.17881673574447632, 0.2005617320537567, 0.2223067283630371, 0.2440517246723175, 0.2657967209815979, 0.2875416874885559, 0.3092867136001587, 0.3310316801071167, 0.3527766764163971, 0.3745216727256775, 0.3962666690349579, 0.4180116653442383, 0.4397566318511963, 0.4615016579627991, 0.4832466244697571, 0.5049916505813599, 0.5267366170883179, 0.5484815835952759, 0.5702265501022339, 0.5919715762138367, 0.6137165427207947, 0.6354615688323975, 0.6572065353393555, 0.6789515018463135, 0.7006965279579163, 0.722441554069519]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 7.0, 6.0, 12.0, 6.0, 14.0, 16.0, 21.0, 26.0, 17.0, 32.0, 26.0, 44.0, 36.0, 46.0, 34.0, 30.0, 54.0, 55.0, 40.0, 51.0, 38.0, 50.0, 42.0, 28.0, 39.0, 34.0, 29.0, 20.0, 19.0, 17.0, 18.0, 14.0, 16.0, 8.0, 11.0, 12.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.8125, -50.0302734375, -48.248046875, -46.4658203125, -44.68359375, -42.9013671875, -41.119140625, -39.3369140625, -37.5546875, -35.7724609375, -33.990234375, -32.2080078125, -30.42578125, -28.6435546875, -26.861328125, -25.0791015625, -23.296875, -21.5146484375, -19.732421875, -17.9501953125, -16.16796875, -14.3857421875, -12.603515625, -10.8212890625, -9.0390625, -7.2568359375, -5.474609375, -3.6923828125, -1.91015625, -0.1279296875, 1.654296875, 3.4365234375, 5.21875, 7.0009765625, 8.783203125, 10.5654296875, 12.34765625, 14.1298828125, 15.912109375, 17.6943359375, 19.4765625, 21.2587890625, 23.041015625, 24.8232421875, 26.60546875, 28.3876953125, 30.169921875, 31.9521484375, 33.734375, 35.5166015625, 37.298828125, 39.0810546875, 40.86328125, 42.6455078125, 44.427734375, 46.2099609375, 47.9921875, 49.7744140625, 51.556640625, 53.3388671875, 55.12109375, 56.9033203125, 58.685546875, 60.4677734375, 62.25]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 25.0, 24.0, 26.0, 46.0, 40.0, 93.0, 132.0, 191.0, 275.0, 395.0, 584.0, 898.0, 1467.0, 2387.0, 3939.0, 6927.0, 14675.0, 66619.0, 870562.0, 49299.0, 13437.0, 6656.0, 3616.0, 2136.0, 1364.0, 884.0, 591.0, 437.0, 246.0, 178.0, 89.0, 72.0, 57.0, 42.0, 38.0, 24.0, 17.0, 11.0, 9.0, 10.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0], "bins": [-119.4375, -116.16015625, -112.8828125, -109.60546875, -106.328125, -103.05078125, -99.7734375, -96.49609375, -93.21875, -89.94140625, -86.6640625, -83.38671875, -80.109375, -76.83203125, -73.5546875, -70.27734375, -67.0, -63.72265625, -60.4453125, -57.16796875, -53.890625, -50.61328125, -47.3359375, -44.05859375, -40.78125, -37.50390625, -34.2265625, -30.94921875, -27.671875, -24.39453125, -21.1171875, -17.83984375, -14.5625, -11.28515625, -8.0078125, -4.73046875, -1.453125, 1.82421875, 5.1015625, 8.37890625, 11.65625, 14.93359375, 18.2109375, 21.48828125, 24.765625, 28.04296875, 31.3203125, 34.59765625, 37.875, 41.15234375, 44.4296875, 47.70703125, 50.984375, 54.26171875, 57.5390625, 60.81640625, 64.09375, 67.37109375, 70.6484375, 73.92578125, 77.203125, 80.48046875, 83.7578125, 87.03515625, 90.3125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 5.0, 10.0, 9.0, 8.0, 9.0, 19.0, 23.0, 27.0, 24.0, 28.0, 28.0, 38.0, 41.0, 53.0, 44.0, 68.0, 80.0, 319.0, 1679.0, 76.0, 66.0, 60.0, 51.0, 48.0, 35.0, 24.0, 25.0, 30.0, 36.0, 23.0, 21.0, 10.0, 11.0, 8.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-241.625, -235.27734375, -228.9296875, -222.58203125, -216.234375, -209.88671875, -203.5390625, -197.19140625, -190.84375, -184.49609375, -178.1484375, -171.80078125, -165.453125, -159.10546875, -152.7578125, -146.41015625, -140.0625, -133.71484375, -127.3671875, -121.01953125, -114.671875, -108.32421875, -101.9765625, -95.62890625, -89.28125, -82.93359375, -76.5859375, -70.23828125, -63.890625, -57.54296875, -51.1953125, -44.84765625, -38.5, -32.15234375, -25.8046875, -19.45703125, -13.109375, -6.76171875, -0.4140625, 5.93359375, 12.28125, 18.62890625, 24.9765625, 31.32421875, 37.671875, 44.01953125, 50.3671875, 56.71484375, 63.0625, 69.41015625, 75.7578125, 82.10546875, 88.453125, 94.80078125, 101.1484375, 107.49609375, 113.84375, 120.19140625, 126.5390625, 132.88671875, 139.234375, 145.58203125, 151.9296875, 158.27734375, 164.625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 14.0, 11.0, 19.0, 20.0, 37.0, 77.0, 94.0, 126.0, 222.0, 526.0, 1933.0, 12350.0, 2946461.0, 173575.0, 7797.0, 1427.0, 403.0, 181.0, 128.0, 95.0, 61.0, 31.0, 25.0, 23.0, 18.0, 10.0, 6.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-627.0, -607.9375, -588.875, -569.8125, -550.75, -531.6875, -512.625, -493.5625, -474.5, -455.4375, -436.375, -417.3125, -398.25, -379.1875, -360.125, -341.0625, -322.0, -302.9375, -283.875, -264.8125, -245.75, -226.6875, -207.625, -188.5625, -169.5, -150.4375, -131.375, -112.3125, -93.25, -74.1875, -55.125, -36.0625, -17.0, 2.0625, 21.125, 40.1875, 59.25, 78.3125, 97.375, 116.4375, 135.5, 154.5625, 173.625, 192.6875, 211.75, 230.8125, 249.875, 268.9375, 288.0, 307.0625, 326.125, 345.1875, 364.25, 383.3125, 402.375, 421.4375, 440.5, 459.5625, 478.625, 497.6875, 516.75, 535.8125, 554.875, 573.9375, 593.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 273.0, 712.0, 29.0], "bins": [-6241.05419921875, -6140.65478515625, -6040.25537109375, -5939.85595703125, -5839.45654296875, -5739.05712890625, -5638.65771484375, -5538.25830078125, -5437.85888671875, -5337.45947265625, -5237.06005859375, -5136.66064453125, -5036.26123046875, -4935.86181640625, -4835.46240234375, -4735.06298828125, -4634.66357421875, -4534.26416015625, -4433.86474609375, -4333.46533203125, -4233.06591796875, -4132.66650390625, -4032.26708984375, -3931.86767578125, -3831.46826171875, -3731.06884765625, -3630.66943359375, -3530.27001953125, -3429.87060546875, -3329.47119140625, -3229.07177734375, -3128.67236328125, -3028.272705078125, -2927.873291015625, -2827.473876953125, -2727.074462890625, -2626.675048828125, -2526.275634765625, -2425.876220703125, -2325.476806640625, -2225.077392578125, -2124.677978515625, -2024.278564453125, -1923.879150390625, -1823.479736328125, -1723.080322265625, -1622.680908203125, -1522.281494140625, -1421.882080078125, -1321.482666015625, -1221.083251953125, -1120.683837890625, -1020.284423828125, -919.885009765625, -819.485595703125, -719.086181640625, -618.6868286132812, -518.2874145507812, -417.88800048828125, -317.48858642578125, -217.08917236328125, -116.68975830078125, -16.29034423828125, 84.10906982421875, 184.50848388671875]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 11.0, 13.0, 11.0, 17.0, 17.0, 18.0, 24.0, 22.0, 27.0, 29.0, 27.0, 40.0, 41.0, 35.0, 36.0, 35.0, 35.0, 35.0, 35.0, 52.0, 46.0, 37.0, 41.0, 31.0, 40.0, 30.0, 19.0, 26.0, 26.0, 21.0, 17.0, 13.0, 13.0, 9.0, 11.0, 10.0, 4.0, 7.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0], "bins": [-521.9562377929688, -507.3730163574219, -492.7898254394531, -478.20660400390625, -463.6233825683594, -449.0401611328125, -434.45697021484375, -419.8737487792969, -405.29052734375, -390.7073059082031, -376.1241149902344, -361.5408935546875, -346.9576721191406, -332.37445068359375, -317.791259765625, -303.2080383300781, -288.62481689453125, -274.0415954589844, -259.4584045410156, -244.87518310546875, -230.29196166992188, -215.70875549316406, -201.12554931640625, -186.54232788085938, -171.95913696289062, -157.3759307861328, -142.79270935058594, -128.20950317382812, -113.62628173828125, -99.04307556152344, -84.4598617553711, -69.87664794921875, -55.293426513671875, -40.71021270751953, -26.12700080871582, -11.54378890991211, 3.0394248962402344, 17.622634887695312, 32.205848693847656, 46.7890625, 61.372276306152344, 75.95549011230469, 90.53870391845703, 105.12191772460938, 119.70512390136719, 134.288330078125, 148.87155151367188, 163.45477294921875, 178.03797912597656, 192.62118530273438, 207.20440673828125, 221.78761291503906, 236.37083435058594, 250.95404052734375, 265.5372619628906, 280.1204833984375, 294.70367431640625, 309.2868957519531, 323.8700866699219, 338.45330810546875, 353.0365295410156, 367.6197509765625, 382.20294189453125, 396.7861633300781, 411.369384765625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 7.0, 7.0, 5.0, 9.0, 8.0, 14.0, 12.0, 19.0, 30.0, 28.0, 29.0, 31.0, 31.0, 38.0, 34.0, 43.0, 42.0, 55.0, 40.0, 44.0, 55.0, 45.0, 45.0, 43.0, 41.0, 30.0, 27.0, 27.0, 21.0, 23.0, 19.0, 16.0, 16.0, 15.0, 7.0, 10.0, 7.0, 4.0, 5.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.1875, -60.24755859375, -58.3076171875, -56.36767578125, -54.427734375, -52.48779296875, -50.5478515625, -48.60791015625, -46.66796875, -44.72802734375, -42.7880859375, -40.84814453125, -38.908203125, -36.96826171875, -35.0283203125, -33.08837890625, -31.1484375, -29.20849609375, -27.2685546875, -25.32861328125, -23.388671875, -21.44873046875, -19.5087890625, -17.56884765625, -15.62890625, -13.68896484375, -11.7490234375, -9.80908203125, -7.869140625, -5.92919921875, -3.9892578125, -2.04931640625, -0.109375, 1.83056640625, 3.7705078125, 5.71044921875, 7.650390625, 9.59033203125, 11.5302734375, 13.47021484375, 15.41015625, 17.35009765625, 19.2900390625, 21.22998046875, 23.169921875, 25.10986328125, 27.0498046875, 28.98974609375, 30.9296875, 32.86962890625, 34.8095703125, 36.74951171875, 38.689453125, 40.62939453125, 42.5693359375, 44.50927734375, 46.44921875, 48.38916015625, 50.3291015625, 52.26904296875, 54.208984375, 56.14892578125, 58.0888671875, 60.02880859375, 61.96875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 6.0, 13.0, 11.0, 21.0, 40.0, 63.0, 102.0, 129.0, 161.0, 207.0, 281.0, 388.0, 586.0, 988.0, 1637.0, 2738.0, 5034.0, 11042.0, 36254.0, 499846.0, 3310410.0, 275397.0, 28174.0, 9392.0, 4478.0, 2358.0, 1469.0, 976.0, 644.0, 412.0, 283.0, 161.0, 124.0, 113.0, 75.0, 81.0, 67.0, 35.0, 26.0, 18.0, 6.0, 10.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-137.125, -132.615234375, -128.10546875, -123.595703125, -119.0859375, -114.576171875, -110.06640625, -105.556640625, -101.046875, -96.537109375, -92.02734375, -87.517578125, -83.0078125, -78.498046875, -73.98828125, -69.478515625, -64.96875, -60.458984375, -55.94921875, -51.439453125, -46.9296875, -42.419921875, -37.91015625, -33.400390625, -28.890625, -24.380859375, -19.87109375, -15.361328125, -10.8515625, -6.341796875, -1.83203125, 2.677734375, 7.1875, 11.697265625, 16.20703125, 20.716796875, 25.2265625, 29.736328125, 34.24609375, 38.755859375, 43.265625, 47.775390625, 52.28515625, 56.794921875, 61.3046875, 65.814453125, 70.32421875, 74.833984375, 79.34375, 83.853515625, 88.36328125, 92.873046875, 97.3828125, 101.892578125, 106.40234375, 110.912109375, 115.421875, 119.931640625, 124.44140625, 128.951171875, 133.4609375, 137.970703125, 142.48046875, 146.990234375, 151.5]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 5.0, 4.0, 6.0, 15.0, 13.0, 15.0, 17.0, 26.0, 36.0, 50.0, 58.0, 108.0, 156.0, 286.0, 582.0, 941.0, 762.0, 399.0, 200.0, 125.0, 73.0, 60.0, 31.0, 27.0, 11.0, 7.0, 5.0, 13.0, 6.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-145.5, -141.5380859375, -137.576171875, -133.6142578125, -129.65234375, -125.6904296875, -121.728515625, -117.7666015625, -113.8046875, -109.8427734375, -105.880859375, -101.9189453125, -97.95703125, -93.9951171875, -90.033203125, -86.0712890625, -82.109375, -78.1474609375, -74.185546875, -70.2236328125, -66.26171875, -62.2998046875, -58.337890625, -54.3759765625, -50.4140625, -46.4521484375, -42.490234375, -38.5283203125, -34.56640625, -30.6044921875, -26.642578125, -22.6806640625, -18.71875, -14.7568359375, -10.794921875, -6.8330078125, -2.87109375, 1.0908203125, 5.052734375, 9.0146484375, 12.9765625, 16.9384765625, 20.900390625, 24.8623046875, 28.82421875, 32.7861328125, 36.748046875, 40.7099609375, 44.671875, 48.6337890625, 52.595703125, 56.5576171875, 60.51953125, 64.4814453125, 68.443359375, 72.4052734375, 76.3671875, 80.3291015625, 84.291015625, 88.2529296875, 92.21484375, 96.1767578125, 100.138671875, 104.1005859375, 108.0625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 9.0, 16.0, 14.0, 12.0, 12.0, 19.0, 31.0, 33.0, 45.0, 63.0, 79.0, 116.0, 193.0, 403.0, 1061.0, 3515.0, 15641.0, 134235.0, 3926803.0, 94352.0, 12577.0, 3041.0, 992.0, 353.0, 172.0, 108.0, 99.0, 61.0, 35.0, 51.0, 22.0, 25.0, 23.0, 19.0, 13.0, 14.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-414.0, -401.23828125, -388.4765625, -375.71484375, -362.953125, -350.19140625, -337.4296875, -324.66796875, -311.90625, -299.14453125, -286.3828125, -273.62109375, -260.859375, -248.09765625, -235.3359375, -222.57421875, -209.8125, -197.05078125, -184.2890625, -171.52734375, -158.765625, -146.00390625, -133.2421875, -120.48046875, -107.71875, -94.95703125, -82.1953125, -69.43359375, -56.671875, -43.91015625, -31.1484375, -18.38671875, -5.625, 7.13671875, 19.8984375, 32.66015625, 45.421875, 58.18359375, 70.9453125, 83.70703125, 96.46875, 109.23046875, 121.9921875, 134.75390625, 147.515625, 160.27734375, 173.0390625, 185.80078125, 198.5625, 211.32421875, 224.0859375, 236.84765625, 249.609375, 262.37109375, 275.1328125, 287.89453125, 300.65625, 313.41796875, 326.1796875, 338.94140625, 351.703125, 364.46484375, 377.2265625, 389.98828125, 402.75]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 9.0, 9.0, 7.0, 15.0, 17.0, 27.0, 41.0, 35.0, 54.0, 71.0, 81.0, 103.0, 110.0, 78.0, 85.0, 65.0, 40.0, 42.0, 26.0, 14.0, 13.0, 13.0, 8.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-402.7503967285156, -390.7337951660156, -378.7171936035156, -366.7005920410156, -354.6839904785156, -342.6673889160156, -330.6507873535156, -318.6341857910156, -306.6175842285156, -294.6009826660156, -282.5843811035156, -270.5677795410156, -258.5511779785156, -246.53457641601562, -234.51797485351562, -222.50137329101562, -210.48477172851562, -198.46817016601562, -186.45156860351562, -174.43496704101562, -162.41836547851562, -150.40176391601562, -138.38516235351562, -126.36856079101562, -114.35195922851562, -102.33535766601562, -90.31875610351562, -78.30215454101562, -66.28555297851562, -54.268951416015625, -42.252349853515625, -30.235748291015625, -18.21917724609375, -6.20257568359375, 5.81402587890625, 17.83062744140625, 29.84722900390625, 41.86383056640625, 53.88043212890625, 65.89703369140625, 77.91363525390625, 89.93023681640625, 101.94683837890625, 113.96343994140625, 125.98004150390625, 137.99664306640625, 150.01324462890625, 162.02984619140625, 174.04644775390625, 186.06304931640625, 198.07965087890625, 210.09625244140625, 222.11285400390625, 234.12945556640625, 246.14605712890625, 258.16265869140625, 270.17926025390625, 282.19586181640625, 294.21246337890625, 306.22906494140625, 318.24566650390625, 330.26226806640625, 342.27886962890625, 354.29547119140625, 366.31207275390625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 3.0, 3.0, 5.0, 12.0, 6.0, 12.0, 11.0, 17.0, 16.0, 11.0, 14.0, 25.0, 27.0, 30.0, 31.0, 31.0, 36.0, 27.0, 41.0, 44.0, 39.0, 39.0, 41.0, 41.0, 26.0, 45.0, 31.0, 34.0, 40.0, 38.0, 32.0, 21.0, 16.0, 26.0, 22.0, 15.0, 15.0, 14.0, 16.0, 7.0, 5.0, 4.0, 9.0, 5.0, 8.0, 6.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-283.37322998046875, -274.0124206542969, -264.6515808105469, -255.29075622558594, -245.929931640625, -236.56912231445312, -227.2082977294922, -217.84747314453125, -208.4866485595703, -199.12582397460938, -189.76499938964844, -180.4041748046875, -171.04336547851562, -161.68252563476562, -152.32171630859375, -142.9608917236328, -133.60006713867188, -124.23924255371094, -114.87841796875, -105.5176010131836, -96.15677642822266, -86.79595184326172, -77.43513488769531, -68.07431030273438, -58.71348571777344, -49.3526611328125, -39.99184036254883, -30.631017684936523, -21.27019500732422, -11.909370422363281, -2.5485496520996094, 6.8122711181640625, 16.173095703125, 25.533918380737305, 34.89474105834961, 44.25556182861328, 53.61638641357422, 62.977210998535156, 72.33802795410156, 81.6988525390625, 91.05967712402344, 100.42050170898438, 109.78132629394531, 119.14214324951172, 128.50296020507812, 137.86380004882812, 147.224609375, 156.58543395996094, 165.94625854492188, 175.3070831298828, 184.66790771484375, 194.0287322998047, 203.38955688476562, 212.7503662109375, 222.11119079589844, 231.47201538085938, 240.8328399658203, 250.19366455078125, 259.5544738769531, 268.9153137207031, 278.276123046875, 287.636962890625, 296.9977722167969, 306.35858154296875, 315.71942138671875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 10.0, 9.0, 16.0, 15.0, 24.0, 39.0, 26.0, 34.0, 42.0, 33.0, 47.0, 51.0, 36.0, 49.0, 65.0, 39.0, 47.0, 46.0, 40.0, 42.0, 34.0, 32.0, 37.0, 30.0, 19.0, 24.0, 8.0, 17.0, 9.0, 16.0, 11.0, 4.0, 2.0, 6.0, 1.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-63.96875, -62.00341796875, -60.0380859375, -58.07275390625, -56.107421875, -54.14208984375, -52.1767578125, -50.21142578125, -48.24609375, -46.28076171875, -44.3154296875, -42.35009765625, -40.384765625, -38.41943359375, -36.4541015625, -34.48876953125, -32.5234375, -30.55810546875, -28.5927734375, -26.62744140625, -24.662109375, -22.69677734375, -20.7314453125, -18.76611328125, -16.80078125, -14.83544921875, -12.8701171875, -10.90478515625, -8.939453125, -6.97412109375, -5.0087890625, -3.04345703125, -1.078125, 0.88720703125, 2.8525390625, 4.81787109375, 6.783203125, 8.74853515625, 10.7138671875, 12.67919921875, 14.64453125, 16.60986328125, 18.5751953125, 20.54052734375, 22.505859375, 24.47119140625, 26.4365234375, 28.40185546875, 30.3671875, 32.33251953125, 34.2978515625, 36.26318359375, 38.228515625, 40.19384765625, 42.1591796875, 44.12451171875, 46.08984375, 48.05517578125, 50.0205078125, 51.98583984375, 53.951171875, 55.91650390625, 57.8818359375, 59.84716796875, 61.8125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 6.0, 16.0, 17.0, 49.0, 52.0, 64.0, 136.0, 188.0, 291.0, 501.0, 893.0, 1785.0, 3697.0, 9122.0, 26910.0, 101286.0, 525509.0, 288923.0, 59171.0, 17320.0, 6467.0, 2815.0, 1350.0, 780.0, 439.0, 285.0, 162.0, 135.0, 41.0, 45.0, 32.0, 18.0, 5.0, 11.0, 9.0, 3.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1875, -14.660400390625, -14.13330078125, -13.606201171875, -13.0791015625, -12.552001953125, -12.02490234375, -11.497802734375, -10.970703125, -10.443603515625, -9.91650390625, -9.389404296875, -8.8623046875, -8.335205078125, -7.80810546875, -7.281005859375, -6.75390625, -6.226806640625, -5.69970703125, -5.172607421875, -4.6455078125, -4.118408203125, -3.59130859375, -3.064208984375, -2.537109375, -2.010009765625, -1.48291015625, -0.955810546875, -0.4287109375, 0.098388671875, 0.62548828125, 1.152587890625, 1.6796875, 2.206787109375, 2.73388671875, 3.260986328125, 3.7880859375, 4.315185546875, 4.84228515625, 5.369384765625, 5.896484375, 6.423583984375, 6.95068359375, 7.477783203125, 8.0048828125, 8.531982421875, 9.05908203125, 9.586181640625, 10.11328125, 10.640380859375, 11.16748046875, 11.694580078125, 12.2216796875, 12.748779296875, 13.27587890625, 13.802978515625, 14.330078125, 14.857177734375, 15.38427734375, 15.911376953125, 16.4384765625, 16.965576171875, 17.49267578125, 18.019775390625, 18.546875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 4.0, 12.0, 7.0, 9.0, 12.0, 9.0, 27.0, 21.0, 21.0, 21.0, 26.0, 32.0, 36.0, 48.0, 49.0, 41.0, 48.0, 37.0, 43.0, 1062.0, 34.0, 40.0, 41.0, 39.0, 31.0, 34.0, 26.0, 28.0, 32.0, 27.0, 17.0, 15.0, 12.0, 18.0, 11.0, 10.0, 10.0, 11.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-39.125, -37.92724609375, -36.7294921875, -35.53173828125, -34.333984375, -33.13623046875, -31.9384765625, -30.74072265625, -29.54296875, -28.34521484375, -27.1474609375, -25.94970703125, -24.751953125, -23.55419921875, -22.3564453125, -21.15869140625, -19.9609375, -18.76318359375, -17.5654296875, -16.36767578125, -15.169921875, -13.97216796875, -12.7744140625, -11.57666015625, -10.37890625, -9.18115234375, -7.9833984375, -6.78564453125, -5.587890625, -4.39013671875, -3.1923828125, -1.99462890625, -0.796875, 0.40087890625, 1.5986328125, 2.79638671875, 3.994140625, 5.19189453125, 6.3896484375, 7.58740234375, 8.78515625, 9.98291015625, 11.1806640625, 12.37841796875, 13.576171875, 14.77392578125, 15.9716796875, 17.16943359375, 18.3671875, 19.56494140625, 20.7626953125, 21.96044921875, 23.158203125, 24.35595703125, 25.5537109375, 26.75146484375, 27.94921875, 29.14697265625, 30.3447265625, 31.54248046875, 32.740234375, 33.93798828125, 35.1357421875, 36.33349609375, 37.53125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 13.0, 22.0, 29.0, 40.0, 46.0, 93.0, 136.0, 200.0, 328.0, 520.0, 705.0, 1169.0, 1816.0, 2956.0, 5044.0, 8563.0, 15092.0, 27637.0, 52066.0, 104100.0, 245789.0, 1302335.0, 161205.0, 76882.0, 39446.0, 21632.0, 11871.0, 6801.0, 4006.0, 2358.0, 1472.0, 949.0, 616.0, 399.0, 237.0, 189.0, 120.0, 68.0, 54.0, 38.0, 27.0, 20.0, 11.0, 10.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.775726318359375, -3.65106201171875, -3.526397705078125, -3.4017333984375, -3.277069091796875, -3.15240478515625, -3.027740478515625, -2.903076171875, -2.778411865234375, -2.65374755859375, -2.529083251953125, -2.4044189453125, -2.279754638671875, -2.15509033203125, -2.030426025390625, -1.90576171875, -1.781097412109375, -1.65643310546875, -1.531768798828125, -1.4071044921875, -1.282440185546875, -1.15777587890625, -1.033111572265625, -0.908447265625, -0.783782958984375, -0.65911865234375, -0.534454345703125, -0.4097900390625, -0.285125732421875, -0.16046142578125, -0.035797119140625, 0.0888671875, 0.213531494140625, 0.33819580078125, 0.462860107421875, 0.5875244140625, 0.712188720703125, 0.83685302734375, 0.961517333984375, 1.086181640625, 1.210845947265625, 1.33551025390625, 1.460174560546875, 1.5848388671875, 1.709503173828125, 1.83416748046875, 1.958831787109375, 2.08349609375, 2.208160400390625, 2.33282470703125, 2.457489013671875, 2.5821533203125, 2.706817626953125, 2.83148193359375, 2.956146240234375, 3.080810546875, 3.205474853515625, 3.33013916015625, 3.454803466796875, 3.5794677734375, 3.704132080078125, 3.82879638671875, 3.953460693359375, 4.078125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 3.0, 2.0, 6.0, 1.0, 7.0, 3.0, 5.0, 5.0, 11.0, 5.0, 6.0, 14.0, 19.0, 25.0, 31.0, 33.0, 46.0, 100.0, 191.0, 156.0, 91.0, 46.0, 36.0, 34.0, 26.0, 13.0, 16.0, 8.0, 11.0, 12.0, 8.0, 5.0, 4.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6558990478515625, -0.630645751953125, -0.6053924560546875, -0.58013916015625, -0.5548858642578125, -0.529632568359375, -0.5043792724609375, -0.4791259765625, -0.4538726806640625, -0.428619384765625, -0.4033660888671875, -0.37811279296875, -0.3528594970703125, -0.327606201171875, -0.3023529052734375, -0.277099609375, -0.2518463134765625, -0.226593017578125, -0.2013397216796875, -0.17608642578125, -0.1508331298828125, -0.125579833984375, -0.1003265380859375, -0.0750732421875, -0.0498199462890625, -0.024566650390625, 0.0006866455078125, 0.02593994140625, 0.0511932373046875, 0.076446533203125, 0.1016998291015625, 0.126953125, 0.1522064208984375, 0.177459716796875, 0.2027130126953125, 0.22796630859375, 0.2532196044921875, 0.278472900390625, 0.3037261962890625, 0.3289794921875, 0.3542327880859375, 0.379486083984375, 0.4047393798828125, 0.42999267578125, 0.4552459716796875, 0.480499267578125, 0.5057525634765625, 0.531005859375, 0.5562591552734375, 0.581512451171875, 0.6067657470703125, 0.63201904296875, 0.6572723388671875, 0.682525634765625, 0.7077789306640625, 0.7330322265625, 0.7582855224609375, 0.783538818359375, 0.8087921142578125, 0.83404541015625, 0.8592987060546875, 0.884552001953125, 0.9098052978515625, 0.93505859375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 5.0, 6.0, 5.0, 9.0, 7.0, 16.0, 16.0, 14.0, 34.0, 38.0, 57.0, 83.0, 207.0, 1046555.0, 1065.0, 151.0, 59.0, 52.0, 45.0, 22.0, 20.0, 9.0, 9.0, 5.0, 9.0, 4.0, 4.0, 4.0, 7.0, 1.0, 6.0, 2.0, 4.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-30.265625, -29.44384765625, -28.6220703125, -27.80029296875, -26.978515625, -26.15673828125, -25.3349609375, -24.51318359375, -23.69140625, -22.86962890625, -22.0478515625, -21.22607421875, -20.404296875, -19.58251953125, -18.7607421875, -17.93896484375, -17.1171875, -16.29541015625, -15.4736328125, -14.65185546875, -13.830078125, -13.00830078125, -12.1865234375, -11.36474609375, -10.54296875, -9.72119140625, -8.8994140625, -8.07763671875, -7.255859375, -6.43408203125, -5.6123046875, -4.79052734375, -3.96875, -3.14697265625, -2.3251953125, -1.50341796875, -0.681640625, 0.14013671875, 0.9619140625, 1.78369140625, 2.60546875, 3.42724609375, 4.2490234375, 5.07080078125, 5.892578125, 6.71435546875, 7.5361328125, 8.35791015625, 9.1796875, 10.00146484375, 10.8232421875, 11.64501953125, 12.466796875, 13.28857421875, 14.1103515625, 14.93212890625, 15.75390625, 16.57568359375, 17.3974609375, 18.21923828125, 19.041015625, 19.86279296875, 20.6845703125, 21.50634765625, 22.328125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 64.0, 954.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0713794231414795, -0.7348067760467529, -0.39823412895202637, -0.061661481857299805, 0.27491116523742676, 0.6114838123321533, 0.9480564594268799, 1.2846291065216064, 1.621201753616333, 1.9577744007110596, 2.294347047805786, 2.6309196949005127, 2.9674923419952393, 3.304064989089966, 3.6406376361846924, 3.977210283279419, 4.313782691955566, 4.650355339050293, 4.9869279861450195, 5.323500633239746, 5.660073280334473, 5.996645927429199, 6.333218574523926, 6.669791221618652, 7.006363868713379, 7.3429365158081055, 7.679509162902832, 8.016081809997559, 8.352654457092285, 8.689227104187012, 9.025799751281738, 9.362372398376465, 9.698945999145508, 10.035518646240234, 10.372091293334961, 10.708663940429688, 11.045236587524414, 11.38180923461914, 11.718381881713867, 12.054954528808594, 12.39152717590332, 12.728099822998047, 13.064672470092773, 13.4012451171875, 13.737817764282227, 14.074390411376953, 14.41096305847168, 14.747535705566406, 15.084108352661133, 15.42068099975586, 15.757253646850586, 16.093826293945312, 16.43039894104004, 16.766971588134766, 17.103544235229492, 17.44011688232422, 17.776689529418945, 18.113262176513672, 18.4498348236084, 18.786407470703125, 19.12298011779785, 19.459552764892578, 19.796125411987305, 20.13269805908203, 20.469270706176758]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 7.0, 11.0, 12.0, 13.0, 13.0, 22.0, 24.0, 18.0, 33.0, 27.0, 31.0, 56.0, 43.0, 31.0, 28.0, 41.0, 57.0, 46.0, 48.0, 43.0, 33.0, 40.0, 44.0, 39.0, 32.0, 36.0, 24.0, 24.0, 20.0, 22.0, 16.0, 12.0, 13.0, 5.0, 10.0, 8.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2212004661560059, -1.1785672903060913, -1.1359341144561768, -1.0933010578155518, -1.0506678819656372, -1.0080347061157227, -0.9654015898704529, -0.9227684736251831, -0.8801352977752686, -0.837502121925354, -0.7948690056800842, -0.7522358894348145, -0.7096027135848999, -0.6669695377349854, -0.6243364214897156, -0.5817033052444458, -0.5390701293945312, -0.4964369833469391, -0.4538038372993469, -0.41117069125175476, -0.3685375452041626, -0.32590439915657043, -0.28327125310897827, -0.2406381070613861, -0.19800496101379395, -0.15537181496620178, -0.11273866891860962, -0.07010552287101746, -0.027472376823425293, 0.01516076922416687, 0.05779391527175903, 0.1004270613193512, 0.14306020736694336, 0.18569335341453552, 0.22832649946212769, 0.27095964550971985, 0.313592791557312, 0.3562259376049042, 0.39885908365249634, 0.4414922297000885, 0.48412537574768066, 0.5267585515975952, 0.569391667842865, 0.6120247840881348, 0.6546579599380493, 0.6972911357879639, 0.7399242520332336, 0.7825573682785034, 0.825190544128418, 0.8678237199783325, 0.9104568362236023, 0.9530899524688721, 0.9957231283187866, 1.0383563041687012, 1.0809893608093262, 1.1236225366592407, 1.1662557125091553, 1.2088888883590698, 1.2515220642089844, 1.2941551208496094, 1.336788296699524, 1.3794214725494385, 1.4220545291900635, 1.464687705039978, 1.5073208808898926]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 10.0, 9.0, 16.0, 15.0, 24.0, 39.0, 26.0, 34.0, 42.0, 34.0, 45.0, 52.0, 36.0, 49.0, 65.0, 39.0, 48.0, 45.0, 40.0, 42.0, 34.0, 32.0, 37.0, 30.0, 19.0, 24.0, 8.0, 17.0, 9.0, 16.0, 11.0, 4.0, 2.0, 6.0, 1.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-63.9375, -61.97314453125, -60.0087890625, -58.04443359375, -56.080078125, -54.11572265625, -52.1513671875, -50.18701171875, -48.22265625, -46.25830078125, -44.2939453125, -42.32958984375, -40.365234375, -38.40087890625, -36.4365234375, -34.47216796875, -32.5078125, -30.54345703125, -28.5791015625, -26.61474609375, -24.650390625, -22.68603515625, -20.7216796875, -18.75732421875, -16.79296875, -14.82861328125, -12.8642578125, -10.89990234375, -8.935546875, -6.97119140625, -5.0068359375, -3.04248046875, -1.078125, 0.88623046875, 2.8505859375, 4.81494140625, 6.779296875, 8.74365234375, 10.7080078125, 12.67236328125, 14.63671875, 16.60107421875, 18.5654296875, 20.52978515625, 22.494140625, 24.45849609375, 26.4228515625, 28.38720703125, 30.3515625, 32.31591796875, 34.2802734375, 36.24462890625, 38.208984375, 40.17333984375, 42.1376953125, 44.10205078125, 46.06640625, 48.03076171875, 49.9951171875, 51.95947265625, 53.923828125, 55.88818359375, 57.8525390625, 59.81689453125, 61.78125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 3.0, 6.0, 8.0, 10.0, 12.0, 13.0, 22.0, 20.0, 46.0, 43.0, 55.0, 80.0, 127.0, 167.0, 245.0, 348.0, 482.0, 836.0, 1648.0, 3322.0, 8077.0, 26375.0, 212184.0, 716748.0, 54750.0, 12860.0, 4740.0, 2154.0, 1130.0, 666.0, 413.0, 273.0, 184.0, 115.0, 95.0, 58.0, 59.0, 49.0, 39.0, 26.0, 11.0, 14.0, 12.0, 7.0, 9.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-59.65625, -57.8046875, -55.953125, -54.1015625, -52.25, -50.3984375, -48.546875, -46.6953125, -44.84375, -42.9921875, -41.140625, -39.2890625, -37.4375, -35.5859375, -33.734375, -31.8828125, -30.03125, -28.1796875, -26.328125, -24.4765625, -22.625, -20.7734375, -18.921875, -17.0703125, -15.21875, -13.3671875, -11.515625, -9.6640625, -7.8125, -5.9609375, -4.109375, -2.2578125, -0.40625, 1.4453125, 3.296875, 5.1484375, 7.0, 8.8515625, 10.703125, 12.5546875, 14.40625, 16.2578125, 18.109375, 19.9609375, 21.8125, 23.6640625, 25.515625, 27.3671875, 29.21875, 31.0703125, 32.921875, 34.7734375, 36.625, 38.4765625, 40.328125, 42.1796875, 44.03125, 45.8828125, 47.734375, 49.5859375, 51.4375, 53.2890625, 55.140625, 56.9921875, 58.84375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 5.0, 5.0, 4.0, 7.0, 11.0, 9.0, 18.0, 23.0, 19.0, 15.0, 22.0, 31.0, 25.0, 27.0, 32.0, 39.0, 38.0, 48.0, 74.0, 103.0, 301.0, 1698.0, 84.0, 53.0, 55.0, 38.0, 41.0, 30.0, 29.0, 28.0, 27.0, 18.0, 20.0, 8.0, 6.0, 19.0, 10.0, 8.0, 7.0, 0.0, 2.0, 3.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-215.625, -209.291015625, -202.95703125, -196.623046875, -190.2890625, -183.955078125, -177.62109375, -171.287109375, -164.953125, -158.619140625, -152.28515625, -145.951171875, -139.6171875, -133.283203125, -126.94921875, -120.615234375, -114.28125, -107.947265625, -101.61328125, -95.279296875, -88.9453125, -82.611328125, -76.27734375, -69.943359375, -63.609375, -57.275390625, -50.94140625, -44.607421875, -38.2734375, -31.939453125, -25.60546875, -19.271484375, -12.9375, -6.603515625, -0.26953125, 6.064453125, 12.3984375, 18.732421875, 25.06640625, 31.400390625, 37.734375, 44.068359375, 50.40234375, 56.736328125, 63.0703125, 69.404296875, 75.73828125, 82.072265625, 88.40625, 94.740234375, 101.07421875, 107.408203125, 113.7421875, 120.076171875, 126.41015625, 132.744140625, 139.078125, 145.412109375, 151.74609375, 158.080078125, 164.4140625, 170.748046875, 177.08203125, 183.416015625, 189.75]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 4.0, 3.0, 3.0, 5.0, 10.0, 12.0, 18.0, 17.0, 17.0, 34.0, 48.0, 58.0, 69.0, 88.0, 126.0, 190.0, 402.0, 1252.0, 6707.0, 909151.0, 2218127.0, 6900.0, 1232.0, 375.0, 194.0, 148.0, 115.0, 93.0, 59.0, 52.0, 37.0, 25.0, 34.0, 25.0, 15.0, 12.0, 7.0, 10.0, 8.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-397.5, -383.30859375, -369.1171875, -354.92578125, -340.734375, -326.54296875, -312.3515625, -298.16015625, -283.96875, -269.77734375, -255.5859375, -241.39453125, -227.203125, -213.01171875, -198.8203125, -184.62890625, -170.4375, -156.24609375, -142.0546875, -127.86328125, -113.671875, -99.48046875, -85.2890625, -71.09765625, -56.90625, -42.71484375, -28.5234375, -14.33203125, -0.140625, 14.05078125, 28.2421875, 42.43359375, 56.625, 70.81640625, 85.0078125, 99.19921875, 113.390625, 127.58203125, 141.7734375, 155.96484375, 170.15625, 184.34765625, 198.5390625, 212.73046875, 226.921875, 241.11328125, 255.3046875, 269.49609375, 283.6875, 297.87890625, 312.0703125, 326.26171875, 340.453125, 354.64453125, 368.8359375, 383.02734375, 397.21875, 411.41015625, 425.6015625, 439.79296875, 453.984375, 468.17578125, 482.3671875, 496.55859375, 510.75]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 112.0, 656.0, 219.0, 20.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1361.9676513671875, -1330.0133056640625, -1298.058837890625, -1266.1044921875, -1234.1500244140625, -1202.1956787109375, -1170.2412109375, -1138.286865234375, -1106.33251953125, -1074.378173828125, -1042.4237060546875, -1010.4692993164062, -978.514892578125, -946.560546875, -914.6061401367188, -882.6517333984375, -850.697265625, -818.7428588867188, -786.7884521484375, -754.8340454101562, -722.879638671875, -690.92529296875, -658.9708862304688, -627.0164794921875, -595.0620727539062, -563.107666015625, -531.1532592773438, -499.1988830566406, -467.2444763183594, -435.2900695800781, -403.335693359375, -371.38128662109375, -339.42694091796875, -307.4725341796875, -275.51812744140625, -243.56375122070312, -211.60934448242188, -179.65493774414062, -147.70054626464844, -115.74615478515625, -83.791748046875, -51.83734893798828, -19.882949829101562, 12.071449279785156, 44.025848388671875, 75.98025512695312, 107.93464660644531, 139.8890380859375, 171.84344482421875, 203.7978515625, 235.7522430419922, 267.7066345214844, 299.6610412597656, 331.6154479980469, 363.56982421875, 395.52423095703125, 427.4786376953125, 459.43304443359375, 491.387451171875, 523.3418579101562, 555.2962646484375, 587.2506103515625, 619.2050170898438, 651.159423828125, 683.1138305664062]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 13.0, 7.0, 16.0, 8.0, 15.0, 23.0, 21.0, 22.0, 26.0, 27.0, 38.0, 32.0, 43.0, 37.0, 43.0, 35.0, 39.0, 41.0, 36.0, 32.0, 36.0, 39.0, 42.0, 39.0, 30.0, 30.0, 37.0, 20.0, 33.0, 19.0, 15.0, 12.0, 14.0, 16.0, 12.0, 5.0, 7.0, 3.0, 3.0, 4.0, 8.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-497.30914306640625, -481.456298828125, -465.60345458984375, -449.7505798339844, -433.8977355957031, -418.0448913574219, -402.1920166015625, -386.33917236328125, -370.486328125, -354.63348388671875, -338.7806396484375, -322.9277648925781, -307.0749206542969, -291.2220764160156, -275.36920166015625, -259.516357421875, -243.66351318359375, -227.8106689453125, -211.9578094482422, -196.10494995117188, -180.25210571289062, -164.39926147460938, -148.54640197753906, -132.69354248046875, -116.8406982421875, -100.98784637451172, -85.13499450683594, -69.28214263916016, -53.429290771484375, -37.576438903808594, -21.723587036132812, -5.870735168457031, 9.98211669921875, 25.83496856689453, 41.68782043457031, 57.540672302246094, 73.39352416992188, 89.24637603759766, 105.09922790527344, 120.95207977294922, 136.804931640625, 152.65777587890625, 168.51063537597656, 184.36349487304688, 200.21633911132812, 216.06918334960938, 231.9220428466797, 247.77490234375, 263.62774658203125, 279.4805908203125, 295.33343505859375, 311.1863098144531, 327.0391540527344, 342.8919982910156, 358.744873046875, 374.59771728515625, 390.4505615234375, 406.30340576171875, 422.15625, 438.0091247558594, 453.8619689941406, 469.7148132324219, 485.56768798828125, 501.4205322265625, 517.2733764648438]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 6.0, 12.0, 7.0, 12.0, 4.0, 16.0, 15.0, 18.0, 38.0, 22.0, 34.0, 42.0, 37.0, 45.0, 37.0, 52.0, 49.0, 46.0, 48.0, 54.0, 46.0, 42.0, 37.0, 37.0, 35.0, 26.0, 34.0, 30.0, 25.0, 11.0, 16.0, 9.0, 13.0, 10.0, 8.0, 9.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-64.625, -62.6064453125, -60.587890625, -58.5693359375, -56.55078125, -54.5322265625, -52.513671875, -50.4951171875, -48.4765625, -46.4580078125, -44.439453125, -42.4208984375, -40.40234375, -38.3837890625, -36.365234375, -34.3466796875, -32.328125, -30.3095703125, -28.291015625, -26.2724609375, -24.25390625, -22.2353515625, -20.216796875, -18.1982421875, -16.1796875, -14.1611328125, -12.142578125, -10.1240234375, -8.10546875, -6.0869140625, -4.068359375, -2.0498046875, -0.03125, 1.9873046875, 4.005859375, 6.0244140625, 8.04296875, 10.0615234375, 12.080078125, 14.0986328125, 16.1171875, 18.1357421875, 20.154296875, 22.1728515625, 24.19140625, 26.2099609375, 28.228515625, 30.2470703125, 32.265625, 34.2841796875, 36.302734375, 38.3212890625, 40.33984375, 42.3583984375, 44.376953125, 46.3955078125, 48.4140625, 50.4326171875, 52.451171875, 54.4697265625, 56.48828125, 58.5068359375, 60.525390625, 62.5439453125, 64.5625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 10.0, 15.0, 16.0, 24.0, 43.0, 48.0, 68.0, 70.0, 115.0, 165.0, 235.0, 342.0, 456.0, 701.0, 1064.0, 1715.0, 2768.0, 4995.0, 9826.0, 27637.0, 227777.0, 2725481.0, 1070936.0, 84881.0, 16586.0, 7490.0, 4013.0, 2314.0, 1486.0, 910.0, 620.0, 430.0, 283.0, 212.0, 159.0, 105.0, 70.0, 53.0, 41.0, 36.0, 27.0, 11.0, 12.0, 7.0, 7.0, 5.0, 4.0, 0.0, 6.0, 2.0, 1.0, 1.0], "bins": [-124.0625, -120.3916015625, -116.720703125, -113.0498046875, -109.37890625, -105.7080078125, -102.037109375, -98.3662109375, -94.6953125, -91.0244140625, -87.353515625, -83.6826171875, -80.01171875, -76.3408203125, -72.669921875, -68.9990234375, -65.328125, -61.6572265625, -57.986328125, -54.3154296875, -50.64453125, -46.9736328125, -43.302734375, -39.6318359375, -35.9609375, -32.2900390625, -28.619140625, -24.9482421875, -21.27734375, -17.6064453125, -13.935546875, -10.2646484375, -6.59375, -2.9228515625, 0.748046875, 4.4189453125, 8.08984375, 11.7607421875, 15.431640625, 19.1025390625, 22.7734375, 26.4443359375, 30.115234375, 33.7861328125, 37.45703125, 41.1279296875, 44.798828125, 48.4697265625, 52.140625, 55.8115234375, 59.482421875, 63.1533203125, 66.82421875, 70.4951171875, 74.166015625, 77.8369140625, 81.5078125, 85.1787109375, 88.849609375, 92.5205078125, 96.19140625, 99.8623046875, 103.533203125, 107.2041015625, 110.875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 7.0, 9.0, 17.0, 16.0, 31.0, 45.0, 74.0, 110.0, 145.0, 332.0, 751.0, 1151.0, 645.0, 290.0, 150.0, 93.0, 66.0, 30.0, 30.0, 16.0, 8.0, 15.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.625, -134.876953125, -130.12890625, -125.380859375, -120.6328125, -115.884765625, -111.13671875, -106.388671875, -101.640625, -96.892578125, -92.14453125, -87.396484375, -82.6484375, -77.900390625, -73.15234375, -68.404296875, -63.65625, -58.908203125, -54.16015625, -49.412109375, -44.6640625, -39.916015625, -35.16796875, -30.419921875, -25.671875, -20.923828125, -16.17578125, -11.427734375, -6.6796875, -1.931640625, 2.81640625, 7.564453125, 12.3125, 17.060546875, 21.80859375, 26.556640625, 31.3046875, 36.052734375, 40.80078125, 45.548828125, 50.296875, 55.044921875, 59.79296875, 64.541015625, 69.2890625, 74.037109375, 78.78515625, 83.533203125, 88.28125, 93.029296875, 97.77734375, 102.525390625, 107.2734375, 112.021484375, 116.76953125, 121.517578125, 126.265625, 131.013671875, 135.76171875, 140.509765625, 145.2578125, 150.005859375, 154.75390625, 159.501953125, 164.25]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 9.0, 6.0, 5.0, 9.0, 16.0, 22.0, 29.0, 31.0, 41.0, 58.0, 102.0, 134.0, 196.0, 334.0, 816.0, 2798.0, 15145.0, 270505.0, 3854799.0, 41241.0, 5353.0, 1249.0, 510.0, 269.0, 155.0, 112.0, 82.0, 53.0, 56.0, 34.0, 23.0, 22.0, 20.0, 12.0, 4.0, 10.0, 5.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-411.75, -397.16015625, -382.5703125, -367.98046875, -353.390625, -338.80078125, -324.2109375, -309.62109375, -295.03125, -280.44140625, -265.8515625, -251.26171875, -236.671875, -222.08203125, -207.4921875, -192.90234375, -178.3125, -163.72265625, -149.1328125, -134.54296875, -119.953125, -105.36328125, -90.7734375, -76.18359375, -61.59375, -47.00390625, -32.4140625, -17.82421875, -3.234375, 11.35546875, 25.9453125, 40.53515625, 55.125, 69.71484375, 84.3046875, 98.89453125, 113.484375, 128.07421875, 142.6640625, 157.25390625, 171.84375, 186.43359375, 201.0234375, 215.61328125, 230.203125, 244.79296875, 259.3828125, 273.97265625, 288.5625, 303.15234375, 317.7421875, 332.33203125, 346.921875, 361.51171875, 376.1015625, 390.69140625, 405.28125, 419.87109375, 434.4609375, 449.05078125, 463.640625, 478.23046875, 492.8203125, 507.41015625, 522.0]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 9.0, 25.0, 36.0, 115.0, 261.0, 298.0, 142.0, 69.0, 27.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1765.814697265625, -1730.64111328125, -1695.467529296875, -1660.2939453125, -1625.120361328125, -1589.94677734375, -1554.773193359375, -1519.5994873046875, -1484.4259033203125, -1449.2523193359375, -1414.0787353515625, -1378.9051513671875, -1343.7315673828125, -1308.557861328125, -1273.38427734375, -1238.210693359375, -1203.037109375, -1167.863525390625, -1132.68994140625, -1097.516357421875, -1062.3427734375, -1027.169189453125, -991.9955444335938, -956.8219604492188, -921.6484375, -886.474853515625, -851.30126953125, -816.127685546875, -780.9540405273438, -745.7804565429688, -710.6068725585938, -675.4332885742188, -640.2595825195312, -605.0859985351562, -569.9124145507812, -534.73876953125, -499.565185546875, -464.3916015625, -429.218017578125, -394.04443359375, -358.8708190917969, -323.6972351074219, -288.52362060546875, -253.35003662109375, -218.1764373779297, -183.00283813476562, -147.82925415039062, -112.65565490722656, -77.4820556640625, -42.3084602355957, -7.134864807128906, 28.038726806640625, 63.21232604980469, 98.38592529296875, 133.55950927734375, 168.7331085205078, 203.90670776367188, 239.08030700683594, 274.25390625, 309.427490234375, 344.60107421875, 379.7746887207031, 414.9482727050781, 450.12188720703125, 485.29547119140625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 8.0, 15.0, 12.0, 7.0, 11.0, 14.0, 24.0, 22.0, 25.0, 25.0, 25.0, 33.0, 29.0, 36.0, 46.0, 51.0, 35.0, 45.0, 29.0, 29.0, 34.0, 39.0, 31.0, 32.0, 40.0, 25.0, 34.0, 31.0, 27.0, 20.0, 19.0, 21.0, 13.0, 16.0, 18.0, 11.0, 12.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-269.7220764160156, -260.63629150390625, -251.55050659179688, -242.46470642089844, -233.37892150878906, -224.2931365966797, -215.20733642578125, -206.12155151367188, -197.0357666015625, -187.94998168945312, -178.86419677734375, -169.7783966064453, -160.69261169433594, -151.60682678222656, -142.52102661132812, -133.43524169921875, -124.34945678710938, -115.263671875, -106.1778793334961, -97.09208679199219, -88.00630187988281, -78.92051696777344, -69.83472442626953, -60.74893569946289, -51.66314697265625, -42.57735824584961, -33.49156951904297, -24.405780792236328, -15.319992065429688, -6.234203338623047, 2.8515853881835938, 11.937374114990234, 21.02313232421875, 30.10892105102539, 39.19470977783203, 48.28049850463867, 57.36628723144531, 66.45207214355469, 75.5378646850586, 84.6236572265625, 93.70944213867188, 102.79522705078125, 111.88101959228516, 120.96681213378906, 130.05259704589844, 139.1383819580078, 148.22418212890625, 157.30996704101562, 166.395751953125, 175.48153686523438, 184.56732177734375, 193.6531219482422, 202.73890686035156, 211.82469177246094, 220.91049194335938, 229.99627685546875, 239.08206176757812, 248.1678466796875, 257.2536315917969, 266.33941650390625, 275.42523193359375, 284.5110168457031, 293.5968017578125, 302.6825866699219, 311.76837158203125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 1.0, 4.0, 12.0, 7.0, 23.0, 13.0, 22.0, 25.0, 25.0, 25.0, 41.0, 37.0, 36.0, 41.0, 54.0, 51.0, 58.0, 55.0, 59.0, 45.0, 50.0, 34.0, 46.0, 33.0, 31.0, 26.0, 25.0, 22.0, 17.0, 24.0, 10.0, 12.0, 8.0, 3.0, 11.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.0, -64.8623046875, -62.724609375, -60.5869140625, -58.44921875, -56.3115234375, -54.173828125, -52.0361328125, -49.8984375, -47.7607421875, -45.623046875, -43.4853515625, -41.34765625, -39.2099609375, -37.072265625, -34.9345703125, -32.796875, -30.6591796875, -28.521484375, -26.3837890625, -24.24609375, -22.1083984375, -19.970703125, -17.8330078125, -15.6953125, -13.5576171875, -11.419921875, -9.2822265625, -7.14453125, -5.0068359375, -2.869140625, -0.7314453125, 1.40625, 3.5439453125, 5.681640625, 7.8193359375, 9.95703125, 12.0947265625, 14.232421875, 16.3701171875, 18.5078125, 20.6455078125, 22.783203125, 24.9208984375, 27.05859375, 29.1962890625, 31.333984375, 33.4716796875, 35.609375, 37.7470703125, 39.884765625, 42.0224609375, 44.16015625, 46.2978515625, 48.435546875, 50.5732421875, 52.7109375, 54.8486328125, 56.986328125, 59.1240234375, 61.26171875, 63.3994140625, 65.537109375, 67.6748046875, 69.8125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 8.0, 15.0, 15.0, 23.0, 35.0, 50.0, 82.0, 112.0, 163.0, 253.0, 467.0, 791.0, 1512.0, 2894.0, 5985.0, 12692.0, 28451.0, 71052.0, 198245.0, 449582.0, 167468.0, 60850.0, 25317.0, 11303.0, 5318.0, 2586.0, 1349.0, 742.0, 423.0, 267.0, 147.0, 104.0, 61.0, 37.0, 52.0, 26.0, 16.0, 15.0, 9.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3203125, -8.027587890625, -7.73486328125, -7.442138671875, -7.1494140625, -6.856689453125, -6.56396484375, -6.271240234375, -5.978515625, -5.685791015625, -5.39306640625, -5.100341796875, -4.8076171875, -4.514892578125, -4.22216796875, -3.929443359375, -3.63671875, -3.343994140625, -3.05126953125, -2.758544921875, -2.4658203125, -2.173095703125, -1.88037109375, -1.587646484375, -1.294921875, -1.002197265625, -0.70947265625, -0.416748046875, -0.1240234375, 0.168701171875, 0.46142578125, 0.754150390625, 1.046875, 1.339599609375, 1.63232421875, 1.925048828125, 2.2177734375, 2.510498046875, 2.80322265625, 3.095947265625, 3.388671875, 3.681396484375, 3.97412109375, 4.266845703125, 4.5595703125, 4.852294921875, 5.14501953125, 5.437744140625, 5.73046875, 6.023193359375, 6.31591796875, 6.608642578125, 6.9013671875, 7.194091796875, 7.48681640625, 7.779541015625, 8.072265625, 8.364990234375, 8.65771484375, 8.950439453125, 9.2431640625, 9.535888671875, 9.82861328125, 10.121337890625, 10.4140625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 10.0, 3.0, 11.0, 8.0, 12.0, 15.0, 10.0, 11.0, 17.0, 21.0, 14.0, 43.0, 23.0, 21.0, 42.0, 41.0, 38.0, 38.0, 38.0, 40.0, 1058.0, 43.0, 32.0, 49.0, 37.0, 40.0, 28.0, 34.0, 31.0, 26.0, 22.0, 20.0, 12.0, 27.0, 21.0, 21.0, 16.0, 15.0, 7.0, 6.0, 7.0, 2.0, 9.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-39.75, -38.61083984375, -37.4716796875, -36.33251953125, -35.193359375, -34.05419921875, -32.9150390625, -31.77587890625, -30.63671875, -29.49755859375, -28.3583984375, -27.21923828125, -26.080078125, -24.94091796875, -23.8017578125, -22.66259765625, -21.5234375, -20.38427734375, -19.2451171875, -18.10595703125, -16.966796875, -15.82763671875, -14.6884765625, -13.54931640625, -12.41015625, -11.27099609375, -10.1318359375, -8.99267578125, -7.853515625, -6.71435546875, -5.5751953125, -4.43603515625, -3.296875, -2.15771484375, -1.0185546875, 0.12060546875, 1.259765625, 2.39892578125, 3.5380859375, 4.67724609375, 5.81640625, 6.95556640625, 8.0947265625, 9.23388671875, 10.373046875, 11.51220703125, 12.6513671875, 13.79052734375, 14.9296875, 16.06884765625, 17.2080078125, 18.34716796875, 19.486328125, 20.62548828125, 21.7646484375, 22.90380859375, 24.04296875, 25.18212890625, 26.3212890625, 27.46044921875, 28.599609375, 29.73876953125, 30.8779296875, 32.01708984375, 33.15625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 9.0, 26.0, 33.0, 42.0, 42.0, 88.0, 126.0, 168.0, 310.0, 378.0, 606.0, 907.0, 1316.0, 2054.0, 3185.0, 4946.0, 7672.0, 12122.0, 19278.0, 31611.0, 54117.0, 96298.0, 183120.0, 1303952.0, 160863.0, 86433.0, 49405.0, 29213.0, 17764.0, 11090.0, 6808.0, 4460.0, 2902.0, 1929.0, 1231.0, 807.0, 585.0, 352.0, 292.0, 188.0, 121.0, 95.0, 48.0, 42.0, 24.0, 23.0, 15.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.87890625, -2.787261962890625, -2.69561767578125, -2.603973388671875, -2.5123291015625, -2.420684814453125, -2.32904052734375, -2.237396240234375, -2.145751953125, -2.054107666015625, -1.96246337890625, -1.870819091796875, -1.7791748046875, -1.687530517578125, -1.59588623046875, -1.504241943359375, -1.41259765625, -1.320953369140625, -1.22930908203125, -1.137664794921875, -1.0460205078125, -0.954376220703125, -0.86273193359375, -0.771087646484375, -0.679443359375, -0.587799072265625, -0.49615478515625, -0.404510498046875, -0.3128662109375, -0.221221923828125, -0.12957763671875, -0.037933349609375, 0.0537109375, 0.145355224609375, 0.23699951171875, 0.328643798828125, 0.4202880859375, 0.511932373046875, 0.60357666015625, 0.695220947265625, 0.786865234375, 0.878509521484375, 0.97015380859375, 1.061798095703125, 1.1534423828125, 1.245086669921875, 1.33673095703125, 1.428375244140625, 1.52001953125, 1.611663818359375, 1.70330810546875, 1.794952392578125, 1.8865966796875, 1.978240966796875, 2.06988525390625, 2.161529541015625, 2.253173828125, 2.344818115234375, 2.43646240234375, 2.528106689453125, 2.6197509765625, 2.711395263671875, 2.80303955078125, 2.894683837890625, 2.986328125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 8.0, 13.0, 16.0, 17.0, 13.0, 38.0, 42.0, 63.0, 102.0, 198.0, 167.0, 108.0, 57.0, 40.0, 33.0, 20.0, 7.0, 7.0, 9.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4306640625, -0.41710662841796875, -0.4035491943359375, -0.38999176025390625, -0.376434326171875, -0.36287689208984375, -0.3493194580078125, -0.33576202392578125, -0.32220458984375, -0.30864715576171875, -0.2950897216796875, -0.28153228759765625, -0.267974853515625, -0.25441741943359375, -0.2408599853515625, -0.22730255126953125, -0.2137451171875, -0.20018768310546875, -0.1866302490234375, -0.17307281494140625, -0.159515380859375, -0.14595794677734375, -0.1324005126953125, -0.11884307861328125, -0.10528564453125, -0.09172821044921875, -0.0781707763671875, -0.06461334228515625, -0.051055908203125, -0.03749847412109375, -0.0239410400390625, -0.01038360595703125, 0.003173828125, 0.01673126220703125, 0.0302886962890625, 0.04384613037109375, 0.057403564453125, 0.07096099853515625, 0.0845184326171875, 0.09807586669921875, 0.11163330078125, 0.12519073486328125, 0.1387481689453125, 0.15230560302734375, 0.165863037109375, 0.17942047119140625, 0.1929779052734375, 0.20653533935546875, 0.2200927734375, 0.23365020751953125, 0.2472076416015625, 0.26076507568359375, 0.274322509765625, 0.28787994384765625, 0.3014373779296875, 0.31499481201171875, 0.32855224609375, 0.34210968017578125, 0.3556671142578125, 0.36922454833984375, 0.382781982421875, 0.39633941650390625, 0.4098968505859375, 0.42345428466796875, 0.43701171875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 9.0, 6.0, 11.0, 14.0, 34.0, 35.0, 69.0, 132.0, 523.0, 1047213.0, 212.0, 101.0, 52.0, 33.0, 21.0, 15.0, 16.0, 10.0, 12.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.0546875, -13.6192626953125, -13.183837890625, -12.7484130859375, -12.31298828125, -11.8775634765625, -11.442138671875, -11.0067138671875, -10.5712890625, -10.1358642578125, -9.700439453125, -9.2650146484375, -8.82958984375, -8.3941650390625, -7.958740234375, -7.5233154296875, -7.087890625, -6.6524658203125, -6.217041015625, -5.7816162109375, -5.34619140625, -4.9107666015625, -4.475341796875, -4.0399169921875, -3.6044921875, -3.1690673828125, -2.733642578125, -2.2982177734375, -1.86279296875, -1.4273681640625, -0.991943359375, -0.5565185546875, -0.12109375, 0.3143310546875, 0.749755859375, 1.1851806640625, 1.62060546875, 2.0560302734375, 2.491455078125, 2.9268798828125, 3.3623046875, 3.7977294921875, 4.233154296875, 4.6685791015625, 5.10400390625, 5.5394287109375, 5.974853515625, 6.4102783203125, 6.845703125, 7.2811279296875, 7.716552734375, 8.1519775390625, 8.58740234375, 9.0228271484375, 9.458251953125, 9.8936767578125, 10.3291015625, 10.7645263671875, 11.199951171875, 11.6353759765625, 12.07080078125, 12.5062255859375, 12.941650390625, 13.3770751953125, 13.8125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 11.0, 980.0, 28.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36365607380867004, -0.28428715467453003, -0.20491823554039001, -0.12554931640625, -0.046180397272109985, 0.03318852186203003, 0.11255744099617004, 0.19192633032798767, 0.2712952792644501, 0.3506641983985901, 0.4300331175327301, 0.5094020366668701, 0.5887709856033325, 0.6681398749351501, 0.7475087642669678, 0.8268777132034302, 0.9062466621398926, 0.985615611076355, 1.0649845600128174, 1.1443533897399902, 1.2237223386764526, 1.303091287612915, 1.382460117340088, 1.4618290662765503, 1.5411980152130127, 1.620566964149475, 1.6999359130859375, 1.7793047428131104, 1.8586736917495728, 1.9380426406860352, 2.017411470413208, 2.096780300140381, 2.176149368286133, 2.2555181980133057, 2.3348872661590576, 2.4142560958862305, 2.4936251640319824, 2.5729939937591553, 2.652362823486328, 2.73173189163208, 2.811100721359253, 2.890469551086426, 2.9698386192321777, 3.0492074489593506, 3.1285762786865234, 3.2079453468322754, 3.2873141765594482, 3.366683006286621, 3.446052074432373, 3.525420904159546, 3.604789972305298, 3.6841588020324707, 3.7635278701782227, 3.8428966999053955, 3.9222655296325684, 4.00163459777832, 4.081003189086914, 4.160372257232666, 4.23974084854126, 4.319109916687012, 4.398478984832764, 4.477847576141357, 4.557216644287109, 4.636585712432861, 4.715954780578613]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 5.0, 10.0, 13.0, 16.0, 16.0, 20.0, 20.0, 25.0, 32.0, 33.0, 42.0, 27.0, 37.0, 43.0, 40.0, 36.0, 38.0, 42.0, 42.0, 54.0, 47.0, 42.0, 41.0, 33.0, 38.0, 27.0, 25.0, 30.0, 16.0, 17.0, 18.0, 17.0, 10.0, 5.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22160261869430542, -0.2148842215538025, -0.20816582441329956, -0.20144742727279663, -0.1947290301322937, -0.18801063299179077, -0.18129223585128784, -0.1745738387107849, -0.16785544157028198, -0.16113704442977905, -0.15441864728927612, -0.1477002501487732, -0.14098185300827026, -0.13426345586776733, -0.1275450587272644, -0.12082665413618088, -0.11410824954509735, -0.10738985240459442, -0.10067145526409149, -0.09395305812358856, -0.08723466098308563, -0.0805162638425827, -0.07379785925149918, -0.06707946211099625, -0.06036106497049332, -0.05364266782999039, -0.04692427068948746, -0.04020586982369423, -0.0334874726831913, -0.02676907554268837, -0.02005067467689514, -0.013332277536392212, -0.006613880395889282, 0.00010451767593622208, 0.006822915747761726, 0.013541314750909805, 0.020259711891412735, 0.026978109031915665, 0.03369650989770889, 0.04041490703821182, 0.04713330417871475, 0.05385170131921768, 0.06057009845972061, 0.06728850305080414, 0.07400690019130707, 0.08072529733181, 0.08744369447231293, 0.09416209161281586, 0.10088048875331879, 0.10759888589382172, 0.11431728303432465, 0.12103568017482758, 0.1277540773153305, 0.13447247445583344, 0.14119088649749756, 0.1479092836380005, 0.15462768077850342, 0.16134607791900635, 0.16806447505950928, 0.1747828722000122, 0.18150126934051514, 0.18821966648101807, 0.194938063621521, 0.20165646076202393, 0.20837485790252686]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 1.0, 4.0, 12.0, 7.0, 23.0, 13.0, 22.0, 25.0, 25.0, 25.0, 41.0, 37.0, 36.0, 41.0, 54.0, 51.0, 58.0, 55.0, 59.0, 45.0, 50.0, 34.0, 47.0, 32.0, 31.0, 26.0, 25.0, 22.0, 17.0, 24.0, 10.0, 12.0, 8.0, 3.0, 11.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.0, -64.8623046875, -62.724609375, -60.5869140625, -58.44921875, -56.3115234375, -54.173828125, -52.0361328125, -49.8984375, -47.7607421875, -45.623046875, -43.4853515625, -41.34765625, -39.2099609375, -37.072265625, -34.9345703125, -32.796875, -30.6591796875, -28.521484375, -26.3837890625, -24.24609375, -22.1083984375, -19.970703125, -17.8330078125, -15.6953125, -13.5576171875, -11.419921875, -9.2822265625, -7.14453125, -5.0068359375, -2.869140625, -0.7314453125, 1.40625, 3.5439453125, 5.681640625, 7.8193359375, 9.95703125, 12.0947265625, 14.232421875, 16.3701171875, 18.5078125, 20.6455078125, 22.783203125, 24.9208984375, 27.05859375, 29.1962890625, 31.333984375, 33.4716796875, 35.609375, 37.7470703125, 39.884765625, 42.0224609375, 44.16015625, 46.2978515625, 48.435546875, 50.5732421875, 52.7109375, 54.8486328125, 56.986328125, 59.1240234375, 61.26171875, 63.3994140625, 65.537109375, 67.6748046875, 69.8125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 13.0, 17.0, 25.0, 43.0, 50.0, 69.0, 101.0, 143.0, 222.0, 282.0, 437.0, 706.0, 1043.0, 1713.0, 3013.0, 6548.0, 36024.0, 873632.0, 104686.0, 10285.0, 3679.0, 2107.0, 1258.0, 775.0, 528.0, 337.0, 240.0, 154.0, 120.0, 65.0, 60.0, 45.0, 34.0, 23.0, 14.0, 8.0, 13.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-141.0, -137.0478515625, -133.095703125, -129.1435546875, -125.19140625, -121.2392578125, -117.287109375, -113.3349609375, -109.3828125, -105.4306640625, -101.478515625, -97.5263671875, -93.57421875, -89.6220703125, -85.669921875, -81.7177734375, -77.765625, -73.8134765625, -69.861328125, -65.9091796875, -61.95703125, -58.0048828125, -54.052734375, -50.1005859375, -46.1484375, -42.1962890625, -38.244140625, -34.2919921875, -30.33984375, -26.3876953125, -22.435546875, -18.4833984375, -14.53125, -10.5791015625, -6.626953125, -2.6748046875, 1.27734375, 5.2294921875, 9.181640625, 13.1337890625, 17.0859375, 21.0380859375, 24.990234375, 28.9423828125, 32.89453125, 36.8466796875, 40.798828125, 44.7509765625, 48.703125, 52.6552734375, 56.607421875, 60.5595703125, 64.51171875, 68.4638671875, 72.416015625, 76.3681640625, 80.3203125, 84.2724609375, 88.224609375, 92.1767578125, 96.12890625, 100.0810546875, 104.033203125, 107.9853515625, 111.9375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 5.0, 5.0, 8.0, 7.0, 7.0, 20.0, 16.0, 20.0, 26.0, 26.0, 28.0, 38.0, 40.0, 34.0, 53.0, 55.0, 63.0, 138.0, 1753.0, 191.0, 96.0, 49.0, 50.0, 48.0, 37.0, 31.0, 32.0, 36.0, 25.0, 18.0, 11.0, 11.0, 15.0, 5.0, 12.0, 10.0, 4.0, 7.0, 3.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-192.375, -185.669921875, -178.96484375, -172.259765625, -165.5546875, -158.849609375, -152.14453125, -145.439453125, -138.734375, -132.029296875, -125.32421875, -118.619140625, -111.9140625, -105.208984375, -98.50390625, -91.798828125, -85.09375, -78.388671875, -71.68359375, -64.978515625, -58.2734375, -51.568359375, -44.86328125, -38.158203125, -31.453125, -24.748046875, -18.04296875, -11.337890625, -4.6328125, 2.072265625, 8.77734375, 15.482421875, 22.1875, 28.892578125, 35.59765625, 42.302734375, 49.0078125, 55.712890625, 62.41796875, 69.123046875, 75.828125, 82.533203125, 89.23828125, 95.943359375, 102.6484375, 109.353515625, 116.05859375, 122.763671875, 129.46875, 136.173828125, 142.87890625, 149.583984375, 156.2890625, 162.994140625, 169.69921875, 176.404296875, 183.109375, 189.814453125, 196.51953125, 203.224609375, 209.9296875, 216.634765625, 223.33984375, 230.044921875, 236.75]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 11.0, 3.0, 4.0, 5.0, 15.0, 8.0, 12.0, 14.0, 23.0, 22.0, 30.0, 52.0, 56.0, 85.0, 103.0, 115.0, 244.0, 465.0, 1714.0, 13386.0, 3027979.0, 95049.0, 4416.0, 891.0, 359.0, 188.0, 108.0, 103.0, 61.0, 49.0, 38.0, 31.0, 25.0, 15.0, 6.0, 5.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-569.0, -551.6328125, -534.265625, -516.8984375, -499.53125, -482.1640625, -464.796875, -447.4296875, -430.0625, -412.6953125, -395.328125, -377.9609375, -360.59375, -343.2265625, -325.859375, -308.4921875, -291.125, -273.7578125, -256.390625, -239.0234375, -221.65625, -204.2890625, -186.921875, -169.5546875, -152.1875, -134.8203125, -117.453125, -100.0859375, -82.71875, -65.3515625, -47.984375, -30.6171875, -13.25, 4.1171875, 21.484375, 38.8515625, 56.21875, 73.5859375, 90.953125, 108.3203125, 125.6875, 143.0546875, 160.421875, 177.7890625, 195.15625, 212.5234375, 229.890625, 247.2578125, 264.625, 281.9921875, 299.359375, 316.7265625, 334.09375, 351.4609375, 368.828125, 386.1953125, 403.5625, 420.9296875, 438.296875, 455.6640625, 473.03125, 490.3984375, 507.765625, 525.1328125, 542.5]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [4.0, 168.0, 819.0, 28.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.09202575683594, -115.2530288696289, -24.414031982421875, 66.42497253417969, 157.2639617919922, 248.1029510498047, 338.94195556640625, 429.78094482421875, 520.6199340820312, 611.4589233398438, 702.2979125976562, 793.136962890625, 883.9759521484375, 974.81494140625, 1065.6539306640625, 1156.492919921875, 1247.3319091796875, 1338.1708984375, 1429.0098876953125, 1519.848876953125, 1610.6878662109375, 1701.52685546875, 1792.365966796875, 1883.204833984375, 1974.0439453125, 2064.883056640625, 2155.721923828125, 2246.56103515625, 2337.39990234375, 2428.239013671875, 2519.077880859375, 2609.9169921875, 2700.756103515625, 2791.59521484375, 2882.43408203125, 2973.273193359375, 3064.112060546875, 3154.951171875, 3245.7900390625, 3336.629150390625, 3427.468017578125, 3518.30712890625, 3609.14599609375, 3699.985107421875, 3790.823974609375, 3881.6630859375, 3972.501953125, 4063.341064453125, 4154.18017578125, 4245.01904296875, 4335.8583984375, 4426.697265625, 4517.5361328125, 4608.375, 4699.21435546875, 4790.05322265625, 4880.89208984375, 4971.73095703125, 5062.5703125, 5153.4091796875, 5244.248046875, 5335.0869140625, 5425.92626953125, 5516.76513671875, 5607.60400390625]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 7.0, 5.0, 11.0, 3.0, 9.0, 12.0, 14.0, 12.0, 26.0, 22.0, 20.0, 20.0, 16.0, 23.0, 25.0, 28.0, 27.0, 36.0, 30.0, 40.0, 38.0, 33.0, 43.0, 32.0, 47.0, 30.0, 39.0, 27.0, 29.0, 35.0, 31.0, 33.0, 23.0, 24.0, 22.0, 14.0, 13.0, 8.0, 5.0, 19.0, 16.0, 6.0, 8.0, 9.0, 7.0, 7.0, 6.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0], "bins": [-448.8605041503906, -435.37518310546875, -421.8898620605469, -408.404541015625, -394.9192199707031, -381.43389892578125, -367.9485778808594, -354.4632568359375, -340.9779357910156, -327.49261474609375, -314.0072937011719, -300.52197265625, -287.0366516113281, -273.55133056640625, -260.0660095214844, -246.5806884765625, -233.09535217285156, -219.6100311279297, -206.1247100830078, -192.63938903808594, -179.15406799316406, -165.66873168945312, -152.18341064453125, -138.69808959960938, -125.21277618408203, -111.72745513916016, -98.24213409423828, -84.75680541992188, -71.271484375, -57.786163330078125, -44.30084228515625, -30.815521240234375, -17.3302001953125, -3.8448781967163086, 9.640443801879883, 23.12576675415039, 36.611087799072266, 50.096412658691406, 63.58173370361328, 77.06705474853516, 90.55237579345703, 104.0376968383789, 117.52301788330078, 131.0083465576172, 144.49366760253906, 157.97898864746094, 171.4643096923828, 184.9496307373047, 198.43495178222656, 211.92027282714844, 225.4055938720703, 238.8909149169922, 252.37623596191406, 265.861572265625, 279.3468933105469, 292.83221435546875, 306.3175354003906, 319.8028564453125, 333.2881774902344, 346.77349853515625, 360.2588195800781, 373.744140625, 387.2294616699219, 400.71478271484375, 414.2001037597656]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 10.0, 12.0, 18.0, 19.0, 27.0, 19.0, 33.0, 23.0, 36.0, 34.0, 41.0, 46.0, 48.0, 50.0, 49.0, 55.0, 58.0, 60.0, 37.0, 33.0, 45.0, 28.0, 40.0, 26.0, 19.0, 20.0, 23.0, 18.0, 20.0, 12.0, 4.0, 8.0, 6.0, 6.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-68.125, -65.9462890625, -63.767578125, -61.5888671875, -59.41015625, -57.2314453125, -55.052734375, -52.8740234375, -50.6953125, -48.5166015625, -46.337890625, -44.1591796875, -41.98046875, -39.8017578125, -37.623046875, -35.4443359375, -33.265625, -31.0869140625, -28.908203125, -26.7294921875, -24.55078125, -22.3720703125, -20.193359375, -18.0146484375, -15.8359375, -13.6572265625, -11.478515625, -9.2998046875, -7.12109375, -4.9423828125, -2.763671875, -0.5849609375, 1.59375, 3.7724609375, 5.951171875, 8.1298828125, 10.30859375, 12.4873046875, 14.666015625, 16.8447265625, 19.0234375, 21.2021484375, 23.380859375, 25.5595703125, 27.73828125, 29.9169921875, 32.095703125, 34.2744140625, 36.453125, 38.6318359375, 40.810546875, 42.9892578125, 45.16796875, 47.3466796875, 49.525390625, 51.7041015625, 53.8828125, 56.0615234375, 58.240234375, 60.4189453125, 62.59765625, 64.7763671875, 66.955078125, 69.1337890625, 71.3125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 10.0, 15.0, 20.0, 21.0, 38.0, 51.0, 61.0, 91.0, 127.0, 186.0, 336.0, 537.0, 980.0, 2185.0, 5374.0, 15777.0, 113178.0, 3575949.0, 440036.0, 25354.0, 7750.0, 2972.0, 1390.0, 656.0, 394.0, 247.0, 149.0, 110.0, 80.0, 54.0, 40.0, 28.0, 20.0, 15.0, 8.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-233.75, -227.197265625, -220.64453125, -214.091796875, -207.5390625, -200.986328125, -194.43359375, -187.880859375, -181.328125, -174.775390625, -168.22265625, -161.669921875, -155.1171875, -148.564453125, -142.01171875, -135.458984375, -128.90625, -122.353515625, -115.80078125, -109.248046875, -102.6953125, -96.142578125, -89.58984375, -83.037109375, -76.484375, -69.931640625, -63.37890625, -56.826171875, -50.2734375, -43.720703125, -37.16796875, -30.615234375, -24.0625, -17.509765625, -10.95703125, -4.404296875, 2.1484375, 8.701171875, 15.25390625, 21.806640625, 28.359375, 34.912109375, 41.46484375, 48.017578125, 54.5703125, 61.123046875, 67.67578125, 74.228515625, 80.78125, 87.333984375, 93.88671875, 100.439453125, 106.9921875, 113.544921875, 120.09765625, 126.650390625, 133.203125, 139.755859375, 146.30859375, 152.861328125, 159.4140625, 165.966796875, 172.51953125, 179.072265625, 185.625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 8.0, 7.0, 5.0, 19.0, 24.0, 33.0, 59.0, 87.0, 160.0, 339.0, 739.0, 1230.0, 658.0, 289.0, 168.0, 93.0, 34.0, 33.0, 19.0, 15.0, 11.0, 8.0, 5.0, 6.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.875, -137.47265625, -132.0703125, -126.66796875, -121.265625, -115.86328125, -110.4609375, -105.05859375, -99.65625, -94.25390625, -88.8515625, -83.44921875, -78.046875, -72.64453125, -67.2421875, -61.83984375, -56.4375, -51.03515625, -45.6328125, -40.23046875, -34.828125, -29.42578125, -24.0234375, -18.62109375, -13.21875, -7.81640625, -2.4140625, 2.98828125, 8.390625, 13.79296875, 19.1953125, 24.59765625, 30.0, 35.40234375, 40.8046875, 46.20703125, 51.609375, 57.01171875, 62.4140625, 67.81640625, 73.21875, 78.62109375, 84.0234375, 89.42578125, 94.828125, 100.23046875, 105.6328125, 111.03515625, 116.4375, 121.83984375, 127.2421875, 132.64453125, 138.046875, 143.44921875, 148.8515625, 154.25390625, 159.65625, 165.05859375, 170.4609375, 175.86328125, 181.265625, 186.66796875, 192.0703125, 197.47265625, 202.875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 11.0, 9.0, 12.0, 13.0, 27.0, 30.0, 41.0, 41.0, 66.0, 118.0, 132.0, 233.0, 428.0, 985.0, 3123.0, 15538.0, 254604.0, 3865870.0, 43337.0, 6298.0, 1695.0, 662.0, 336.0, 205.0, 125.0, 84.0, 71.0, 39.0, 36.0, 29.0, 17.0, 13.0, 17.0, 6.0, 7.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-544.5, -529.046875, -513.59375, -498.140625, -482.6875, -467.234375, -451.78125, -436.328125, -420.875, -405.421875, -389.96875, -374.515625, -359.0625, -343.609375, -328.15625, -312.703125, -297.25, -281.796875, -266.34375, -250.890625, -235.4375, -219.984375, -204.53125, -189.078125, -173.625, -158.171875, -142.71875, -127.265625, -111.8125, -96.359375, -80.90625, -65.453125, -50.0, -34.546875, -19.09375, -3.640625, 11.8125, 27.265625, 42.71875, 58.171875, 73.625, 89.078125, 104.53125, 119.984375, 135.4375, 150.890625, 166.34375, 181.796875, 197.25, 212.703125, 228.15625, 243.609375, 259.0625, 274.515625, 289.96875, 305.421875, 320.875, 336.328125, 351.78125, 367.234375, 382.6875, 398.140625, 413.59375, 429.046875, 444.5]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 10.0, 11.0, 20.0, 27.0, 54.0, 76.0, 147.0, 183.0, 143.0, 125.0, 76.0, 45.0, 29.0, 20.0, 10.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1035.982177734375, -1013.8694458007812, -991.7567138671875, -969.6439208984375, -947.5311889648438, -925.41845703125, -903.3056640625, -881.1929321289062, -859.0802001953125, -836.9674682617188, -814.854736328125, -792.741943359375, -770.6292114257812, -748.5164794921875, -726.4036865234375, -704.2909545898438, -682.17822265625, -660.0654907226562, -637.9527587890625, -615.8399658203125, -593.7272338867188, -571.614501953125, -549.501708984375, -527.3889770507812, -505.2762451171875, -483.16351318359375, -461.0507507324219, -438.93798828125, -416.82525634765625, -394.7125244140625, -372.5997619628906, -350.48699951171875, -328.37420654296875, -306.261474609375, -284.1487121582031, -262.03594970703125, -239.9232177734375, -217.8104705810547, -195.69772338867188, -173.58497619628906, -151.47222900390625, -129.35948181152344, -107.24673461914062, -85.13398742675781, -63.021240234375, -40.90849304199219, -18.795745849609375, 3.3170013427734375, 25.42974853515625, 47.54249572753906, 69.65524291992188, 91.76799011230469, 113.8807373046875, 135.9934844970703, 158.10623168945312, 180.21897888183594, 202.33172607421875, 224.44447326660156, 246.55722045898438, 268.66998291015625, 290.78271484375, 312.89544677734375, 335.0082092285156, 357.1209716796875, 379.23370361328125]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 13.0, 7.0, 9.0, 9.0, 16.0, 24.0, 20.0, 21.0, 28.0, 29.0, 30.0, 44.0, 36.0, 33.0, 37.0, 52.0, 39.0, 45.0, 44.0, 46.0, 26.0, 41.0, 22.0, 34.0, 27.0, 25.0, 24.0, 30.0, 25.0, 22.0, 26.0, 22.0, 17.0, 11.0, 12.0, 7.0, 7.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-360.80126953125, -350.17242431640625, -339.5435485839844, -328.9147033691406, -318.2858581542969, -307.6570129394531, -297.02813720703125, -286.3992919921875, -275.77044677734375, -265.1416015625, -254.5127410888672, -243.88388061523438, -233.25503540039062, -222.6261749267578, -211.997314453125, -201.36846923828125, -190.73960876464844, -180.11074829101562, -169.48190307617188, -158.85304260253906, -148.2241973876953, -137.5953369140625, -126.96648406982422, -116.33763122558594, -105.70877838134766, -95.07992553710938, -84.4510726928711, -73.82221984863281, -63.193363189697266, -52.564510345458984, -41.93565368652344, -31.306800842285156, -20.677947998046875, -10.049094200134277, 0.5797595977783203, 11.208614349365234, 21.837467193603516, 32.4663200378418, 43.095176696777344, 53.724029541015625, 64.3528823852539, 74.98173522949219, 85.61058807373047, 96.23944091796875, 106.86830139160156, 117.49714660644531, 128.12600708007812, 138.75485229492188, 149.3837127685547, 160.0125732421875, 170.64141845703125, 181.27027893066406, 191.8991241455078, 202.52798461914062, 213.15682983398438, 223.7856903076172, 234.41455078125, 245.0434112548828, 255.67225646972656, 266.3011169433594, 276.9299621582031, 287.5588073730469, 298.18768310546875, 308.8165283203125, 319.44537353515625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 5.0, 12.0, 18.0, 25.0, 15.0, 27.0, 26.0, 24.0, 34.0, 36.0, 48.0, 41.0, 55.0, 51.0, 47.0, 55.0, 49.0, 46.0, 41.0, 44.0, 46.0, 39.0, 31.0, 22.0, 23.0, 24.0, 22.0, 15.0, 14.0, 15.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.875, -63.7060546875, -61.537109375, -59.3681640625, -57.19921875, -55.0302734375, -52.861328125, -50.6923828125, -48.5234375, -46.3544921875, -44.185546875, -42.0166015625, -39.84765625, -37.6787109375, -35.509765625, -33.3408203125, -31.171875, -29.0029296875, -26.833984375, -24.6650390625, -22.49609375, -20.3271484375, -18.158203125, -15.9892578125, -13.8203125, -11.6513671875, -9.482421875, -7.3134765625, -5.14453125, -2.9755859375, -0.806640625, 1.3623046875, 3.53125, 5.7001953125, 7.869140625, 10.0380859375, 12.20703125, 14.3759765625, 16.544921875, 18.7138671875, 20.8828125, 23.0517578125, 25.220703125, 27.3896484375, 29.55859375, 31.7275390625, 33.896484375, 36.0654296875, 38.234375, 40.4033203125, 42.572265625, 44.7412109375, 46.91015625, 49.0791015625, 51.248046875, 53.4169921875, 55.5859375, 57.7548828125, 59.923828125, 62.0927734375, 64.26171875, 66.4306640625, 68.599609375, 70.7685546875, 72.9375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 9.0, 24.0, 24.0, 26.0, 61.0, 92.0, 116.0, 193.0, 307.0, 477.0, 745.0, 1216.0, 1931.0, 3237.0, 5497.0, 9337.0, 16141.0, 28378.0, 52331.0, 104004.0, 236664.0, 308312.0, 132980.0, 65083.0, 34317.0, 19188.0, 11218.0, 6611.0, 3922.0, 2278.0, 1408.0, 876.0, 530.0, 344.0, 222.0, 137.0, 104.0, 66.0, 43.0, 32.0, 17.0, 17.0, 11.0, 3.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.7772216796875, -5.585693359375, -5.3941650390625, -5.20263671875, -5.0111083984375, -4.819580078125, -4.6280517578125, -4.4365234375, -4.2449951171875, -4.053466796875, -3.8619384765625, -3.67041015625, -3.4788818359375, -3.287353515625, -3.0958251953125, -2.904296875, -2.7127685546875, -2.521240234375, -2.3297119140625, -2.13818359375, -1.9466552734375, -1.755126953125, -1.5635986328125, -1.3720703125, -1.1805419921875, -0.989013671875, -0.7974853515625, -0.60595703125, -0.4144287109375, -0.222900390625, -0.0313720703125, 0.16015625, 0.3516845703125, 0.543212890625, 0.7347412109375, 0.92626953125, 1.1177978515625, 1.309326171875, 1.5008544921875, 1.6923828125, 1.8839111328125, 2.075439453125, 2.2669677734375, 2.45849609375, 2.6500244140625, 2.841552734375, 3.0330810546875, 3.224609375, 3.4161376953125, 3.607666015625, 3.7991943359375, 3.99072265625, 4.1822509765625, 4.373779296875, 4.5653076171875, 4.7568359375, 4.9483642578125, 5.139892578125, 5.3314208984375, 5.52294921875, 5.7144775390625, 5.906005859375, 6.0975341796875, 6.2890625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 9.0, 2.0, 10.0, 9.0, 14.0, 11.0, 10.0, 16.0, 16.0, 22.0, 26.0, 26.0, 21.0, 26.0, 40.0, 20.0, 37.0, 40.0, 43.0, 44.0, 39.0, 1069.0, 26.0, 45.0, 36.0, 28.0, 38.0, 32.0, 37.0, 27.0, 27.0, 22.0, 20.0, 25.0, 21.0, 15.0, 9.0, 11.0, 12.0, 13.0, 7.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-37.0625, -35.91455078125, -34.7666015625, -33.61865234375, -32.470703125, -31.32275390625, -30.1748046875, -29.02685546875, -27.87890625, -26.73095703125, -25.5830078125, -24.43505859375, -23.287109375, -22.13916015625, -20.9912109375, -19.84326171875, -18.6953125, -17.54736328125, -16.3994140625, -15.25146484375, -14.103515625, -12.95556640625, -11.8076171875, -10.65966796875, -9.51171875, -8.36376953125, -7.2158203125, -6.06787109375, -4.919921875, -3.77197265625, -2.6240234375, -1.47607421875, -0.328125, 0.81982421875, 1.9677734375, 3.11572265625, 4.263671875, 5.41162109375, 6.5595703125, 7.70751953125, 8.85546875, 10.00341796875, 11.1513671875, 12.29931640625, 13.447265625, 14.59521484375, 15.7431640625, 16.89111328125, 18.0390625, 19.18701171875, 20.3349609375, 21.48291015625, 22.630859375, 23.77880859375, 24.9267578125, 26.07470703125, 27.22265625, 28.37060546875, 29.5185546875, 30.66650390625, 31.814453125, 32.96240234375, 34.1103515625, 35.25830078125, 36.40625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 8.0, 8.0, 6.0, 23.0, 28.0, 31.0, 44.0, 65.0, 92.0, 149.0, 205.0, 293.0, 421.0, 658.0, 939.0, 1310.0, 1944.0, 2760.0, 4087.0, 6080.0, 8997.0, 13593.0, 20703.0, 32314.0, 51367.0, 82969.0, 137964.0, 1266599.0, 182550.0, 102953.0, 63368.0, 39496.0, 25479.0, 16042.0, 10892.0, 7141.0, 4886.0, 3365.0, 2276.0, 1534.0, 1085.0, 767.0, 497.0, 352.0, 224.0, 167.0, 143.0, 82.0, 57.0, 47.0, 29.0, 18.0, 16.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.537109375, -2.457122802734375, -2.37713623046875, -2.297149658203125, -2.2171630859375, -2.137176513671875, -2.05718994140625, -1.977203369140625, -1.897216796875, -1.817230224609375, -1.73724365234375, -1.657257080078125, -1.5772705078125, -1.497283935546875, -1.41729736328125, -1.337310791015625, -1.25732421875, -1.177337646484375, -1.09735107421875, -1.017364501953125, -0.9373779296875, -0.857391357421875, -0.77740478515625, -0.697418212890625, -0.617431640625, -0.537445068359375, -0.45745849609375, -0.377471923828125, -0.2974853515625, -0.217498779296875, -0.13751220703125, -0.057525634765625, 0.0224609375, 0.102447509765625, 0.18243408203125, 0.262420654296875, 0.3424072265625, 0.422393798828125, 0.50238037109375, 0.582366943359375, 0.662353515625, 0.742340087890625, 0.82232666015625, 0.902313232421875, 0.9822998046875, 1.062286376953125, 1.14227294921875, 1.222259521484375, 1.30224609375, 1.382232666015625, 1.46221923828125, 1.542205810546875, 1.6221923828125, 1.702178955078125, 1.78216552734375, 1.862152099609375, 1.942138671875, 2.022125244140625, 2.10211181640625, 2.182098388671875, 2.2620849609375, 2.342071533203125, 2.42205810546875, 2.502044677734375, 2.58203125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 15.0, 13.0, 24.0, 39.0, 63.0, 129.0, 270.0, 184.0, 98.0, 57.0, 22.0, 22.0, 12.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24341964721679688, -0.23464202880859375, -0.22586441040039062, -0.2170867919921875, -0.20830917358398438, -0.19953155517578125, -0.19075393676757812, -0.181976318359375, -0.17319869995117188, -0.16442108154296875, -0.15564346313476562, -0.1468658447265625, -0.13808822631835938, -0.12931060791015625, -0.12053298950195312, -0.11175537109375, -0.10297775268554688, -0.09420013427734375, -0.08542251586914062, -0.0766448974609375, -0.06786727905273438, -0.05908966064453125, -0.050312042236328125, -0.041534423828125, -0.032756805419921875, -0.02397918701171875, -0.015201568603515625, -0.0064239501953125, 0.002353668212890625, 0.01113128662109375, 0.019908905029296875, 0.0286865234375, 0.037464141845703125, 0.04624176025390625, 0.055019378662109375, 0.0637969970703125, 0.07257461547851562, 0.08135223388671875, 0.09012985229492188, 0.098907470703125, 0.10768508911132812, 0.11646270751953125, 0.12524032592773438, 0.1340179443359375, 0.14279556274414062, 0.15157318115234375, 0.16035079956054688, 0.16912841796875, 0.17790603637695312, 0.18668365478515625, 0.19546127319335938, 0.2042388916015625, 0.21301651000976562, 0.22179412841796875, 0.23057174682617188, 0.239349365234375, 0.24812698364257812, 0.25690460205078125, 0.2656822204589844, 0.2744598388671875, 0.2832374572753906, 0.29201507568359375, 0.3007926940917969, 0.3095703125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 11.0, 10.0, 19.0, 30.0, 61.0, 126.0, 475.0, 1047395.0, 200.0, 83.0, 44.0, 31.0, 18.0, 12.0, 6.0, 4.0, 6.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.65625, -9.3824462890625, -9.108642578125, -8.8348388671875, -8.56103515625, -8.2872314453125, -8.013427734375, -7.7396240234375, -7.4658203125, -7.1920166015625, -6.918212890625, -6.6444091796875, -6.37060546875, -6.0968017578125, -5.822998046875, -5.5491943359375, -5.275390625, -5.0015869140625, -4.727783203125, -4.4539794921875, -4.18017578125, -3.9063720703125, -3.632568359375, -3.3587646484375, -3.0849609375, -2.8111572265625, -2.537353515625, -2.2635498046875, -1.98974609375, -1.7159423828125, -1.442138671875, -1.1683349609375, -0.89453125, -0.6207275390625, -0.346923828125, -0.0731201171875, 0.20068359375, 0.4744873046875, 0.748291015625, 1.0220947265625, 1.2958984375, 1.5697021484375, 1.843505859375, 2.1173095703125, 2.39111328125, 2.6649169921875, 2.938720703125, 3.2125244140625, 3.486328125, 3.7601318359375, 4.033935546875, 4.3077392578125, 4.58154296875, 4.8553466796875, 5.129150390625, 5.4029541015625, 5.6767578125, 5.9505615234375, 6.224365234375, 6.4981689453125, 6.77197265625, 7.0457763671875, 7.319580078125, 7.5933837890625, 7.8671875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 499.0, 519.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1394769251346588, -0.09296469390392303, -0.04645247012376785, 5.97536563873291e-05, 0.04657198488712311, 0.09308421611785889, 0.13959643244743347, 0.18610867857933044, 0.23262089490890503, 0.2791331112384796, 0.3256453573703766, 0.37215757369995117, 0.41866981983184814, 0.46518203616142273, 0.5116942524909973, 0.5582064986228943, 0.6047186851501465, 0.6512309312820435, 0.6977431178092957, 0.7442553639411926, 0.7907676100730896, 0.8372797966003418, 0.8837920427322388, 0.9303042888641357, 0.9768165349960327, 1.0233287811279297, 1.0698410272598267, 1.1163532733917236, 1.162865400314331, 1.209377646446228, 1.255889892578125, 1.302402138710022, 1.3489142656326294, 1.3954265117645264, 1.4419387578964233, 1.4884510040283203, 1.5349631309509277, 1.5814753770828247, 1.6279876232147217, 1.6744998693466187, 1.7210121154785156, 1.7675243616104126, 1.8140366077423096, 1.860548734664917, 1.907060980796814, 1.953573226928711, 2.0000853538513184, 2.046597719192505, 2.0931098461151123, 2.1396219730377197, 2.1861343383789062, 2.2326464653015137, 2.2791588306427, 2.3256709575653076, 2.372183322906494, 2.4186954498291016, 2.465207815170288, 2.5117199420928955, 2.558232307434082, 2.6047444343566895, 2.651256799697876, 2.6977689266204834, 2.74428129196167, 2.7907934188842773, 2.8373055458068848]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 8.0, 9.0, 13.0, 9.0, 16.0, 18.0, 16.0, 16.0, 23.0, 23.0, 26.0, 39.0, 28.0, 36.0, 37.0, 33.0, 38.0, 39.0, 48.0, 37.0, 29.0, 39.0, 31.0, 47.0, 28.0, 30.0, 34.0, 33.0, 36.0, 23.0, 22.0, 16.0, 20.0, 14.0, 13.0, 11.0, 9.0, 11.0, 8.0, 6.0, 2.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.10227209329605103, -0.0990079864859581, -0.09574387967586517, -0.09247976541519165, -0.08921565860509872, -0.0859515517950058, -0.08268743753433228, -0.07942333072423935, -0.07615922391414642, -0.0728951171040535, -0.06963101029396057, -0.06636689603328705, -0.06310278922319412, -0.059838682413101196, -0.05657457187771797, -0.05331046134233475, -0.05004635453224182, -0.046782247722148895, -0.04351813718676567, -0.040254026651382446, -0.03698991984128952, -0.033725813031196594, -0.03046170249581337, -0.027197593823075294, -0.02393348515033722, -0.020669376477599144, -0.01740526780486107, -0.014141159132122993, -0.010877050459384918, -0.007612941786646843, -0.004348833113908768, -0.0010847244411706924, 0.002179384231567383, 0.005443492904305458, 0.008707601577043533, 0.011971710249781609, 0.015235818922519684, 0.01849992759525776, 0.021764036267995834, 0.02502814494073391, 0.028292253613471985, 0.03155636042356491, 0.034820470958948135, 0.03808458149433136, 0.041348688304424286, 0.04461279511451721, 0.047876905649900436, 0.05114101618528366, 0.05440512299537659, 0.05766922980546951, 0.06093334034085274, 0.06419745087623596, 0.06746155768632889, 0.07072566449642181, 0.07398977875709534, 0.07725388556718826, 0.08051799237728119, 0.08378209918737411, 0.08704620599746704, 0.09031032025814056, 0.09357442706823349, 0.09683853387832642, 0.10010264813899994, 0.10336675494909286, 0.10663086175918579]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 5.0, 12.0, 18.0, 25.0, 15.0, 27.0, 26.0, 24.0, 34.0, 35.0, 49.0, 41.0, 55.0, 51.0, 47.0, 55.0, 48.0, 47.0, 41.0, 44.0, 46.0, 39.0, 31.0, 22.0, 23.0, 24.0, 22.0, 15.0, 14.0, 15.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.875, -63.7060546875, -61.537109375, -59.3681640625, -57.19921875, -55.0302734375, -52.861328125, -50.6923828125, -48.5234375, -46.3544921875, -44.185546875, -42.0166015625, -39.84765625, -37.6787109375, -35.509765625, -33.3408203125, -31.171875, -29.0029296875, -26.833984375, -24.6650390625, -22.49609375, -20.3271484375, -18.158203125, -15.9892578125, -13.8203125, -11.6513671875, -9.482421875, -7.3134765625, -5.14453125, -2.9755859375, -0.806640625, 1.3623046875, 3.53125, 5.7001953125, 7.869140625, 10.0380859375, 12.20703125, 14.3759765625, 16.544921875, 18.7138671875, 20.8828125, 23.0517578125, 25.220703125, 27.3896484375, 29.55859375, 31.7275390625, 33.896484375, 36.0654296875, 38.234375, 40.4033203125, 42.572265625, 44.7412109375, 46.91015625, 49.0791015625, 51.248046875, 53.4169921875, 55.5859375, 57.7548828125, 59.923828125, 62.0927734375, 64.26171875, 66.4306640625, 68.599609375, 70.7685546875, 72.9375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 10.0, 9.0, 13.0, 20.0, 25.0, 48.0, 55.0, 86.0, 133.0, 146.0, 278.0, 417.0, 579.0, 867.0, 1253.0, 1912.0, 2903.0, 4417.0, 6943.0, 11785.0, 23658.0, 88198.0, 723602.0, 119874.0, 26972.0, 12876.0, 7493.0, 4657.0, 3107.0, 2030.0, 1342.0, 918.0, 638.0, 413.0, 246.0, 191.0, 139.0, 97.0, 57.0, 48.0, 18.0, 26.0, 20.0, 11.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-83.625, -81.2060546875, -78.787109375, -76.3681640625, -73.94921875, -71.5302734375, -69.111328125, -66.6923828125, -64.2734375, -61.8544921875, -59.435546875, -57.0166015625, -54.59765625, -52.1787109375, -49.759765625, -47.3408203125, -44.921875, -42.5029296875, -40.083984375, -37.6650390625, -35.24609375, -32.8271484375, -30.408203125, -27.9892578125, -25.5703125, -23.1513671875, -20.732421875, -18.3134765625, -15.89453125, -13.4755859375, -11.056640625, -8.6376953125, -6.21875, -3.7998046875, -1.380859375, 1.0380859375, 3.45703125, 5.8759765625, 8.294921875, 10.7138671875, 13.1328125, 15.5517578125, 17.970703125, 20.3896484375, 22.80859375, 25.2275390625, 27.646484375, 30.0654296875, 32.484375, 34.9033203125, 37.322265625, 39.7412109375, 42.16015625, 44.5791015625, 46.998046875, 49.4169921875, 51.8359375, 54.2548828125, 56.673828125, 59.0927734375, 61.51171875, 63.9306640625, 66.349609375, 68.7685546875, 71.1875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 6.0, 9.0, 8.0, 10.0, 10.0, 21.0, 23.0, 25.0, 15.0, 24.0, 38.0, 40.0, 44.0, 41.0, 49.0, 52.0, 69.0, 210.0, 1785.0, 98.0, 48.0, 60.0, 56.0, 47.0, 28.0, 39.0, 36.0, 25.0, 23.0, 17.0, 11.0, 19.0, 9.0, 7.0, 6.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.125, -187.896484375, -181.66796875, -175.439453125, -169.2109375, -162.982421875, -156.75390625, -150.525390625, -144.296875, -138.068359375, -131.83984375, -125.611328125, -119.3828125, -113.154296875, -106.92578125, -100.697265625, -94.46875, -88.240234375, -82.01171875, -75.783203125, -69.5546875, -63.326171875, -57.09765625, -50.869140625, -44.640625, -38.412109375, -32.18359375, -25.955078125, -19.7265625, -13.498046875, -7.26953125, -1.041015625, 5.1875, 11.416015625, 17.64453125, 23.873046875, 30.1015625, 36.330078125, 42.55859375, 48.787109375, 55.015625, 61.244140625, 67.47265625, 73.701171875, 79.9296875, 86.158203125, 92.38671875, 98.615234375, 104.84375, 111.072265625, 117.30078125, 123.529296875, 129.7578125, 135.986328125, 142.21484375, 148.443359375, 154.671875, 160.900390625, 167.12890625, 173.357421875, 179.5859375, 185.814453125, 192.04296875, 198.271484375, 204.5]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 10.0, 15.0, 17.0, 31.0, 50.0, 96.0, 199.0, 669.0, 2814.0, 22879.0, 3062961.0, 49999.0, 4429.0, 930.0, 264.0, 133.0, 61.0, 36.0, 25.0, 25.0, 15.0, 10.0, 6.0, 5.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-984.5, -954.328125, -924.15625, -893.984375, -863.8125, -833.640625, -803.46875, -773.296875, -743.125, -712.953125, -682.78125, -652.609375, -622.4375, -592.265625, -562.09375, -531.921875, -501.75, -471.578125, -441.40625, -411.234375, -381.0625, -350.890625, -320.71875, -290.546875, -260.375, -230.203125, -200.03125, -169.859375, -139.6875, -109.515625, -79.34375, -49.171875, -19.0, 11.171875, 41.34375, 71.515625, 101.6875, 131.859375, 162.03125, 192.203125, 222.375, 252.546875, 282.71875, 312.890625, 343.0625, 373.234375, 403.40625, 433.578125, 463.75, 493.921875, 524.09375, 554.265625, 584.4375, 614.609375, 644.78125, 674.953125, 705.125, 735.296875, 765.46875, 795.640625, 825.8125, 855.984375, 886.15625, 916.328125, 946.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 8.0, 132.0, 792.0, 76.0, 8.0, 3.0], "bins": [-7885.18798828125, -7754.6591796875, -7624.13037109375, -7493.6015625, -7363.072265625, -7232.54345703125, -7102.0146484375, -6971.48583984375, -6840.95703125, -6710.42822265625, -6579.8994140625, -6449.3701171875, -6318.84130859375, -6188.3125, -6057.78369140625, -5927.2548828125, -5796.7255859375, -5666.19677734375, -5535.66796875, -5405.138671875, -5274.60986328125, -5144.0810546875, -5013.55224609375, -4883.0234375, -4752.49462890625, -4621.9658203125, -4491.43701171875, -4360.908203125, -4230.37890625, -4099.85009765625, -3969.3212890625, -3838.79248046875, -3708.26416015625, -3577.7353515625, -3447.206298828125, -3316.677490234375, -3186.148681640625, -3055.61962890625, -2925.0908203125, -2794.56201171875, -2664.032958984375, -2533.504150390625, -2402.97509765625, -2272.4462890625, -2141.91748046875, -2011.3885498046875, -1880.859619140625, -1750.330810546875, -1619.802001953125, -1489.2730712890625, -1358.7442626953125, -1228.21533203125, -1097.6865234375, -967.1575927734375, -836.628662109375, -706.0997924804688, -575.5709228515625, -445.04205322265625, -314.5131530761719, -183.9842529296875, -53.45538330078125, 77.073486328125, 207.6024169921875, 338.13128662109375, 468.6601867675781]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 5.0, 3.0, 5.0, 6.0, 6.0, 9.0, 6.0, 16.0, 13.0, 22.0, 18.0, 17.0, 20.0, 23.0, 39.0, 40.0, 27.0, 36.0, 25.0, 27.0, 42.0, 30.0, 44.0, 42.0, 31.0, 37.0, 48.0, 44.0, 39.0, 30.0, 35.0, 36.0, 34.0, 12.0, 29.0, 16.0, 16.0, 14.0, 17.0, 11.0, 7.0, 8.0, 7.0, 4.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-421.03778076171875, -405.5781555175781, -390.1184997558594, -374.65887451171875, -359.19921875, -343.7395935058594, -328.27996826171875, -312.8203125, -297.3606872558594, -281.90106201171875, -266.44140625, -250.98178100585938, -235.5221405029297, -220.0625, -204.60287475585938, -189.1432342529297, -173.68359375, -158.2239532470703, -142.76431274414062, -127.3046875, -111.84504699707031, -96.38540649414062, -80.92577362060547, -65.46614074707031, -50.006500244140625, -34.5468635559082, -19.08722686767578, -3.6275901794433594, 11.832046508789062, 27.29168701171875, 42.751319885253906, 58.21095275878906, 73.67059326171875, 89.13023376464844, 104.5898666381836, 120.04949951171875, 135.50914001464844, 150.96878051757812, 166.42840576171875, 181.88804626464844, 197.34768676757812, 212.8073272705078, 228.2669677734375, 243.72659301757812, 259.18621826171875, 274.6458740234375, 290.1054992675781, 305.56512451171875, 321.0247802734375, 336.4844055175781, 351.9440612792969, 367.4036865234375, 382.86334228515625, 398.3229675292969, 413.7825927734375, 429.24224853515625, 444.7018737792969, 460.1614990234375, 475.62115478515625, 491.0807800292969, 506.5404052734375, 522.0000610351562, 537.459716796875, 552.9193115234375, 568.3789672851562]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 10.0, 4.0, 10.0, 10.0, 19.0, 16.0, 21.0, 25.0, 23.0, 38.0, 39.0, 26.0, 32.0, 51.0, 45.0, 48.0, 55.0, 49.0, 57.0, 45.0, 46.0, 32.0, 41.0, 39.0, 26.0, 28.0, 32.0, 26.0, 20.0, 16.0, 11.0, 10.0, 13.0, 16.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.25, -61.9033203125, -59.556640625, -57.2099609375, -54.86328125, -52.5166015625, -50.169921875, -47.8232421875, -45.4765625, -43.1298828125, -40.783203125, -38.4365234375, -36.08984375, -33.7431640625, -31.396484375, -29.0498046875, -26.703125, -24.3564453125, -22.009765625, -19.6630859375, -17.31640625, -14.9697265625, -12.623046875, -10.2763671875, -7.9296875, -5.5830078125, -3.236328125, -0.8896484375, 1.45703125, 3.8037109375, 6.150390625, 8.4970703125, 10.84375, 13.1904296875, 15.537109375, 17.8837890625, 20.23046875, 22.5771484375, 24.923828125, 27.2705078125, 29.6171875, 31.9638671875, 34.310546875, 36.6572265625, 39.00390625, 41.3505859375, 43.697265625, 46.0439453125, 48.390625, 50.7373046875, 53.083984375, 55.4306640625, 57.77734375, 60.1240234375, 62.470703125, 64.8173828125, 67.1640625, 69.5107421875, 71.857421875, 74.2041015625, 76.55078125, 78.8974609375, 81.244140625, 83.5908203125, 85.9375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 8.0, 19.0, 20.0, 34.0, 61.0, 75.0, 95.0, 161.0, 240.0, 357.0, 573.0, 958.0, 1659.0, 3226.0, 6864.0, 17609.0, 141823.0, 3487828.0, 487166.0, 27367.0, 8979.0, 3984.0, 2068.0, 1211.0, 651.0, 405.0, 263.0, 178.0, 125.0, 76.0, 58.0, 41.0, 30.0, 14.0, 15.0, 13.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-178.625, -172.603515625, -166.58203125, -160.560546875, -154.5390625, -148.517578125, -142.49609375, -136.474609375, -130.453125, -124.431640625, -118.41015625, -112.388671875, -106.3671875, -100.345703125, -94.32421875, -88.302734375, -82.28125, -76.259765625, -70.23828125, -64.216796875, -58.1953125, -52.173828125, -46.15234375, -40.130859375, -34.109375, -28.087890625, -22.06640625, -16.044921875, -10.0234375, -4.001953125, 2.01953125, 8.041015625, 14.0625, 20.083984375, 26.10546875, 32.126953125, 38.1484375, 44.169921875, 50.19140625, 56.212890625, 62.234375, 68.255859375, 74.27734375, 80.298828125, 86.3203125, 92.341796875, 98.36328125, 104.384765625, 110.40625, 116.427734375, 122.44921875, 128.470703125, 134.4921875, 140.513671875, 146.53515625, 152.556640625, 158.578125, 164.599609375, 170.62109375, 176.642578125, 182.6640625, 188.685546875, 194.70703125, 200.728515625, 206.75]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 11.0, 7.0, 13.0, 20.0, 30.0, 40.0, 70.0, 83.0, 231.0, 524.0, 1295.0, 995.0, 401.0, 143.0, 85.0, 39.0, 16.0, 25.0, 7.0, 13.0, 9.0, 10.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.125, -131.802734375, -125.48046875, -119.158203125, -112.8359375, -106.513671875, -100.19140625, -93.869140625, -87.546875, -81.224609375, -74.90234375, -68.580078125, -62.2578125, -55.935546875, -49.61328125, -43.291015625, -36.96875, -30.646484375, -24.32421875, -18.001953125, -11.6796875, -5.357421875, 0.96484375, 7.287109375, 13.609375, 19.931640625, 26.25390625, 32.576171875, 38.8984375, 45.220703125, 51.54296875, 57.865234375, 64.1875, 70.509765625, 76.83203125, 83.154296875, 89.4765625, 95.798828125, 102.12109375, 108.443359375, 114.765625, 121.087890625, 127.41015625, 133.732421875, 140.0546875, 146.376953125, 152.69921875, 159.021484375, 165.34375, 171.666015625, 177.98828125, 184.310546875, 190.6328125, 196.955078125, 203.27734375, 209.599609375, 215.921875, 222.244140625, 228.56640625, 234.888671875, 241.2109375, 247.533203125, 253.85546875, 260.177734375, 266.5]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 11.0, 10.0, 15.0, 33.0, 44.0, 55.0, 108.0, 143.0, 296.0, 771.0, 3681.0, 43783.0, 4076398.0, 62654.0, 4554.0, 895.0, 338.0, 180.0, 97.0, 85.0, 44.0, 37.0, 23.0, 12.0, 9.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1044.0, -1018.875, -993.75, -968.625, -943.5, -918.375, -893.25, -868.125, -843.0, -817.875, -792.75, -767.625, -742.5, -717.375, -692.25, -667.125, -642.0, -616.875, -591.75, -566.625, -541.5, -516.375, -491.25, -466.125, -441.0, -415.875, -390.75, -365.625, -340.5, -315.375, -290.25, -265.125, -240.0, -214.875, -189.75, -164.625, -139.5, -114.375, -89.25, -64.125, -39.0, -13.875, 11.25, 36.375, 61.5, 86.625, 111.75, 136.875, 162.0, 187.125, 212.25, 237.375, 262.5, 287.625, 312.75, 337.875, 363.0, 388.125, 413.25, 438.375, 463.5, 488.625, 513.75, 538.875, 564.0]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 14.0, 7.0, 17.0, 23.0, 35.0, 62.0, 88.0, 109.0, 191.0, 167.0, 90.0, 78.0, 43.0, 23.0, 15.0, 15.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-940.9987182617188, -920.4614868164062, -899.9242553710938, -879.3870239257812, -858.8497924804688, -838.3125610351562, -817.7753295898438, -797.2381591796875, -776.700927734375, -756.1636962890625, -735.62646484375, -715.0892333984375, -694.552001953125, -674.0147705078125, -653.4775390625, -632.9403076171875, -612.403076171875, -591.8658447265625, -571.32861328125, -550.7913818359375, -530.254150390625, -509.7169189453125, -489.1797180175781, -468.6424865722656, -448.1052551269531, -427.5680236816406, -407.0307922363281, -386.4935607910156, -365.95635986328125, -345.41912841796875, -324.88189697265625, -304.34466552734375, -283.8074035644531, -263.2701721191406, -242.73294067382812, -222.1957244873047, -201.6584930419922, -181.1212615966797, -160.58404541015625, -140.04681396484375, -119.50958251953125, -98.97235107421875, -78.43512725830078, -57.89789962768555, -37.36067199707031, -16.823440551757812, 3.7137832641601562, 24.251007080078125, 44.788238525390625, 65.32546997070312, 85.8626937866211, 106.39991760253906, 126.93714904785156, 147.47438049316406, 168.0115966796875, 188.548828125, 209.0860595703125, 229.623291015625, 250.1605224609375, 270.69775390625, 291.2349853515625, 311.772216796875, 332.3094177246094, 352.8466491699219, 373.3838806152344]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 6.0, 13.0, 11.0, 20.0, 26.0, 24.0, 18.0, 13.0, 18.0, 28.0, 39.0, 44.0, 39.0, 41.0, 51.0, 35.0, 49.0, 41.0, 39.0, 46.0, 41.0, 41.0, 38.0, 45.0, 31.0, 32.0, 21.0, 16.0, 23.0, 20.0, 20.0, 8.0, 9.0, 13.0, 10.0, 5.0, 12.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-401.249267578125, -389.5586853027344, -377.8680725097656, -366.177490234375, -354.48687744140625, -342.7962951660156, -331.105712890625, -319.41510009765625, -307.7245178222656, -296.033935546875, -284.34332275390625, -272.6527404785156, -260.962158203125, -249.27154541015625, -237.58096313476562, -225.89036560058594, -214.19976806640625, -202.50917053222656, -190.81857299804688, -179.12799072265625, -167.43739318847656, -155.74679565429688, -144.05621337890625, -132.36561584472656, -120.67501831054688, -108.98442077636719, -97.29383087158203, -85.60324096679688, -73.91264343261719, -62.222049713134766, -50.531455993652344, -38.84086608886719, -27.1502685546875, -15.459674835205078, -3.7690811157226562, 7.921512603759766, 19.612106323242188, 31.30270004272461, 42.99329376220703, 54.68388366699219, 66.37448120117188, 78.06507873535156, 89.75566864013672, 101.44625854492188, 113.13685607910156, 124.82745361328125, 136.51803588867188, 148.20863342285156, 159.89923095703125, 171.58982849121094, 183.28042602539062, 194.97100830078125, 206.66160583496094, 218.35220336914062, 230.04278564453125, 241.73338317871094, 253.42398071289062, 265.11456298828125, 276.80517578125, 288.4957580566406, 300.18634033203125, 311.876953125, 323.5675354003906, 335.25811767578125, 346.94873046875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 6.0, 1.0, 5.0, 2.0, 4.0, 3.0, 13.0, 12.0, 5.0, 13.0, 14.0, 21.0, 26.0, 24.0, 26.0, 39.0, 48.0, 38.0, 35.0, 55.0, 47.0, 43.0, 54.0, 51.0, 37.0, 40.0, 38.0, 45.0, 26.0, 34.0, 32.0, 18.0, 33.0, 25.0, 18.0, 18.0, 10.0, 5.0, 16.0, 7.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.3125, -61.0986328125, -58.884765625, -56.6708984375, -54.45703125, -52.2431640625, -50.029296875, -47.8154296875, -45.6015625, -43.3876953125, -41.173828125, -38.9599609375, -36.74609375, -34.5322265625, -32.318359375, -30.1044921875, -27.890625, -25.6767578125, -23.462890625, -21.2490234375, -19.03515625, -16.8212890625, -14.607421875, -12.3935546875, -10.1796875, -7.9658203125, -5.751953125, -3.5380859375, -1.32421875, 0.8896484375, 3.103515625, 5.3173828125, 7.53125, 9.7451171875, 11.958984375, 14.1728515625, 16.38671875, 18.6005859375, 20.814453125, 23.0283203125, 25.2421875, 27.4560546875, 29.669921875, 31.8837890625, 34.09765625, 36.3115234375, 38.525390625, 40.7392578125, 42.953125, 45.1669921875, 47.380859375, 49.5947265625, 51.80859375, 54.0224609375, 56.236328125, 58.4501953125, 60.6640625, 62.8779296875, 65.091796875, 67.3056640625, 69.51953125, 71.7333984375, 73.947265625, 76.1611328125, 78.375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 6.0, 6.0, 17.0, 16.0, 34.0, 30.0, 52.0, 52.0, 79.0, 117.0, 155.0, 230.0, 325.0, 461.0, 714.0, 1177.0, 1863.0, 3277.0, 6073.0, 11461.0, 23822.0, 52694.0, 130821.0, 395140.0, 253861.0, 88874.0, 38126.0, 17944.0, 9007.0, 4906.0, 2662.0, 1664.0, 958.0, 633.0, 411.0, 254.0, 161.0, 129.0, 95.0, 64.0, 50.0, 39.0, 23.0, 15.0, 16.0, 13.0, 7.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-11.5625, -11.220458984375, -10.87841796875, -10.536376953125, -10.1943359375, -9.852294921875, -9.51025390625, -9.168212890625, -8.826171875, -8.484130859375, -8.14208984375, -7.800048828125, -7.4580078125, -7.115966796875, -6.77392578125, -6.431884765625, -6.08984375, -5.747802734375, -5.40576171875, -5.063720703125, -4.7216796875, -4.379638671875, -4.03759765625, -3.695556640625, -3.353515625, -3.011474609375, -2.66943359375, -2.327392578125, -1.9853515625, -1.643310546875, -1.30126953125, -0.959228515625, -0.6171875, -0.275146484375, 0.06689453125, 0.408935546875, 0.7509765625, 1.093017578125, 1.43505859375, 1.777099609375, 2.119140625, 2.461181640625, 2.80322265625, 3.145263671875, 3.4873046875, 3.829345703125, 4.17138671875, 4.513427734375, 4.85546875, 5.197509765625, 5.53955078125, 5.881591796875, 6.2236328125, 6.565673828125, 6.90771484375, 7.249755859375, 7.591796875, 7.933837890625, 8.27587890625, 8.617919921875, 8.9599609375, 9.302001953125, 9.64404296875, 9.986083984375, 10.328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 6.0, 9.0, 7.0, 19.0, 13.0, 14.0, 15.0, 23.0, 15.0, 27.0, 22.0, 22.0, 25.0, 42.0, 29.0, 26.0, 25.0, 39.0, 35.0, 1058.0, 56.0, 34.0, 46.0, 32.0, 38.0, 33.0, 29.0, 36.0, 22.0, 35.0, 27.0, 14.0, 26.0, 14.0, 18.0, 7.0, 21.0, 11.0, 5.0, 6.0, 5.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.65625, -37.44091796875, -36.2255859375, -35.01025390625, -33.794921875, -32.57958984375, -31.3642578125, -30.14892578125, -28.93359375, -27.71826171875, -26.5029296875, -25.28759765625, -24.072265625, -22.85693359375, -21.6416015625, -20.42626953125, -19.2109375, -17.99560546875, -16.7802734375, -15.56494140625, -14.349609375, -13.13427734375, -11.9189453125, -10.70361328125, -9.48828125, -8.27294921875, -7.0576171875, -5.84228515625, -4.626953125, -3.41162109375, -2.1962890625, -0.98095703125, 0.234375, 1.44970703125, 2.6650390625, 3.88037109375, 5.095703125, 6.31103515625, 7.5263671875, 8.74169921875, 9.95703125, 11.17236328125, 12.3876953125, 13.60302734375, 14.818359375, 16.03369140625, 17.2490234375, 18.46435546875, 19.6796875, 20.89501953125, 22.1103515625, 23.32568359375, 24.541015625, 25.75634765625, 26.9716796875, 28.18701171875, 29.40234375, 30.61767578125, 31.8330078125, 33.04833984375, 34.263671875, 35.47900390625, 36.6943359375, 37.90966796875, 39.125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 14.0, 18.0, 18.0, 45.0, 68.0, 90.0, 122.0, 184.0, 293.0, 417.0, 689.0, 1014.0, 1582.0, 2450.0, 3958.0, 6318.0, 10027.0, 16391.0, 27223.0, 46047.0, 79056.0, 143782.0, 1246009.0, 243599.0, 110950.0, 62377.0, 36580.0, 22021.0, 13398.0, 8129.0, 5156.0, 3168.0, 2076.0, 1336.0, 864.0, 599.0, 344.0, 247.0, 158.0, 103.0, 61.0, 56.0, 27.0, 15.0, 15.0, 18.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.677734375, -3.565582275390625, -3.45343017578125, -3.341278076171875, -3.2291259765625, -3.116973876953125, -3.00482177734375, -2.892669677734375, -2.780517578125, -2.668365478515625, -2.55621337890625, -2.444061279296875, -2.3319091796875, -2.219757080078125, -2.10760498046875, -1.995452880859375, -1.88330078125, -1.771148681640625, -1.65899658203125, -1.546844482421875, -1.4346923828125, -1.322540283203125, -1.21038818359375, -1.098236083984375, -0.986083984375, -0.873931884765625, -0.76177978515625, -0.649627685546875, -0.5374755859375, -0.425323486328125, -0.31317138671875, -0.201019287109375, -0.0888671875, 0.023284912109375, 0.13543701171875, 0.247589111328125, 0.3597412109375, 0.471893310546875, 0.58404541015625, 0.696197509765625, 0.808349609375, 0.920501708984375, 1.03265380859375, 1.144805908203125, 1.2569580078125, 1.369110107421875, 1.48126220703125, 1.593414306640625, 1.70556640625, 1.817718505859375, 1.92987060546875, 2.042022705078125, 2.1541748046875, 2.266326904296875, 2.37847900390625, 2.490631103515625, 2.602783203125, 2.714935302734375, 2.82708740234375, 2.939239501953125, 3.0513916015625, 3.163543701171875, 3.27569580078125, 3.387847900390625, 3.5]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 11.0, 12.0, 21.0, 31.0, 57.0, 122.0, 364.0, 159.0, 76.0, 45.0, 23.0, 15.0, 15.0, 10.0, 4.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82421875, -0.7933197021484375, -0.762420654296875, -0.7315216064453125, -0.70062255859375, -0.6697235107421875, -0.638824462890625, -0.6079254150390625, -0.5770263671875, -0.5461273193359375, -0.515228271484375, -0.4843292236328125, -0.45343017578125, -0.4225311279296875, -0.391632080078125, -0.3607330322265625, -0.329833984375, -0.2989349365234375, -0.268035888671875, -0.2371368408203125, -0.20623779296875, -0.1753387451171875, -0.144439697265625, -0.1135406494140625, -0.0826416015625, -0.0517425537109375, -0.020843505859375, 0.0100555419921875, 0.04095458984375, 0.0718536376953125, 0.102752685546875, 0.1336517333984375, 0.16455078125, 0.1954498291015625, 0.226348876953125, 0.2572479248046875, 0.28814697265625, 0.3190460205078125, 0.349945068359375, 0.3808441162109375, 0.4117431640625, 0.4426422119140625, 0.473541259765625, 0.5044403076171875, 0.53533935546875, 0.5662384033203125, 0.597137451171875, 0.6280364990234375, 0.658935546875, 0.6898345947265625, 0.720733642578125, 0.7516326904296875, 0.78253173828125, 0.8134307861328125, 0.844329833984375, 0.8752288818359375, 0.9061279296875, 0.9370269775390625, 0.967926025390625, 0.9988250732421875, 1.02972412109375, 1.0606231689453125, 1.091522216796875, 1.1224212646484375, 1.1533203125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 13.0, 21.0, 25.0, 53.0, 108.0, 315.0, 1047629.0, 184.0, 71.0, 33.0, 21.0, 14.0, 13.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.40625, -35.4306640625, -34.455078125, -33.4794921875, -32.50390625, -31.5283203125, -30.552734375, -29.5771484375, -28.6015625, -27.6259765625, -26.650390625, -25.6748046875, -24.69921875, -23.7236328125, -22.748046875, -21.7724609375, -20.796875, -19.8212890625, -18.845703125, -17.8701171875, -16.89453125, -15.9189453125, -14.943359375, -13.9677734375, -12.9921875, -12.0166015625, -11.041015625, -10.0654296875, -9.08984375, -8.1142578125, -7.138671875, -6.1630859375, -5.1875, -4.2119140625, -3.236328125, -2.2607421875, -1.28515625, -0.3095703125, 0.666015625, 1.6416015625, 2.6171875, 3.5927734375, 4.568359375, 5.5439453125, 6.51953125, 7.4951171875, 8.470703125, 9.4462890625, 10.421875, 11.3974609375, 12.373046875, 13.3486328125, 14.32421875, 15.2998046875, 16.275390625, 17.2509765625, 18.2265625, 19.2021484375, 20.177734375, 21.1533203125, 22.12890625, 23.1044921875, 24.080078125, 25.0556640625, 26.03125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [948.0, 74.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21622787415981293, 0.04361291229724884, 0.3034536838531494, 0.5632944703102112, 0.823135256767273, 1.08297598361969, 1.3428168296813965, 1.602657675743103, 1.86249840259552, 2.1223392486572266, 2.3821799755096436, 2.6420207023620605, 2.9018616676330566, 3.1617021560668945, 3.4215431213378906, 3.6813840866088867, 3.9412248134613037, 4.201065540313721, 4.460906505584717, 4.720746994018555, 4.980587959289551, 5.240428924560547, 5.500269412994385, 5.760110378265381, 6.019950866699219, 6.279791831970215, 6.539632320404053, 6.799473285675049, 7.059313774108887, 7.319154739379883, 7.578995704650879, 7.838836669921875, 8.098676681518555, 8.35851764678955, 8.618358612060547, 8.878198623657227, 9.138039588928223, 9.397880554199219, 9.657721519470215, 9.917562484741211, 10.17740249633789, 10.437243461608887, 10.697084426879883, 10.956924438476562, 11.216765403747559, 11.476606369018555, 11.73644733428955, 11.996288299560547, 12.256129264831543, 12.515970230102539, 12.775811195373535, 13.035651206970215, 13.295492172241211, 13.555333137512207, 13.815174102783203, 14.0750150680542, 14.334856033325195, 14.594696998596191, 14.854537963867188, 15.114377975463867, 15.374218940734863, 15.63405990600586, 15.893900871276855, 16.15374183654785, 16.41358184814453]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 7.0, 12.0, 17.0, 17.0, 20.0, 19.0, 18.0, 25.0, 25.0, 27.0, 23.0, 39.0, 36.0, 30.0, 29.0, 37.0, 52.0, 43.0, 42.0, 40.0, 39.0, 33.0, 32.0, 30.0, 26.0, 38.0, 34.0, 22.0, 19.0, 27.0, 16.0, 11.0, 10.0, 11.0, 11.0, 11.0, 7.0, 5.0, 3.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.88971346616745, -0.8618452548980713, -0.8339771032333374, -0.8061088919639587, -0.7782406806945801, -0.7503724694252014, -0.7225042581558228, -0.6946361064910889, -0.6667678952217102, -0.6388996839523315, -0.6110315322875977, -0.583163321018219, -0.5552951097488403, -0.5274268984794617, -0.4995587170124054, -0.4716905355453491, -0.44382232427597046, -0.4159541130065918, -0.3880859315395355, -0.36021775007247925, -0.3323495388031006, -0.3044813275337219, -0.27661314606666565, -0.24874494969844818, -0.2208767533302307, -0.19300855696201324, -0.16514036059379578, -0.1372721642255783, -0.10940396785736084, -0.08153577148914337, -0.0536675751209259, -0.025799378752708435, 0.002068758010864258, 0.029936954379081726, 0.057805150747299194, 0.08567334711551666, 0.11354154348373413, 0.1414097398519516, 0.16927793622016907, 0.19714613258838654, 0.225014328956604, 0.25288254022598267, 0.28075072169303894, 0.3086189031600952, 0.3364871144294739, 0.36435532569885254, 0.3922235071659088, 0.4200916886329651, 0.44795989990234375, 0.4758281111717224, 0.5036963224411011, 0.531564474105835, 0.5594326853752136, 0.5873008966445923, 0.6151690483093262, 0.6430372595787048, 0.6709054708480835, 0.6987736821174622, 0.7266418933868408, 0.7545100450515747, 0.7823782563209534, 0.810246467590332, 0.8381146192550659, 0.8659828305244446, 0.8938510417938232]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 6.0, 1.0, 5.0, 2.0, 4.0, 3.0, 13.0, 12.0, 5.0, 13.0, 14.0, 21.0, 26.0, 24.0, 26.0, 39.0, 48.0, 38.0, 35.0, 55.0, 47.0, 43.0, 54.0, 51.0, 37.0, 40.0, 38.0, 45.0, 26.0, 34.0, 32.0, 18.0, 33.0, 25.0, 18.0, 18.0, 10.0, 5.0, 16.0, 7.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.3125, -61.0986328125, -58.884765625, -56.6708984375, -54.45703125, -52.2431640625, -50.029296875, -47.8154296875, -45.6015625, -43.3876953125, -41.173828125, -38.9599609375, -36.74609375, -34.5322265625, -32.318359375, -30.1044921875, -27.890625, -25.6767578125, -23.462890625, -21.2490234375, -19.03515625, -16.8212890625, -14.607421875, -12.3935546875, -10.1796875, -7.9658203125, -5.751953125, -3.5380859375, -1.32421875, 0.8896484375, 3.103515625, 5.3173828125, 7.53125, 9.7451171875, 11.958984375, 14.1728515625, 16.38671875, 18.6005859375, 20.814453125, 23.0283203125, 25.2421875, 27.4560546875, 29.669921875, 31.8837890625, 34.09765625, 36.3115234375, 38.525390625, 40.7392578125, 42.953125, 45.1669921875, 47.380859375, 49.5947265625, 51.80859375, 54.0224609375, 56.236328125, 58.4501953125, 60.6640625, 62.8779296875, 65.091796875, 67.3056640625, 69.51953125, 71.7333984375, 73.947265625, 76.1611328125, 78.375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 13.0, 10.0, 16.0, 20.0, 37.0, 32.0, 56.0, 61.0, 77.0, 110.0, 147.0, 222.0, 229.0, 358.0, 489.0, 641.0, 851.0, 1218.0, 1692.0, 2282.0, 3347.0, 5457.0, 14902.0, 203004.0, 765938.0, 26932.0, 7110.0, 3834.0, 2578.0, 1863.0, 1244.0, 968.0, 701.0, 545.0, 398.0, 282.0, 220.0, 161.0, 131.0, 95.0, 65.0, 63.0, 38.0, 27.0, 29.0, 17.0, 8.0, 16.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-120.375, -116.384765625, -112.39453125, -108.404296875, -104.4140625, -100.423828125, -96.43359375, -92.443359375, -88.453125, -84.462890625, -80.47265625, -76.482421875, -72.4921875, -68.501953125, -64.51171875, -60.521484375, -56.53125, -52.541015625, -48.55078125, -44.560546875, -40.5703125, -36.580078125, -32.58984375, -28.599609375, -24.609375, -20.619140625, -16.62890625, -12.638671875, -8.6484375, -4.658203125, -0.66796875, 3.322265625, 7.3125, 11.302734375, 15.29296875, 19.283203125, 23.2734375, 27.263671875, 31.25390625, 35.244140625, 39.234375, 43.224609375, 47.21484375, 51.205078125, 55.1953125, 59.185546875, 63.17578125, 67.166015625, 71.15625, 75.146484375, 79.13671875, 83.126953125, 87.1171875, 91.107421875, 95.09765625, 99.087890625, 103.078125, 107.068359375, 111.05859375, 115.048828125, 119.0390625, 123.029296875, 127.01953125, 131.009765625, 135.0]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 2.0, 7.0, 6.0, 11.0, 8.0, 12.0, 18.0, 15.0, 15.0, 25.0, 27.0, 22.0, 33.0, 36.0, 50.0, 44.0, 54.0, 55.0, 105.0, 1914.0, 103.0, 61.0, 52.0, 70.0, 42.0, 36.0, 17.0, 24.0, 26.0, 25.0, 30.0, 15.0, 15.0, 16.0, 11.0, 8.0, 9.0, 3.0, 3.0, 5.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-229.5, -222.646484375, -215.79296875, -208.939453125, -202.0859375, -195.232421875, -188.37890625, -181.525390625, -174.671875, -167.818359375, -160.96484375, -154.111328125, -147.2578125, -140.404296875, -133.55078125, -126.697265625, -119.84375, -112.990234375, -106.13671875, -99.283203125, -92.4296875, -85.576171875, -78.72265625, -71.869140625, -65.015625, -58.162109375, -51.30859375, -44.455078125, -37.6015625, -30.748046875, -23.89453125, -17.041015625, -10.1875, -3.333984375, 3.51953125, 10.373046875, 17.2265625, 24.080078125, 30.93359375, 37.787109375, 44.640625, 51.494140625, 58.34765625, 65.201171875, 72.0546875, 78.908203125, 85.76171875, 92.615234375, 99.46875, 106.322265625, 113.17578125, 120.029296875, 126.8828125, 133.736328125, 140.58984375, 147.443359375, 154.296875, 161.150390625, 168.00390625, 174.857421875, 181.7109375, 188.564453125, 195.41796875, 202.271484375, 209.125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 9.0, 1.0, 7.0, 10.0, 8.0, 19.0, 19.0, 19.0, 27.0, 32.0, 59.0, 56.0, 101.0, 247.0, 594.0, 1414.0, 3802.0, 16874.0, 3047374.0, 63055.0, 7866.0, 2322.0, 882.0, 356.0, 228.0, 78.0, 55.0, 54.0, 25.0, 18.0, 17.0, 16.0, 15.0, 5.0, 4.0, 5.0, 6.0, 11.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-679.0, -658.28125, -637.5625, -616.84375, -596.125, -575.40625, -554.6875, -533.96875, -513.25, -492.53125, -471.8125, -451.09375, -430.375, -409.65625, -388.9375, -368.21875, -347.5, -326.78125, -306.0625, -285.34375, -264.625, -243.90625, -223.1875, -202.46875, -181.75, -161.03125, -140.3125, -119.59375, -98.875, -78.15625, -57.4375, -36.71875, -16.0, 4.71875, 25.4375, 46.15625, 66.875, 87.59375, 108.3125, 129.03125, 149.75, 170.46875, 191.1875, 211.90625, 232.625, 253.34375, 274.0625, 294.78125, 315.5, 336.21875, 356.9375, 377.65625, 398.375, 419.09375, 439.8125, 460.53125, 481.25, 501.96875, 522.6875, 543.40625, 564.125, 584.84375, 605.5625, 626.28125, 647.0]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 14.0, 20.0, 38.0, 60.0, 91.0, 152.0, 172.0, 180.0, 97.0, 59.0, 46.0, 27.0, 16.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-542.3075561523438, -526.6310424804688, -510.95452880859375, -495.27801513671875, -479.6015319824219, -463.9250183105469, -448.2485046386719, -432.5719909667969, -416.8955078125, -401.218994140625, -385.54248046875, -369.865966796875, -354.1894836425781, -338.5129699707031, -322.8364562988281, -307.1599426269531, -291.4834289550781, -275.8069152832031, -260.1304016113281, -244.4539031982422, -228.77740478515625, -213.10089111328125, -197.42437744140625, -181.74786376953125, -166.0713653564453, -150.3948516845703, -134.71835327148438, -119.04183959960938, -103.3653335571289, -87.68882751464844, -72.01231384277344, -56.33580780029297, -40.6593017578125, -24.9827938079834, -9.306285858154297, 6.3702239990234375, 22.046730041503906, 37.723236083984375, 53.399749755859375, 69.07625579833984, 84.75276184082031, 100.42926788330078, 116.10577392578125, 131.78228759765625, 147.45880126953125, 163.1352996826172, 178.8118133544922, 194.48831176757812, 210.16482543945312, 225.84133911132812, 241.51783752441406, 257.1943359375, 272.870849609375, 288.54736328125, 304.223876953125, 319.900390625, 335.576904296875, 351.25341796875, 366.929931640625, 382.6064453125, 398.2829284667969, 413.9594421386719, 429.6359558105469, 445.3124694824219, 460.98895263671875]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 8.0, 19.0, 13.0, 12.0, 13.0, 17.0, 22.0, 23.0, 22.0, 21.0, 25.0, 36.0, 35.0, 37.0, 38.0, 36.0, 39.0, 53.0, 48.0, 42.0, 51.0, 34.0, 37.0, 35.0, 47.0, 35.0, 29.0, 27.0, 24.0, 26.0, 19.0, 11.0, 11.0, 13.0, 8.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-574.0869140625, -555.5037231445312, -536.9205932617188, -518.33740234375, -499.7542419433594, -481.17108154296875, -462.587890625, -444.0047302246094, -425.42156982421875, -406.8384094238281, -388.2552490234375, -369.67205810546875, -351.0888977050781, -332.5057373046875, -313.92254638671875, -295.3393859863281, -276.7562255859375, -258.1730651855469, -239.5898895263672, -221.0067138671875, -202.42355346679688, -183.84039306640625, -165.25721740722656, -146.67404174804688, -128.09088134765625, -109.5077133178711, -90.92454528808594, -72.34137725830078, -53.758209228515625, -35.17504119873047, -16.591873168945312, 1.991302490234375, 20.57452392578125, 39.157691955566406, 57.74085998535156, 76.32402801513672, 94.90719604492188, 113.49036407470703, 132.0735321044922, 150.65670776367188, 169.2398681640625, 187.82302856445312, 206.4062042236328, 224.9893798828125, 243.57254028320312, 262.15570068359375, 280.7388916015625, 299.3220520019531, 317.90521240234375, 336.4883728027344, 355.071533203125, 373.65472412109375, 392.2378845214844, 410.821044921875, 429.40423583984375, 447.9873962402344, 466.570556640625, 485.1537170410156, 503.73687744140625, 522.320068359375, 540.9031982421875, 559.4863891601562, 578.069580078125, 596.6527099609375, 615.2359008789062]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 3.0, 5.0, 1.0, 15.0, 9.0, 5.0, 12.0, 16.0, 20.0, 19.0, 27.0, 36.0, 26.0, 44.0, 34.0, 40.0, 37.0, 44.0, 44.0, 50.0, 36.0, 52.0, 44.0, 40.0, 41.0, 34.0, 29.0, 20.0, 28.0, 33.0, 23.0, 21.0, 21.0, 18.0, 13.0, 10.0, 9.0, 9.0, 7.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.625, -65.3828125, -63.140625, -60.8984375, -58.65625, -56.4140625, -54.171875, -51.9296875, -49.6875, -47.4453125, -45.203125, -42.9609375, -40.71875, -38.4765625, -36.234375, -33.9921875, -31.75, -29.5078125, -27.265625, -25.0234375, -22.78125, -20.5390625, -18.296875, -16.0546875, -13.8125, -11.5703125, -9.328125, -7.0859375, -4.84375, -2.6015625, -0.359375, 1.8828125, 4.125, 6.3671875, 8.609375, 10.8515625, 13.09375, 15.3359375, 17.578125, 19.8203125, 22.0625, 24.3046875, 26.546875, 28.7890625, 31.03125, 33.2734375, 35.515625, 37.7578125, 40.0, 42.2421875, 44.484375, 46.7265625, 48.96875, 51.2109375, 53.453125, 55.6953125, 57.9375, 60.1796875, 62.421875, 64.6640625, 66.90625, 69.1484375, 71.390625, 73.6328125, 75.875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 14.0, 17.0, 26.0, 38.0, 43.0, 89.0, 111.0, 158.0, 240.0, 398.0, 626.0, 1046.0, 1869.0, 3302.0, 6191.0, 12461.0, 30777.0, 228409.0, 2920192.0, 882692.0, 67863.0, 18637.0, 8553.0, 4409.0, 2444.0, 1347.0, 809.0, 518.0, 334.0, 199.0, 140.0, 97.0, 70.0, 55.0, 33.0, 20.0, 21.0, 13.0, 10.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-160.375, -155.4765625, -150.578125, -145.6796875, -140.78125, -135.8828125, -130.984375, -126.0859375, -121.1875, -116.2890625, -111.390625, -106.4921875, -101.59375, -96.6953125, -91.796875, -86.8984375, -82.0, -77.1015625, -72.203125, -67.3046875, -62.40625, -57.5078125, -52.609375, -47.7109375, -42.8125, -37.9140625, -33.015625, -28.1171875, -23.21875, -18.3203125, -13.421875, -8.5234375, -3.625, 1.2734375, 6.171875, 11.0703125, 15.96875, 20.8671875, 25.765625, 30.6640625, 35.5625, 40.4609375, 45.359375, 50.2578125, 55.15625, 60.0546875, 64.953125, 69.8515625, 74.75, 79.6484375, 84.546875, 89.4453125, 94.34375, 99.2421875, 104.140625, 109.0390625, 113.9375, 118.8359375, 123.734375, 128.6328125, 133.53125, 138.4296875, 143.328125, 148.2265625, 153.125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 10.0, 13.0, 15.0, 16.0, 43.0, 78.0, 115.0, 238.0, 432.0, 957.0, 1107.0, 524.0, 223.0, 109.0, 77.0, 34.0, 24.0, 14.0, 10.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-245.125, -237.93359375, -230.7421875, -223.55078125, -216.359375, -209.16796875, -201.9765625, -194.78515625, -187.59375, -180.40234375, -173.2109375, -166.01953125, -158.828125, -151.63671875, -144.4453125, -137.25390625, -130.0625, -122.87109375, -115.6796875, -108.48828125, -101.296875, -94.10546875, -86.9140625, -79.72265625, -72.53125, -65.33984375, -58.1484375, -50.95703125, -43.765625, -36.57421875, -29.3828125, -22.19140625, -15.0, -7.80859375, -0.6171875, 6.57421875, 13.765625, 20.95703125, 28.1484375, 35.33984375, 42.53125, 49.72265625, 56.9140625, 64.10546875, 71.296875, 78.48828125, 85.6796875, 92.87109375, 100.0625, 107.25390625, 114.4453125, 121.63671875, 128.828125, 136.01953125, 143.2109375, 150.40234375, 157.59375, 164.78515625, 171.9765625, 179.16796875, 186.359375, 193.55078125, 200.7421875, 207.93359375, 215.125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 10.0, 16.0, 19.0, 25.0, 43.0, 81.0, 126.0, 227.0, 411.0, 905.0, 3268.0, 21418.0, 3478581.0, 670476.0, 14394.0, 2414.0, 870.0, 436.0, 207.0, 138.0, 74.0, 54.0, 29.0, 15.0, 16.0, 4.0, 3.0, 9.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-699.0, -677.1015625, -655.203125, -633.3046875, -611.40625, -589.5078125, -567.609375, -545.7109375, -523.8125, -501.9140625, -480.015625, -458.1171875, -436.21875, -414.3203125, -392.421875, -370.5234375, -348.625, -326.7265625, -304.828125, -282.9296875, -261.03125, -239.1328125, -217.234375, -195.3359375, -173.4375, -151.5390625, -129.640625, -107.7421875, -85.84375, -63.9453125, -42.046875, -20.1484375, 1.75, 23.6484375, 45.546875, 67.4453125, 89.34375, 111.2421875, 133.140625, 155.0390625, 176.9375, 198.8359375, 220.734375, 242.6328125, 264.53125, 286.4296875, 308.328125, 330.2265625, 352.125, 374.0234375, 395.921875, 417.8203125, 439.71875, 461.6171875, 483.515625, 505.4140625, 527.3125, 549.2109375, 571.109375, 593.0078125, 614.90625, 636.8046875, 658.703125, 680.6015625, 702.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 9.0, 13.0, 16.0, 25.0, 71.0, 141.0, 206.0, 253.0, 137.0, 72.0, 43.0, 11.0, 9.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1969.292236328125, -1932.192138671875, -1895.092041015625, -1857.991943359375, -1820.891845703125, -1783.791748046875, -1746.691650390625, -1709.591552734375, -1672.491455078125, -1635.391357421875, -1598.291259765625, -1561.191162109375, -1524.091064453125, -1486.990966796875, -1449.890869140625, -1412.790771484375, -1375.690673828125, -1338.590576171875, -1301.490478515625, -1264.390380859375, -1227.290283203125, -1190.190185546875, -1153.090087890625, -1115.989990234375, -1078.8897705078125, -1041.7896728515625, -1004.6895751953125, -967.5894775390625, -930.4893798828125, -893.3892822265625, -856.2891845703125, -819.1890869140625, -782.0889892578125, -744.9888916015625, -707.8887939453125, -670.7886962890625, -633.6885986328125, -596.5885009765625, -559.4884033203125, -522.3883056640625, -485.2882080078125, -448.1881103515625, -411.0880126953125, -373.9879150390625, -336.8878173828125, -299.7877197265625, -262.6875915527344, -225.58749389648438, -188.48739624023438, -151.38729858398438, -114.28719329833984, -77.18708801269531, -40.08699035644531, -2.9868927001953125, 34.11322021484375, 71.21331787109375, 108.31341552734375, 145.41351318359375, 182.51361083984375, 219.6137237548828, 256.71380615234375, 293.81390380859375, 330.9140319824219, 368.0141296386719, 405.1142272949219]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 8.0, 6.0, 12.0, 11.0, 14.0, 13.0, 19.0, 17.0, 25.0, 22.0, 28.0, 34.0, 37.0, 38.0, 42.0, 37.0, 41.0, 34.0, 53.0, 46.0, 43.0, 44.0, 32.0, 42.0, 39.0, 35.0, 33.0, 25.0, 33.0, 13.0, 19.0, 20.0, 14.0, 11.0, 11.0, 9.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-400.17364501953125, -385.8074035644531, -371.441162109375, -357.0749206542969, -342.70867919921875, -328.34246826171875, -313.9761962890625, -299.6099853515625, -285.2437438964844, -270.87750244140625, -256.5112609863281, -242.14501953125, -227.77879333496094, -213.4125518798828, -199.0463104248047, -184.68008422851562, -170.31382751464844, -155.9475860595703, -141.5813446044922, -127.2151107788086, -112.848876953125, -98.48263549804688, -84.11639404296875, -69.75016021728516, -55.38391876220703, -41.01768112182617, -26.65144157409668, -12.285202026367188, 2.081035614013672, 16.44727325439453, 30.813514709472656, 45.17974853515625, 59.545989990234375, 73.9122314453125, 88.2784652709961, 102.64470672607422, 117.01094055175781, 131.37718200683594, 145.74342346191406, 160.10964965820312, 174.47589111328125, 188.84213256835938, 203.2083740234375, 217.57461547851562, 231.9408416748047, 246.3070831298828, 260.67333984375, 275.03955078125, 289.40582275390625, 303.7720642089844, 318.1383056640625, 332.5045471191406, 346.87078857421875, 361.23699951171875, 375.603271484375, 389.969482421875, 404.3357238769531, 418.70196533203125, 433.0682067871094, 447.4344482421875, 461.8006896972656, 476.16693115234375, 490.53314208984375, 504.8993835449219, 519.265625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 6.0, 8.0, 10.0, 11.0, 16.0, 14.0, 21.0, 31.0, 24.0, 30.0, 41.0, 41.0, 41.0, 42.0, 47.0, 36.0, 57.0, 52.0, 44.0, 38.0, 58.0, 40.0, 41.0, 26.0, 28.0, 23.0, 20.0, 22.0, 20.0, 16.0, 21.0, 16.0, 11.0, 6.0, 6.0, 7.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.6875, -73.244140625, -70.80078125, -68.357421875, -65.9140625, -63.470703125, -61.02734375, -58.583984375, -56.140625, -53.697265625, -51.25390625, -48.810546875, -46.3671875, -43.923828125, -41.48046875, -39.037109375, -36.59375, -34.150390625, -31.70703125, -29.263671875, -26.8203125, -24.376953125, -21.93359375, -19.490234375, -17.046875, -14.603515625, -12.16015625, -9.716796875, -7.2734375, -4.830078125, -2.38671875, 0.056640625, 2.5, 4.943359375, 7.38671875, 9.830078125, 12.2734375, 14.716796875, 17.16015625, 19.603515625, 22.046875, 24.490234375, 26.93359375, 29.376953125, 31.8203125, 34.263671875, 36.70703125, 39.150390625, 41.59375, 44.037109375, 46.48046875, 48.923828125, 51.3671875, 53.810546875, 56.25390625, 58.697265625, 61.140625, 63.583984375, 66.02734375, 68.470703125, 70.9140625, 73.357421875, 75.80078125, 78.244140625, 80.6875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 8.0, 10.0, 7.0, 14.0, 14.0, 33.0, 30.0, 57.0, 54.0, 85.0, 125.0, 170.0, 255.0, 361.0, 488.0, 786.0, 1204.0, 2019.0, 3429.0, 6329.0, 12182.0, 24633.0, 54877.0, 135188.0, 385734.0, 251039.0, 90778.0, 38690.0, 18475.0, 9021.0, 4916.0, 2801.0, 1659.0, 991.0, 668.0, 389.0, 303.0, 196.0, 146.0, 121.0, 73.0, 52.0, 46.0, 28.0, 18.0, 13.0, 13.0, 10.0, 11.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.8203125, -11.4598388671875, -11.099365234375, -10.7388916015625, -10.37841796875, -10.0179443359375, -9.657470703125, -9.2969970703125, -8.9365234375, -8.5760498046875, -8.215576171875, -7.8551025390625, -7.49462890625, -7.1341552734375, -6.773681640625, -6.4132080078125, -6.052734375, -5.6922607421875, -5.331787109375, -4.9713134765625, -4.61083984375, -4.2503662109375, -3.889892578125, -3.5294189453125, -3.1689453125, -2.8084716796875, -2.447998046875, -2.0875244140625, -1.72705078125, -1.3665771484375, -1.006103515625, -0.6456298828125, -0.28515625, 0.0753173828125, 0.435791015625, 0.7962646484375, 1.15673828125, 1.5172119140625, 1.877685546875, 2.2381591796875, 2.5986328125, 2.9591064453125, 3.319580078125, 3.6800537109375, 4.04052734375, 4.4010009765625, 4.761474609375, 5.1219482421875, 5.482421875, 5.8428955078125, 6.203369140625, 6.5638427734375, 6.92431640625, 7.2847900390625, 7.645263671875, 8.0057373046875, 8.3662109375, 8.7266845703125, 9.087158203125, 9.4476318359375, 9.80810546875, 10.1685791015625, 10.529052734375, 10.8895263671875, 11.25]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 7.0, 15.0, 16.0, 24.0, 18.0, 23.0, 30.0, 29.0, 28.0, 40.0, 38.0, 39.0, 50.0, 33.0, 46.0, 41.0, 1061.0, 47.0, 37.0, 44.0, 41.0, 53.0, 31.0, 38.0, 24.0, 21.0, 25.0, 28.0, 22.0, 16.0, 9.0, 8.0, 7.0, 3.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.96875, -49.341796875, -47.71484375, -46.087890625, -44.4609375, -42.833984375, -41.20703125, -39.580078125, -37.953125, -36.326171875, -34.69921875, -33.072265625, -31.4453125, -29.818359375, -28.19140625, -26.564453125, -24.9375, -23.310546875, -21.68359375, -20.056640625, -18.4296875, -16.802734375, -15.17578125, -13.548828125, -11.921875, -10.294921875, -8.66796875, -7.041015625, -5.4140625, -3.787109375, -2.16015625, -0.533203125, 1.09375, 2.720703125, 4.34765625, 5.974609375, 7.6015625, 9.228515625, 10.85546875, 12.482421875, 14.109375, 15.736328125, 17.36328125, 18.990234375, 20.6171875, 22.244140625, 23.87109375, 25.498046875, 27.125, 28.751953125, 30.37890625, 32.005859375, 33.6328125, 35.259765625, 36.88671875, 38.513671875, 40.140625, 41.767578125, 43.39453125, 45.021484375, 46.6484375, 48.275390625, 49.90234375, 51.529296875, 53.15625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 8.0, 17.0, 19.0, 22.0, 50.0, 63.0, 67.0, 114.0, 152.0, 247.0, 348.0, 467.0, 745.0, 1064.0, 1593.0, 2527.0, 3809.0, 5880.0, 9478.0, 15516.0, 25678.0, 44113.0, 77546.0, 141837.0, 1276081.0, 230275.0, 108053.0, 60726.0, 34664.0, 20874.0, 12721.0, 7914.0, 4964.0, 3249.0, 2102.0, 1335.0, 864.0, 638.0, 416.0, 277.0, 178.0, 128.0, 99.0, 65.0, 52.0, 32.0, 21.0, 16.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-3.91015625, -3.787139892578125, -3.66412353515625, -3.541107177734375, -3.4180908203125, -3.295074462890625, -3.17205810546875, -3.049041748046875, -2.926025390625, -2.803009033203125, -2.67999267578125, -2.556976318359375, -2.4339599609375, -2.310943603515625, -2.18792724609375, -2.064910888671875, -1.94189453125, -1.818878173828125, -1.69586181640625, -1.572845458984375, -1.4498291015625, -1.326812744140625, -1.20379638671875, -1.080780029296875, -0.957763671875, -0.834747314453125, -0.71173095703125, -0.588714599609375, -0.4656982421875, -0.342681884765625, -0.21966552734375, -0.096649169921875, 0.0263671875, 0.149383544921875, 0.27239990234375, 0.395416259765625, 0.5184326171875, 0.641448974609375, 0.76446533203125, 0.887481689453125, 1.010498046875, 1.133514404296875, 1.25653076171875, 1.379547119140625, 1.5025634765625, 1.625579833984375, 1.74859619140625, 1.871612548828125, 1.99462890625, 2.117645263671875, 2.24066162109375, 2.363677978515625, 2.4866943359375, 2.609710693359375, 2.73272705078125, 2.855743408203125, 2.978759765625, 3.101776123046875, 3.22479248046875, 3.347808837890625, 3.4708251953125, 3.593841552734375, 3.71685791015625, 3.839874267578125, 3.962890625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 9.0, 10.0, 13.0, 8.0, 15.0, 5.0, 18.0, 8.0, 21.0, 38.0, 56.0, 136.0, 304.0, 119.0, 45.0, 31.0, 22.0, 19.0, 21.0, 8.0, 12.0, 9.0, 11.0, 8.0, 9.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.346435546875, -0.3354148864746094, -0.32439422607421875, -0.3133735656738281, -0.3023529052734375, -0.2913322448730469, -0.28031158447265625, -0.2692909240722656, -0.258270263671875, -0.24724960327148438, -0.23622894287109375, -0.22520828247070312, -0.2141876220703125, -0.20316696166992188, -0.19214630126953125, -0.18112564086914062, -0.17010498046875, -0.15908432006835938, -0.14806365966796875, -0.13704299926757812, -0.1260223388671875, -0.11500167846679688, -0.10398101806640625, -0.09296035766601562, -0.081939697265625, -0.07091903686523438, -0.05989837646484375, -0.048877716064453125, -0.0378570556640625, -0.026836395263671875, -0.01581573486328125, -0.004795074462890625, 0.0062255859375, 0.017246246337890625, 0.02826690673828125, 0.039287567138671875, 0.0503082275390625, 0.061328887939453125, 0.07234954833984375, 0.08337020874023438, 0.094390869140625, 0.10541152954101562, 0.11643218994140625, 0.12745285034179688, 0.1384735107421875, 0.14949417114257812, 0.16051483154296875, 0.17153549194335938, 0.18255615234375, 0.19357681274414062, 0.20459747314453125, 0.21561813354492188, 0.2266387939453125, 0.23765945434570312, 0.24868011474609375, 0.2597007751464844, 0.270721435546875, 0.2817420959472656, 0.29276275634765625, 0.3037834167480469, 0.3148040771484375, 0.3258247375488281, 0.33684539794921875, 0.3478660583496094, 0.35888671875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 10.0, 6.0, 11.0, 11.0, 7.0, 12.0, 6.0, 18.0, 23.0, 33.0, 49.0, 89.0, 190.0, 1046769.0, 964.0, 114.0, 68.0, 35.0, 25.0, 13.0, 10.0, 13.0, 9.0, 11.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.770751953125, -10.43212890625, -10.093505859375, -9.7548828125, -9.416259765625, -9.07763671875, -8.739013671875, -8.400390625, -8.061767578125, -7.72314453125, -7.384521484375, -7.0458984375, -6.707275390625, -6.36865234375, -6.030029296875, -5.69140625, -5.352783203125, -5.01416015625, -4.675537109375, -4.3369140625, -3.998291015625, -3.65966796875, -3.321044921875, -2.982421875, -2.643798828125, -2.30517578125, -1.966552734375, -1.6279296875, -1.289306640625, -0.95068359375, -0.612060546875, -0.2734375, 0.065185546875, 0.40380859375, 0.742431640625, 1.0810546875, 1.419677734375, 1.75830078125, 2.096923828125, 2.435546875, 2.774169921875, 3.11279296875, 3.451416015625, 3.7900390625, 4.128662109375, 4.46728515625, 4.805908203125, 5.14453125, 5.483154296875, 5.82177734375, 6.160400390625, 6.4990234375, 6.837646484375, 7.17626953125, 7.514892578125, 7.853515625, 8.192138671875, 8.53076171875, 8.869384765625, 9.2080078125, 9.546630859375, 9.88525390625, 10.223876953125, 10.5625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [45.0, 937.0, 38.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10511351376771927, -0.034976959228515625, 0.03515959531068802, 0.10529615730047226, 0.1754327118396759, 0.24556925892829895, 0.3157058358192444, 0.38584238290786743, 0.4559789299964905, 0.5261154770851135, 0.5962520241737366, 0.6663886308670044, 0.7365251779556274, 0.8066617250442505, 0.8767982721328735, 0.9469348192214966, 1.0170713663101196, 1.0872079133987427, 1.1573444604873657, 1.2274810075759888, 1.2976175546646118, 1.3677541017532349, 1.4378907680511475, 1.5080273151397705, 1.578163743019104, 1.648300290107727, 1.71843683719635, 1.7885733842849731, 1.8587099313735962, 1.9288464784622192, 1.9989831447601318, 2.069119691848755, 2.139256238937378, 2.209392786026001, 2.279529333114624, 2.349665880203247, 2.41980242729187, 2.489938974380493, 2.560075521469116, 2.6302120685577393, 2.7003486156463623, 2.7704851627349854, 2.8406217098236084, 2.9107582569122314, 2.9808948040008545, 3.0510313510894775, 3.1211678981781006, 3.1913044452667236, 3.261441230773926, 3.331577777862549, 3.401714324951172, 3.471850872039795, 3.541987419128418, 3.612123966217041, 3.682260513305664, 3.752397060394287, 3.82253360748291, 3.892670154571533, 3.9628067016601562, 4.032943248748779, 4.103079795837402, 4.173216342926025, 4.243352890014648, 4.3134894371032715, 4.3836259841918945]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 8.0, 9.0, 8.0, 11.0, 19.0, 11.0, 14.0, 19.0, 22.0, 33.0, 31.0, 36.0, 26.0, 29.0, 41.0, 56.0, 49.0, 37.0, 41.0, 36.0, 35.0, 43.0, 31.0, 41.0, 43.0, 30.0, 39.0, 27.0, 37.0, 25.0, 25.0, 13.0, 17.0, 10.0, 9.0, 11.0, 7.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.22266161441802979, -0.21496491134166718, -0.20726822316646576, -0.19957152009010315, -0.19187483191490173, -0.18417812883853912, -0.1764814257621765, -0.1687847375869751, -0.1610880345106125, -0.15339133143424988, -0.14569464325904846, -0.13799794018268585, -0.13030123710632324, -0.12260454893112183, -0.11490784585475922, -0.1072111502289772, -0.09951445460319519, -0.09181775897741318, -0.08412106335163116, -0.07642436027526855, -0.06872766464948654, -0.06103096902370453, -0.05333426967263222, -0.045637570321559906, -0.03794087469577789, -0.03024417720735073, -0.02254747971892357, -0.014850782230496407, -0.007154084742069244, 0.0005426108837127686, 0.00823931023478508, 0.01593600958585739, 0.023632705211639404, 0.03132940083742142, 0.03902610018849373, 0.04672279953956604, 0.05441949516534805, 0.062116190791130066, 0.06981289386749268, 0.07750958949327469, 0.0852062851190567, 0.09290298074483871, 0.10059967637062073, 0.10829637944698334, 0.11599307507276535, 0.12368977069854736, 0.13138647377490997, 0.13908317685127258, 0.146779865026474, 0.1544765681028366, 0.16217325627803802, 0.16986995935440063, 0.17756664752960205, 0.18526335060596466, 0.19296005368232727, 0.2006567418575287, 0.2083534449338913, 0.2160501480102539, 0.22374683618545532, 0.23144353926181793, 0.23914024233818054, 0.24683693051338196, 0.2545336186885834, 0.2622303366661072, 0.2699270248413086]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 6.0, 8.0, 9.0, 12.0, 16.0, 14.0, 21.0, 30.0, 25.0, 30.0, 41.0, 41.0, 39.0, 44.0, 47.0, 36.0, 56.0, 51.0, 45.0, 39.0, 57.0, 39.0, 43.0, 26.0, 28.0, 22.0, 21.0, 22.0, 19.0, 17.0, 21.0, 16.0, 10.0, 7.0, 6.0, 7.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.6875, -73.2451171875, -70.802734375, -68.3603515625, -65.91796875, -63.4755859375, -61.033203125, -58.5908203125, -56.1484375, -53.7060546875, -51.263671875, -48.8212890625, -46.37890625, -43.9365234375, -41.494140625, -39.0517578125, -36.609375, -34.1669921875, -31.724609375, -29.2822265625, -26.83984375, -24.3974609375, -21.955078125, -19.5126953125, -17.0703125, -14.6279296875, -12.185546875, -9.7431640625, -7.30078125, -4.8583984375, -2.416015625, 0.0263671875, 2.46875, 4.9111328125, 7.353515625, 9.7958984375, 12.23828125, 14.6806640625, 17.123046875, 19.5654296875, 22.0078125, 24.4501953125, 26.892578125, 29.3349609375, 31.77734375, 34.2197265625, 36.662109375, 39.1044921875, 41.546875, 43.9892578125, 46.431640625, 48.8740234375, 51.31640625, 53.7587890625, 56.201171875, 58.6435546875, 61.0859375, 63.5283203125, 65.970703125, 68.4130859375, 70.85546875, 73.2978515625, 75.740234375, 78.1826171875, 80.625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 7.0, 22.0, 20.0, 20.0, 22.0, 27.0, 45.0, 73.0, 95.0, 153.0, 219.0, 346.0, 433.0, 656.0, 1128.0, 1643.0, 2817.0, 5015.0, 9688.0, 23484.0, 96914.0, 722181.0, 131229.0, 27688.0, 11036.0, 5267.0, 3031.0, 1814.0, 1153.0, 746.0, 509.0, 331.0, 201.0, 153.0, 113.0, 76.0, 57.0, 48.0, 26.0, 16.0, 10.0, 11.0, 9.0, 7.0, 4.0, 6.0, 0.0, 2.0, 6.0, 1.0, 1.0], "bins": [-118.8125, -115.3759765625, -111.939453125, -108.5029296875, -105.06640625, -101.6298828125, -98.193359375, -94.7568359375, -91.3203125, -87.8837890625, -84.447265625, -81.0107421875, -77.57421875, -74.1376953125, -70.701171875, -67.2646484375, -63.828125, -60.3916015625, -56.955078125, -53.5185546875, -50.08203125, -46.6455078125, -43.208984375, -39.7724609375, -36.3359375, -32.8994140625, -29.462890625, -26.0263671875, -22.58984375, -19.1533203125, -15.716796875, -12.2802734375, -8.84375, -5.4072265625, -1.970703125, 1.4658203125, 4.90234375, 8.3388671875, 11.775390625, 15.2119140625, 18.6484375, 22.0849609375, 25.521484375, 28.9580078125, 32.39453125, 35.8310546875, 39.267578125, 42.7041015625, 46.140625, 49.5771484375, 53.013671875, 56.4501953125, 59.88671875, 63.3232421875, 66.759765625, 70.1962890625, 73.6328125, 77.0693359375, 80.505859375, 83.9423828125, 87.37890625, 90.8154296875, 94.251953125, 97.6884765625, 101.125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 6.0, 3.0, 7.0, 4.0, 11.0, 12.0, 21.0, 15.0, 23.0, 21.0, 15.0, 18.0, 30.0, 36.0, 35.0, 33.0, 43.0, 47.0, 58.0, 121.0, 1568.0, 336.0, 119.0, 57.0, 49.0, 37.0, 38.0, 38.0, 43.0, 22.0, 26.0, 20.0, 17.0, 22.0, 19.0, 12.0, 12.0, 15.0, 12.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-237.5, -230.287109375, -223.07421875, -215.861328125, -208.6484375, -201.435546875, -194.22265625, -187.009765625, -179.796875, -172.583984375, -165.37109375, -158.158203125, -150.9453125, -143.732421875, -136.51953125, -129.306640625, -122.09375, -114.880859375, -107.66796875, -100.455078125, -93.2421875, -86.029296875, -78.81640625, -71.603515625, -64.390625, -57.177734375, -49.96484375, -42.751953125, -35.5390625, -28.326171875, -21.11328125, -13.900390625, -6.6875, 0.525390625, 7.73828125, 14.951171875, 22.1640625, 29.376953125, 36.58984375, 43.802734375, 51.015625, 58.228515625, 65.44140625, 72.654296875, 79.8671875, 87.080078125, 94.29296875, 101.505859375, 108.71875, 115.931640625, 123.14453125, 130.357421875, 137.5703125, 144.783203125, 151.99609375, 159.208984375, 166.421875, 173.634765625, 180.84765625, 188.060546875, 195.2734375, 202.486328125, 209.69921875, 216.912109375, 224.125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 3.0, 8.0, 8.0, 13.0, 12.0, 16.0, 18.0, 28.0, 32.0, 33.0, 53.0, 71.0, 95.0, 186.0, 266.0, 470.0, 929.0, 2293.0, 6443.0, 32071.0, 2946091.0, 138352.0, 11673.0, 3549.0, 1413.0, 626.0, 295.0, 223.0, 118.0, 70.0, 52.0, 35.0, 35.0, 28.0, 23.0, 14.0, 11.0, 10.0, 8.0, 5.0, 6.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-399.0, -386.80859375, -374.6171875, -362.42578125, -350.234375, -338.04296875, -325.8515625, -313.66015625, -301.46875, -289.27734375, -277.0859375, -264.89453125, -252.703125, -240.51171875, -228.3203125, -216.12890625, -203.9375, -191.74609375, -179.5546875, -167.36328125, -155.171875, -142.98046875, -130.7890625, -118.59765625, -106.40625, -94.21484375, -82.0234375, -69.83203125, -57.640625, -45.44921875, -33.2578125, -21.06640625, -8.875, 3.31640625, 15.5078125, 27.69921875, 39.890625, 52.08203125, 64.2734375, 76.46484375, 88.65625, 100.84765625, 113.0390625, 125.23046875, 137.421875, 149.61328125, 161.8046875, 173.99609375, 186.1875, 198.37890625, 210.5703125, 222.76171875, 234.953125, 247.14453125, 259.3359375, 271.52734375, 283.71875, 295.91015625, 308.1015625, 320.29296875, 332.484375, 344.67578125, 356.8671875, 369.05859375, 381.25]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 29.0, 700.0, 277.0, 10.0, 1.0], "bins": [-5922.0849609375, -5824.642578125, -5727.2001953125, -5629.7578125, -5532.3154296875, -5434.873046875, -5337.4306640625, -5239.98828125, -5142.5458984375, -5045.103515625, -4947.6611328125, -4850.21875, -4752.7763671875, -4655.333984375, -4557.8916015625, -4460.44921875, -4363.00634765625, -4265.56396484375, -4168.12158203125, -4070.67919921875, -3973.23681640625, -3875.79443359375, -3778.35205078125, -3680.909423828125, -3583.46728515625, -3486.02490234375, -3388.58251953125, -3291.14013671875, -3193.69775390625, -3096.25537109375, -2998.81298828125, -2901.370361328125, -2803.927978515625, -2706.485595703125, -2609.043212890625, -2511.600830078125, -2414.158447265625, -2316.7158203125, -2219.2734375, -2121.8310546875, -2024.3887939453125, -1926.9464111328125, -1829.5040283203125, -1732.0615234375, -1634.619140625, -1537.1767578125, -1439.734375, -1342.2919921875, -1244.8494873046875, -1147.4071044921875, -1049.9647216796875, -952.5222778320312, -855.079833984375, -757.637451171875, -660.195068359375, -562.7526245117188, -465.3102722167969, -367.86785888671875, -270.42547607421875, -172.98306274414062, -75.5406494140625, 21.901763916015625, 119.34414672851562, 216.78659057617188, 314.2289733886719]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 13.0, 5.0, 13.0, 7.0, 16.0, 22.0, 19.0, 25.0, 21.0, 18.0, 29.0, 26.0, 24.0, 25.0, 42.0, 32.0, 38.0, 44.0, 50.0, 41.0, 42.0, 43.0, 44.0, 39.0, 31.0, 36.0, 33.0, 31.0, 33.0, 21.0, 19.0, 23.0, 19.0, 8.0, 14.0, 16.0, 12.0, 10.0, 1.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-632.8162841796875, -614.3766479492188, -595.93701171875, -577.4973754882812, -559.0577392578125, -540.6181030273438, -522.178466796875, -503.7388610839844, -485.2992248535156, -466.8595886230469, -448.4199523925781, -429.9803161621094, -411.54071044921875, -393.10107421875, -374.66143798828125, -356.2218017578125, -337.78216552734375, -319.342529296875, -300.90289306640625, -282.4632568359375, -264.02362060546875, -245.58399963378906, -227.14437866210938, -208.70474243164062, -190.26510620117188, -171.82546997070312, -153.38583374023438, -134.9462127685547, -116.50657653808594, -98.06694030761719, -79.62731170654297, -61.18768310546875, -42.74810791015625, -24.308475494384766, -5.868843078613281, 12.570789337158203, 31.010421752929688, 49.45005798339844, 67.88968658447266, 86.32931518554688, 104.76895141601562, 123.20858764648438, 141.64822387695312, 160.0878448486328, 178.52748107910156, 196.9671173095703, 215.40673828125, 233.84637451171875, 252.2860107421875, 270.72564697265625, 289.165283203125, 307.60491943359375, 326.0445556640625, 344.48419189453125, 362.9237976074219, 381.3634338378906, 399.8030700683594, 418.2427062988281, 436.6823425292969, 455.1219787597656, 473.56158447265625, 492.001220703125, 510.44085693359375, 528.8804931640625, 547.3201293945312]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 10.0, 12.0, 15.0, 14.0, 20.0, 18.0, 27.0, 33.0, 35.0, 29.0, 43.0, 49.0, 35.0, 47.0, 41.0, 57.0, 63.0, 46.0, 43.0, 38.0, 52.0, 38.0, 24.0, 30.0, 24.0, 26.0, 15.0, 17.0, 18.0, 15.0, 12.0, 7.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-84.375, -81.70703125, -79.0390625, -76.37109375, -73.703125, -71.03515625, -68.3671875, -65.69921875, -63.03125, -60.36328125, -57.6953125, -55.02734375, -52.359375, -49.69140625, -47.0234375, -44.35546875, -41.6875, -39.01953125, -36.3515625, -33.68359375, -31.015625, -28.34765625, -25.6796875, -23.01171875, -20.34375, -17.67578125, -15.0078125, -12.33984375, -9.671875, -7.00390625, -4.3359375, -1.66796875, 1.0, 3.66796875, 6.3359375, 9.00390625, 11.671875, 14.33984375, 17.0078125, 19.67578125, 22.34375, 25.01171875, 27.6796875, 30.34765625, 33.015625, 35.68359375, 38.3515625, 41.01953125, 43.6875, 46.35546875, 49.0234375, 51.69140625, 54.359375, 57.02734375, 59.6953125, 62.36328125, 65.03125, 67.69921875, 70.3671875, 73.03515625, 75.703125, 78.37109375, 81.0390625, 83.70703125, 86.375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 9.0, 9.0, 13.0, 22.0, 31.0, 41.0, 61.0, 76.0, 132.0, 176.0, 283.0, 426.0, 665.0, 1192.0, 2312.0, 4312.0, 9224.0, 22179.0, 93473.0, 1797371.0, 2109501.0, 109283.0, 23369.0, 9680.0, 4597.0, 2299.0, 1375.0, 749.0, 463.0, 289.0, 185.0, 144.0, 100.0, 74.0, 43.0, 33.0, 27.0, 12.0, 15.0, 6.0, 2.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-176.25, -170.74609375, -165.2421875, -159.73828125, -154.234375, -148.73046875, -143.2265625, -137.72265625, -132.21875, -126.71484375, -121.2109375, -115.70703125, -110.203125, -104.69921875, -99.1953125, -93.69140625, -88.1875, -82.68359375, -77.1796875, -71.67578125, -66.171875, -60.66796875, -55.1640625, -49.66015625, -44.15625, -38.65234375, -33.1484375, -27.64453125, -22.140625, -16.63671875, -11.1328125, -5.62890625, -0.125, 5.37890625, 10.8828125, 16.38671875, 21.890625, 27.39453125, 32.8984375, 38.40234375, 43.90625, 49.41015625, 54.9140625, 60.41796875, 65.921875, 71.42578125, 76.9296875, 82.43359375, 87.9375, 93.44140625, 98.9453125, 104.44921875, 109.953125, 115.45703125, 120.9609375, 126.46484375, 131.96875, 137.47265625, 142.9765625, 148.48046875, 153.984375, 159.48828125, 164.9921875, 170.49609375, 176.0]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 12.0, 18.0, 20.0, 32.0, 58.0, 100.0, 300.0, 875.0, 1771.0, 507.0, 193.0, 68.0, 42.0, 29.0, 19.0, 9.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.0, -251.71875, -240.4375, -229.15625, -217.875, -206.59375, -195.3125, -184.03125, -172.75, -161.46875, -150.1875, -138.90625, -127.625, -116.34375, -105.0625, -93.78125, -82.5, -71.21875, -59.9375, -48.65625, -37.375, -26.09375, -14.8125, -3.53125, 7.75, 19.03125, 30.3125, 41.59375, 52.875, 64.15625, 75.4375, 86.71875, 98.0, 109.28125, 120.5625, 131.84375, 143.125, 154.40625, 165.6875, 176.96875, 188.25, 199.53125, 210.8125, 222.09375, 233.375, 244.65625, 255.9375, 267.21875, 278.5, 289.78125, 301.0625, 312.34375, 323.625, 334.90625, 346.1875, 357.46875, 368.75, 380.03125, 391.3125, 402.59375, 413.875, 425.15625, 436.4375, 447.71875, 459.0]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 24.0, 18.0, 44.0, 82.0, 136.0, 255.0, 619.0, 2449.0, 25177.0, 4015719.0, 141493.0, 6288.0, 1138.0, 399.0, 214.0, 87.0, 60.0, 32.0, 15.0, 10.0, 11.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1361.0, -1325.8671875, -1290.734375, -1255.6015625, -1220.46875, -1185.3359375, -1150.203125, -1115.0703125, -1079.9375, -1044.8046875, -1009.671875, -974.5390625, -939.40625, -904.2734375, -869.140625, -834.0078125, -798.875, -763.7421875, -728.609375, -693.4765625, -658.34375, -623.2109375, -588.078125, -552.9453125, -517.8125, -482.6796875, -447.546875, -412.4140625, -377.28125, -342.1484375, -307.015625, -271.8828125, -236.75, -201.6171875, -166.484375, -131.3515625, -96.21875, -61.0859375, -25.953125, 9.1796875, 44.3125, 79.4453125, 114.578125, 149.7109375, 184.84375, 219.9765625, 255.109375, 290.2421875, 325.375, 360.5078125, 395.640625, 430.7734375, 465.90625, 501.0390625, 536.171875, 571.3046875, 606.4375, 641.5703125, 676.703125, 711.8359375, 746.96875, 782.1015625, 817.234375, 852.3671875, 887.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 17.0, 18.0, 26.0, 61.0, 100.0, 167.0, 222.0, 177.0, 108.0, 57.0, 16.0, 24.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1824.9630126953125, -1788.8408203125, -1752.7186279296875, -1716.596435546875, -1680.474365234375, -1644.3521728515625, -1608.22998046875, -1572.1077880859375, -1535.985595703125, -1499.8634033203125, -1463.7412109375, -1427.6190185546875, -1391.496826171875, -1355.374755859375, -1319.2525634765625, -1283.13037109375, -1247.0081787109375, -1210.885986328125, -1174.7637939453125, -1138.6416015625, -1102.51953125, -1066.3973388671875, -1030.275146484375, -994.1529541015625, -958.03076171875, -921.9085693359375, -885.786376953125, -849.6642456054688, -813.5420532226562, -777.4198608398438, -741.2977294921875, -705.175537109375, -669.053466796875, -632.9312744140625, -596.80908203125, -560.6869506835938, -524.5647583007812, -488.44256591796875, -452.3204040527344, -416.1982421875, -380.0760498046875, -343.953857421875, -307.8316955566406, -271.70953369140625, -235.58734130859375, -199.4651641845703, -163.34298706054688, -127.22080993652344, -91.0986328125, -54.97645568847656, -18.854278564453125, 17.267898559570312, 53.39007568359375, 89.51225280761719, 125.63442993164062, 161.75660705566406, 197.8787841796875, 234.00096130371094, 270.1231384277344, 306.24530029296875, 342.36749267578125, 378.48968505859375, 414.6118469238281, 450.7340087890625, 486.856201171875]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 3.0, 8.0, 7.0, 9.0, 15.0, 9.0, 12.0, 16.0, 16.0, 25.0, 26.0, 28.0, 30.0, 20.0, 21.0, 31.0, 39.0, 31.0, 27.0, 33.0, 38.0, 34.0, 35.0, 46.0, 42.0, 28.0, 35.0, 36.0, 36.0, 27.0, 25.0, 25.0, 24.0, 18.0, 22.0, 30.0, 8.0, 17.0, 9.0, 8.0, 10.0, 9.0, 4.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-462.4507751464844, -447.8729553222656, -433.29510498046875, -418.71728515625, -404.13946533203125, -389.5616455078125, -374.98382568359375, -360.4059753417969, -345.8281555175781, -331.2503356933594, -316.6724853515625, -302.09466552734375, -287.516845703125, -272.93902587890625, -258.3612060546875, -243.78335571289062, -229.20553588867188, -214.62771606445312, -200.0498809814453, -185.4720458984375, -170.89422607421875, -156.31640625, -141.7385711669922, -127.1607437133789, -112.58291625976562, -98.00508880615234, -83.42726135253906, -68.84943389892578, -54.2716064453125, -39.69377899169922, -25.115951538085938, -10.538124084472656, 4.0396728515625, 18.61750030517578, 33.19532775878906, 47.773155212402344, 62.350982666015625, 76.9288101196289, 91.50663757324219, 106.08446502685547, 120.66229248046875, 135.2401123046875, 149.8179473876953, 164.39578247070312, 178.97360229492188, 193.55142211914062, 208.12925720214844, 222.70709228515625, 237.284912109375, 251.86273193359375, 266.4405517578125, 281.0184020996094, 295.5962219238281, 310.1740417480469, 324.75189208984375, 339.3297119140625, 353.90753173828125, 368.4853515625, 383.06317138671875, 397.6410217285156, 412.2188415527344, 426.7966613769531, 441.37451171875, 455.95233154296875, 470.5301513671875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 17.0, 8.0, 6.0, 11.0, 11.0, 19.0, 20.0, 25.0, 25.0, 29.0, 32.0, 36.0, 39.0, 34.0, 51.0, 51.0, 36.0, 51.0, 36.0, 50.0, 50.0, 38.0, 45.0, 37.0, 32.0, 32.0, 25.0, 21.0, 21.0, 17.0, 19.0, 16.0, 9.0, 12.0, 6.0, 3.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.8125, -82.03515625, -79.2578125, -76.48046875, -73.703125, -70.92578125, -68.1484375, -65.37109375, -62.59375, -59.81640625, -57.0390625, -54.26171875, -51.484375, -48.70703125, -45.9296875, -43.15234375, -40.375, -37.59765625, -34.8203125, -32.04296875, -29.265625, -26.48828125, -23.7109375, -20.93359375, -18.15625, -15.37890625, -12.6015625, -9.82421875, -7.046875, -4.26953125, -1.4921875, 1.28515625, 4.0625, 6.83984375, 9.6171875, 12.39453125, 15.171875, 17.94921875, 20.7265625, 23.50390625, 26.28125, 29.05859375, 31.8359375, 34.61328125, 37.390625, 40.16796875, 42.9453125, 45.72265625, 48.5, 51.27734375, 54.0546875, 56.83203125, 59.609375, 62.38671875, 65.1640625, 67.94140625, 70.71875, 73.49609375, 76.2734375, 79.05078125, 81.828125, 84.60546875, 87.3828125, 90.16015625, 92.9375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 10.0, 19.0, 17.0, 20.0, 32.0, 33.0, 48.0, 77.0, 126.0, 177.0, 243.0, 390.0, 691.0, 1114.0, 2006.0, 3437.0, 6414.0, 11988.0, 23828.0, 50778.0, 119138.0, 345655.0, 288821.0, 103221.0, 44447.0, 21317.0, 10925.0, 5725.0, 3231.0, 1787.0, 1039.0, 624.0, 382.0, 261.0, 147.0, 114.0, 76.0, 53.0, 30.0, 45.0, 14.0, 19.0, 6.0, 4.0, 6.0, 5.0, 8.0, 0.0, 3.0, 1.0, 2.0], "bins": [-13.3125, -12.9312744140625, -12.550048828125, -12.1688232421875, -11.78759765625, -11.4063720703125, -11.025146484375, -10.6439208984375, -10.2626953125, -9.8814697265625, -9.500244140625, -9.1190185546875, -8.73779296875, -8.3565673828125, -7.975341796875, -7.5941162109375, -7.212890625, -6.8316650390625, -6.450439453125, -6.0692138671875, -5.68798828125, -5.3067626953125, -4.925537109375, -4.5443115234375, -4.1630859375, -3.7818603515625, -3.400634765625, -3.0194091796875, -2.63818359375, -2.2569580078125, -1.875732421875, -1.4945068359375, -1.11328125, -0.7320556640625, -0.350830078125, 0.0303955078125, 0.41162109375, 0.7928466796875, 1.174072265625, 1.5552978515625, 1.9365234375, 2.3177490234375, 2.698974609375, 3.0802001953125, 3.46142578125, 3.8426513671875, 4.223876953125, 4.6051025390625, 4.986328125, 5.3675537109375, 5.748779296875, 6.1300048828125, 6.51123046875, 6.8924560546875, 7.273681640625, 7.6549072265625, 8.0361328125, 8.4173583984375, 8.798583984375, 9.1798095703125, 9.56103515625, 9.9422607421875, 10.323486328125, 10.7047119140625, 11.0859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 5.0, 9.0, 10.0, 15.0, 15.0, 20.0, 20.0, 19.0, 15.0, 30.0, 31.0, 31.0, 36.0, 34.0, 38.0, 32.0, 33.0, 50.0, 38.0, 1056.0, 52.0, 54.0, 39.0, 24.0, 41.0, 31.0, 32.0, 24.0, 28.0, 25.0, 16.0, 26.0, 20.0, 14.0, 3.0, 8.0, 12.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-58.59375, -56.88134765625, -55.1689453125, -53.45654296875, -51.744140625, -50.03173828125, -48.3193359375, -46.60693359375, -44.89453125, -43.18212890625, -41.4697265625, -39.75732421875, -38.044921875, -36.33251953125, -34.6201171875, -32.90771484375, -31.1953125, -29.48291015625, -27.7705078125, -26.05810546875, -24.345703125, -22.63330078125, -20.9208984375, -19.20849609375, -17.49609375, -15.78369140625, -14.0712890625, -12.35888671875, -10.646484375, -8.93408203125, -7.2216796875, -5.50927734375, -3.796875, -2.08447265625, -0.3720703125, 1.34033203125, 3.052734375, 4.76513671875, 6.4775390625, 8.18994140625, 9.90234375, 11.61474609375, 13.3271484375, 15.03955078125, 16.751953125, 18.46435546875, 20.1767578125, 21.88916015625, 23.6015625, 25.31396484375, 27.0263671875, 28.73876953125, 30.451171875, 32.16357421875, 33.8759765625, 35.58837890625, 37.30078125, 39.01318359375, 40.7255859375, 42.43798828125, 44.150390625, 45.86279296875, 47.5751953125, 49.28759765625, 51.0]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 15.0, 16.0, 20.0, 35.0, 58.0, 61.0, 106.0, 171.0, 245.0, 364.0, 516.0, 771.0, 1192.0, 1798.0, 2739.0, 4338.0, 6710.0, 10655.0, 16938.0, 27243.0, 45345.0, 76074.0, 140036.0, 1240165.0, 255333.0, 107085.0, 61044.0, 36708.0, 22519.0, 13904.0, 8717.0, 5504.0, 3750.0, 2410.0, 1484.0, 1002.0, 693.0, 433.0, 315.0, 203.0, 139.0, 74.0, 62.0, 45.0, 37.0, 17.0, 14.0, 9.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.19921875, -4.067138671875, -3.93505859375, -3.802978515625, -3.6708984375, -3.538818359375, -3.40673828125, -3.274658203125, -3.142578125, -3.010498046875, -2.87841796875, -2.746337890625, -2.6142578125, -2.482177734375, -2.35009765625, -2.218017578125, -2.0859375, -1.953857421875, -1.82177734375, -1.689697265625, -1.5576171875, -1.425537109375, -1.29345703125, -1.161376953125, -1.029296875, -0.897216796875, -0.76513671875, -0.633056640625, -0.5009765625, -0.368896484375, -0.23681640625, -0.104736328125, 0.02734375, 0.159423828125, 0.29150390625, 0.423583984375, 0.5556640625, 0.687744140625, 0.81982421875, 0.951904296875, 1.083984375, 1.216064453125, 1.34814453125, 1.480224609375, 1.6123046875, 1.744384765625, 1.87646484375, 2.008544921875, 2.140625, 2.272705078125, 2.40478515625, 2.536865234375, 2.6689453125, 2.801025390625, 2.93310546875, 3.065185546875, 3.197265625, 3.329345703125, 3.46142578125, 3.593505859375, 3.7255859375, 3.857666015625, 3.98974609375, 4.121826171875, 4.25390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 3.0, 6.0, 11.0, 14.0, 17.0, 13.0, 21.0, 31.0, 28.0, 50.0, 98.0, 243.0, 169.0, 96.0, 51.0, 35.0, 21.0, 17.0, 10.0, 15.0, 13.0, 6.0, 8.0, 9.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93798828125, -0.9102935791015625, -0.882598876953125, -0.8549041748046875, -0.82720947265625, -0.7995147705078125, -0.771820068359375, -0.7441253662109375, -0.7164306640625, -0.6887359619140625, -0.661041259765625, -0.6333465576171875, -0.60565185546875, -0.5779571533203125, -0.550262451171875, -0.5225677490234375, -0.494873046875, -0.4671783447265625, -0.439483642578125, -0.4117889404296875, -0.38409423828125, -0.3563995361328125, -0.328704833984375, -0.3010101318359375, -0.2733154296875, -0.2456207275390625, -0.217926025390625, -0.1902313232421875, -0.16253662109375, -0.1348419189453125, -0.107147216796875, -0.0794525146484375, -0.0517578125, -0.0240631103515625, 0.003631591796875, 0.0313262939453125, 0.05902099609375, 0.0867156982421875, 0.114410400390625, 0.1421051025390625, 0.1697998046875, 0.1974945068359375, 0.225189208984375, 0.2528839111328125, 0.28057861328125, 0.3082733154296875, 0.335968017578125, 0.3636627197265625, 0.391357421875, 0.4190521240234375, 0.446746826171875, 0.4744415283203125, 0.50213623046875, 0.5298309326171875, 0.557525634765625, 0.5852203369140625, 0.6129150390625, 0.6406097412109375, 0.668304443359375, 0.6959991455078125, 0.72369384765625, 0.7513885498046875, 0.779083251953125, 0.8067779541015625, 0.83447265625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 9.0, 5.0, 13.0, 16.0, 10.0, 18.0, 24.0, 45.0, 71.0, 150.0, 586.0, 1047151.0, 185.0, 85.0, 37.0, 33.0, 25.0, 13.0, 16.0, 18.0, 9.0, 6.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.03125, -25.16796875, -24.3046875, -23.44140625, -22.578125, -21.71484375, -20.8515625, -19.98828125, -19.125, -18.26171875, -17.3984375, -16.53515625, -15.671875, -14.80859375, -13.9453125, -13.08203125, -12.21875, -11.35546875, -10.4921875, -9.62890625, -8.765625, -7.90234375, -7.0390625, -6.17578125, -5.3125, -4.44921875, -3.5859375, -2.72265625, -1.859375, -0.99609375, -0.1328125, 0.73046875, 1.59375, 2.45703125, 3.3203125, 4.18359375, 5.046875, 5.91015625, 6.7734375, 7.63671875, 8.5, 9.36328125, 10.2265625, 11.08984375, 11.953125, 12.81640625, 13.6796875, 14.54296875, 15.40625, 16.26953125, 17.1328125, 17.99609375, 18.859375, 19.72265625, 20.5859375, 21.44921875, 22.3125, 23.17578125, 24.0390625, 24.90234375, 25.765625, 26.62890625, 27.4921875, 28.35546875, 29.21875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 40.0, 961.0, 20.0], "bins": [-4.400049686431885, -4.329604625701904, -4.259159564971924, -4.188714981079102, -4.118269920349121, -4.047824859619141, -3.9773800373077393, -3.906934976577759, -3.8364901542663574, -3.766045093536377, -3.6956002712249756, -3.625155210494995, -3.5547103881835938, -3.4842653274536133, -3.413820505142212, -3.3433754444122314, -3.272930383682251, -3.2024853229522705, -3.132040500640869, -3.0615954399108887, -2.9911506175994873, -2.920705556869507, -2.8502607345581055, -2.779815673828125, -2.7093706130981445, -2.638925552368164, -2.5684807300567627, -2.4980356693267822, -2.427590847015381, -2.3571457862854004, -2.286700963973999, -2.2162559032440186, -2.145811080932617, -2.0753660202026367, -2.0049211978912354, -1.9344762563705444, -1.8640313148498535, -1.793586254119873, -1.7231413125991821, -1.6526963710784912, -1.5822515487670898, -1.511806607246399, -1.441361665725708, -1.370916724205017, -1.3004717826843262, -1.2300267219543457, -1.1595817804336548, -1.0891368389129639, -1.018691897392273, -0.948246955871582, -0.8778020143508911, -0.8073570132255554, -0.7369120717048645, -0.6664671301841736, -0.5960221290588379, -0.525577187538147, -0.4551321864128113, -0.38468724489212036, -0.31424227356910706, -0.24379731714725494, -0.17335236072540283, -0.10290741920471191, -0.03246244788169861, 0.0379825234413147, 0.10842745751142502]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 9.0, 5.0, 7.0, 8.0, 12.0, 15.0, 16.0, 20.0, 16.0, 18.0, 28.0, 24.0, 30.0, 19.0, 28.0, 17.0, 36.0, 30.0, 29.0, 24.0, 35.0, 28.0, 31.0, 38.0, 37.0, 41.0, 31.0, 49.0, 32.0, 28.0, 19.0, 22.0, 23.0, 28.0, 29.0, 18.0, 18.0, 15.0, 21.0, 13.0, 9.0, 8.0, 6.0, 7.0, 6.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.4317131042480469, -0.41850537061691284, -0.4052976369857788, -0.3920899033546448, -0.37888216972351074, -0.3656744360923767, -0.3524667024612427, -0.33925899863243103, -0.326051265001297, -0.31284353137016296, -0.29963579773902893, -0.2864280641078949, -0.27322033047676086, -0.2600126266479492, -0.246804878115654, -0.23359715938568115, -0.22038941085338593, -0.2071816772222519, -0.19397394359111786, -0.18076622486114502, -0.167558491230011, -0.15435075759887695, -0.14114302396774292, -0.1279352903366089, -0.11472756415605545, -0.10151983052492142, -0.08831210434436798, -0.07510437071323395, -0.06189664080739021, -0.04868891090154648, -0.035481177270412445, -0.02227345108985901, -0.009065717458724976, 0.004142013378441334, 0.017349744215607643, 0.030557475984096527, 0.04376520588994026, 0.056972935795784, 0.07018066942691803, 0.08338839560747147, 0.0965961292386055, 0.10980386286973953, 0.12301158905029297, 0.136219322681427, 0.14942705631256104, 0.16263478994369507, 0.1758425235748291, 0.18905024230480194, 0.20225797593593597, 0.21546570956707, 0.22867344319820404, 0.24188116192817688, 0.2550888955593109, 0.26829662919044495, 0.281504362821579, 0.294712096452713, 0.30791983008384705, 0.3211275637149811, 0.3343352973461151, 0.34754303097724915, 0.3607507646083832, 0.3739584684371948, 0.38716620206832886, 0.4003739356994629, 0.4135816693305969]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 17.0, 8.0, 6.0, 11.0, 11.0, 19.0, 20.0, 25.0, 25.0, 29.0, 32.0, 36.0, 39.0, 34.0, 51.0, 51.0, 36.0, 51.0, 36.0, 50.0, 50.0, 38.0, 45.0, 37.0, 32.0, 32.0, 25.0, 21.0, 21.0, 17.0, 19.0, 16.0, 9.0, 12.0, 6.0, 3.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.8125, -82.03515625, -79.2578125, -76.48046875, -73.703125, -70.92578125, -68.1484375, -65.37109375, -62.59375, -59.81640625, -57.0390625, -54.26171875, -51.484375, -48.70703125, -45.9296875, -43.15234375, -40.375, -37.59765625, -34.8203125, -32.04296875, -29.265625, -26.48828125, -23.7109375, -20.93359375, -18.15625, -15.37890625, -12.6015625, -9.82421875, -7.046875, -4.26953125, -1.4921875, 1.28515625, 4.0625, 6.83984375, 9.6171875, 12.39453125, 15.171875, 17.94921875, 20.7265625, 23.50390625, 26.28125, 29.05859375, 31.8359375, 34.61328125, 37.390625, 40.16796875, 42.9453125, 45.72265625, 48.5, 51.27734375, 54.0546875, 56.83203125, 59.609375, 62.38671875, 65.1640625, 67.94140625, 70.71875, 73.49609375, 76.2734375, 79.05078125, 81.828125, 84.60546875, 87.3828125, 90.16015625, 92.9375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 4.0, 11.0, 23.0, 26.0, 32.0, 34.0, 69.0, 103.0, 119.0, 162.0, 236.0, 361.0, 453.0, 697.0, 1046.0, 1560.0, 2557.0, 4744.0, 9950.0, 48798.0, 899165.0, 55561.0, 10247.0, 4794.0, 2715.0, 1629.0, 1081.0, 697.0, 476.0, 329.0, 229.0, 189.0, 121.0, 103.0, 61.0, 38.0, 40.0, 25.0, 16.0, 15.0, 9.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.25, -159.8359375, -154.421875, -149.0078125, -143.59375, -138.1796875, -132.765625, -127.3515625, -121.9375, -116.5234375, -111.109375, -105.6953125, -100.28125, -94.8671875, -89.453125, -84.0390625, -78.625, -73.2109375, -67.796875, -62.3828125, -56.96875, -51.5546875, -46.140625, -40.7265625, -35.3125, -29.8984375, -24.484375, -19.0703125, -13.65625, -8.2421875, -2.828125, 2.5859375, 8.0, 13.4140625, 18.828125, 24.2421875, 29.65625, 35.0703125, 40.484375, 45.8984375, 51.3125, 56.7265625, 62.140625, 67.5546875, 72.96875, 78.3828125, 83.796875, 89.2109375, 94.625, 100.0390625, 105.453125, 110.8671875, 116.28125, 121.6953125, 127.109375, 132.5234375, 137.9375, 143.3515625, 148.765625, 154.1796875, 159.59375, 165.0078125, 170.421875, 175.8359375, 181.25]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 8.0, 9.0, 9.0, 15.0, 11.0, 7.0, 12.0, 23.0, 34.0, 35.0, 25.0, 46.0, 49.0, 44.0, 36.0, 62.0, 115.0, 1960.0, 114.0, 63.0, 63.0, 36.0, 42.0, 39.0, 36.0, 37.0, 25.0, 22.0, 13.0, 11.0, 16.0, 9.0, 7.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-344.25, -333.98046875, -323.7109375, -313.44140625, -303.171875, -292.90234375, -282.6328125, -272.36328125, -262.09375, -251.82421875, -241.5546875, -231.28515625, -221.015625, -210.74609375, -200.4765625, -190.20703125, -179.9375, -169.66796875, -159.3984375, -149.12890625, -138.859375, -128.58984375, -118.3203125, -108.05078125, -97.78125, -87.51171875, -77.2421875, -66.97265625, -56.703125, -46.43359375, -36.1640625, -25.89453125, -15.625, -5.35546875, 4.9140625, 15.18359375, 25.453125, 35.72265625, 45.9921875, 56.26171875, 66.53125, 76.80078125, 87.0703125, 97.33984375, 107.609375, 117.87890625, 128.1484375, 138.41796875, 148.6875, 158.95703125, 169.2265625, 179.49609375, 189.765625, 200.03515625, 210.3046875, 220.57421875, 230.84375, 241.11328125, 251.3828125, 261.65234375, 271.921875, 282.19140625, 292.4609375, 302.73046875, 313.0]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 6.0, 11.0, 11.0, 18.0, 14.0, 22.0, 27.0, 34.0, 52.0, 61.0, 98.0, 186.0, 452.0, 1391.0, 6558.0, 2975274.0, 154694.0, 4763.0, 1088.0, 362.0, 192.0, 95.0, 65.0, 56.0, 39.0, 34.0, 18.0, 7.0, 14.0, 14.0, 5.0, 16.0, 9.0, 8.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-704.0, -681.2265625, -658.453125, -635.6796875, -612.90625, -590.1328125, -567.359375, -544.5859375, -521.8125, -499.0390625, -476.265625, -453.4921875, -430.71875, -407.9453125, -385.171875, -362.3984375, -339.625, -316.8515625, -294.078125, -271.3046875, -248.53125, -225.7578125, -202.984375, -180.2109375, -157.4375, -134.6640625, -111.890625, -89.1171875, -66.34375, -43.5703125, -20.796875, 1.9765625, 24.75, 47.5234375, 70.296875, 93.0703125, 115.84375, 138.6171875, 161.390625, 184.1640625, 206.9375, 229.7109375, 252.484375, 275.2578125, 298.03125, 320.8046875, 343.578125, 366.3515625, 389.125, 411.8984375, 434.671875, 457.4453125, 480.21875, 502.9921875, 525.765625, 548.5390625, 571.3125, 594.0859375, 616.859375, 639.6328125, 662.40625, 685.1796875, 707.953125, 730.7265625, 753.5]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 12.0, 23.0, 28.0, 40.0, 60.0, 108.0, 130.0, 138.0, 139.0, 105.0, 74.0, 51.0, 26.0, 22.0, 10.0, 15.0, 5.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.393310546875, -168.86355590820312, -161.3338165283203, -153.80406188964844, -146.27432250976562, -138.74456787109375, -131.21481323242188, -123.68507385253906, -116.15532684326172, -108.62557983398438, -101.09583282470703, -93.56608581542969, -86.03633117675781, -78.506591796875, -70.97683715820312, -63.44709014892578, -55.91734313964844, -48.387596130371094, -40.85784912109375, -33.32809829711914, -25.798351287841797, -18.268604278564453, -10.738853454589844, -3.2091064453125, 4.320640563964844, 11.850388526916504, 19.380136489868164, 26.90988540649414, 34.439632415771484, 41.96937942504883, 49.49913024902344, 57.02887725830078, 64.55862426757812, 72.08837127685547, 79.61811828613281, 87.14787292480469, 94.6776123046875, 102.20736694335938, 109.73711395263672, 117.26686096191406, 124.7966079711914, 132.32635498046875, 139.85610961914062, 147.38584899902344, 154.9156036376953, 162.44534301757812, 169.97509765625, 177.50485229492188, 185.0345916748047, 192.56434631347656, 200.09408569335938, 207.62384033203125, 215.15357971191406, 222.68333435058594, 230.21307373046875, 237.74282836914062, 245.2725830078125, 252.80233764648438, 260.33209228515625, 267.86181640625, 275.3915710449219, 282.92132568359375, 290.4510803222656, 297.9808349609375, 305.51055908203125]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 3.0, 9.0, 12.0, 13.0, 18.0, 14.0, 22.0, 31.0, 18.0, 19.0, 24.0, 34.0, 32.0, 34.0, 35.0, 37.0, 40.0, 39.0, 44.0, 37.0, 44.0, 50.0, 39.0, 33.0, 31.0, 38.0, 29.0, 32.0, 25.0, 19.0, 23.0, 24.0, 12.0, 21.0, 15.0, 10.0, 9.0, 9.0, 2.0, 3.0, 4.0, 7.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-676.5153198242188, -655.5403442382812, -634.5654296875, -613.5904541015625, -592.6155395507812, -571.6405639648438, -550.6656494140625, -529.690673828125, -508.7156982421875, -487.7407531738281, -466.76580810546875, -445.79083251953125, -424.8158874511719, -403.8409423828125, -382.8659973144531, -361.89105224609375, -340.9161071777344, -319.941162109375, -298.9662170410156, -277.99127197265625, -257.01629638671875, -236.04135131835938, -215.06640625, -194.09144592285156, -173.1165008544922, -152.1415557861328, -131.16659545898438, -110.191650390625, -89.2166976928711, -68.24174499511719, -47.26679992675781, -26.291839599609375, -5.31689453125, 15.658056259155273, 36.63300704956055, 57.60795593261719, 78.5829086303711, 99.557861328125, 120.53280639648438, 141.5077667236328, 162.4827117919922, 183.45765686035156, 204.4326171875, 225.40756225585938, 246.38250732421875, 267.35748291015625, 288.3323974609375, 309.307373046875, 330.2823181152344, 351.25726318359375, 372.2322082519531, 393.2071533203125, 414.18212890625, 435.1570739746094, 456.13201904296875, 477.10699462890625, 498.0819091796875, 519.056884765625, 540.0317993164062, 561.0067749023438, 581.981689453125, 602.9566650390625, 623.931640625, 644.9065551757812, 665.8815307617188]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 0.0, 4.0, 5.0, 6.0, 8.0, 6.0, 7.0, 10.0, 11.0, 14.0, 15.0, 18.0, 26.0, 20.0, 31.0, 29.0, 25.0, 35.0, 34.0, 35.0, 44.0, 51.0, 46.0, 37.0, 46.0, 43.0, 47.0, 44.0, 40.0, 32.0, 38.0, 24.0, 27.0, 26.0, 17.0, 26.0, 13.0, 14.0, 7.0, 9.0, 10.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.5625, -83.798828125, -81.03515625, -78.271484375, -75.5078125, -72.744140625, -69.98046875, -67.216796875, -64.453125, -61.689453125, -58.92578125, -56.162109375, -53.3984375, -50.634765625, -47.87109375, -45.107421875, -42.34375, -39.580078125, -36.81640625, -34.052734375, -31.2890625, -28.525390625, -25.76171875, -22.998046875, -20.234375, -17.470703125, -14.70703125, -11.943359375, -9.1796875, -6.416015625, -3.65234375, -0.888671875, 1.875, 4.638671875, 7.40234375, 10.166015625, 12.9296875, 15.693359375, 18.45703125, 21.220703125, 23.984375, 26.748046875, 29.51171875, 32.275390625, 35.0390625, 37.802734375, 40.56640625, 43.330078125, 46.09375, 48.857421875, 51.62109375, 54.384765625, 57.1484375, 59.912109375, 62.67578125, 65.439453125, 68.203125, 70.966796875, 73.73046875, 76.494140625, 79.2578125, 82.021484375, 84.78515625, 87.548828125, 90.3125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 11.0, 16.0, 19.0, 22.0, 24.0, 62.0, 87.0, 135.0, 219.0, 285.0, 426.0, 613.0, 883.0, 1393.0, 2106.0, 3409.0, 5554.0, 9771.0, 18524.0, 51122.0, 439481.0, 3046692.0, 507892.0, 59987.0, 19450.0, 10224.0, 5835.0, 3493.0, 2136.0, 1445.0, 896.0, 630.0, 442.0, 329.0, 230.0, 144.0, 90.0, 44.0, 39.0, 33.0, 26.0, 20.0, 13.0, 10.0, 11.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-153.125, -148.109375, -143.09375, -138.078125, -133.0625, -128.046875, -123.03125, -118.015625, -113.0, -107.984375, -102.96875, -97.953125, -92.9375, -87.921875, -82.90625, -77.890625, -72.875, -67.859375, -62.84375, -57.828125, -52.8125, -47.796875, -42.78125, -37.765625, -32.75, -27.734375, -22.71875, -17.703125, -12.6875, -7.671875, -2.65625, 2.359375, 7.375, 12.390625, 17.40625, 22.421875, 27.4375, 32.453125, 37.46875, 42.484375, 47.5, 52.515625, 57.53125, 62.546875, 67.5625, 72.578125, 77.59375, 82.609375, 87.625, 92.640625, 97.65625, 102.671875, 107.6875, 112.703125, 117.71875, 122.734375, 127.75, 132.765625, 137.78125, 142.796875, 147.8125, 152.828125, 157.84375, 162.859375, 167.875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 2.0, 5.0, 10.0, 12.0, 11.0, 9.0, 13.0, 27.0, 27.0, 39.0, 53.0, 93.0, 183.0, 323.0, 706.0, 1104.0, 656.0, 336.0, 151.0, 88.0, 62.0, 32.0, 25.0, 24.0, 16.0, 12.0, 8.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-231.0, -224.666015625, -218.33203125, -211.998046875, -205.6640625, -199.330078125, -192.99609375, -186.662109375, -180.328125, -173.994140625, -167.66015625, -161.326171875, -154.9921875, -148.658203125, -142.32421875, -135.990234375, -129.65625, -123.322265625, -116.98828125, -110.654296875, -104.3203125, -97.986328125, -91.65234375, -85.318359375, -78.984375, -72.650390625, -66.31640625, -59.982421875, -53.6484375, -47.314453125, -40.98046875, -34.646484375, -28.3125, -21.978515625, -15.64453125, -9.310546875, -2.9765625, 3.357421875, 9.69140625, 16.025390625, 22.359375, 28.693359375, 35.02734375, 41.361328125, 47.6953125, 54.029296875, 60.36328125, 66.697265625, 73.03125, 79.365234375, 85.69921875, 92.033203125, 98.3671875, 104.701171875, 111.03515625, 117.369140625, 123.703125, 130.037109375, 136.37109375, 142.705078125, 149.0390625, 155.373046875, 161.70703125, 168.041015625, 174.375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 4.0, 5.0, 11.0, 12.0, 19.0, 28.0, 31.0, 44.0, 70.0, 95.0, 147.0, 259.0, 442.0, 958.0, 2227.0, 6264.0, 20727.0, 112391.0, 3811048.0, 198400.0, 27993.0, 7950.0, 2690.0, 1133.0, 552.0, 273.0, 168.0, 94.0, 73.0, 47.0, 40.0, 21.0, 14.0, 12.0, 14.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-412.75, -397.23828125, -381.7265625, -366.21484375, -350.703125, -335.19140625, -319.6796875, -304.16796875, -288.65625, -273.14453125, -257.6328125, -242.12109375, -226.609375, -211.09765625, -195.5859375, -180.07421875, -164.5625, -149.05078125, -133.5390625, -118.02734375, -102.515625, -87.00390625, -71.4921875, -55.98046875, -40.46875, -24.95703125, -9.4453125, 6.06640625, 21.578125, 37.08984375, 52.6015625, 68.11328125, 83.625, 99.13671875, 114.6484375, 130.16015625, 145.671875, 161.18359375, 176.6953125, 192.20703125, 207.71875, 223.23046875, 238.7421875, 254.25390625, 269.765625, 285.27734375, 300.7890625, 316.30078125, 331.8125, 347.32421875, 362.8359375, 378.34765625, 393.859375, 409.37109375, 424.8828125, 440.39453125, 455.90625, 471.41796875, 486.9296875, 502.44140625, 517.953125, 533.46484375, 548.9765625, 564.48828125, 580.0]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 31.0, 178.0, 537.0, 215.0, 34.0, 9.0, 3.0], "bins": [-5717.24072265625, -5621.240234375, -5525.23974609375, -5429.2392578125, -5333.23876953125, -5237.23828125, -5141.2373046875, -5045.2373046875, -4949.236328125, -4853.23583984375, -4757.2353515625, -4661.23486328125, -4565.234375, -4469.23388671875, -4373.2333984375, -4277.232421875, -4181.232421875, -4085.23193359375, -3989.2314453125, -3893.23095703125, -3797.230224609375, -3701.229736328125, -3605.229248046875, -3509.228759765625, -3413.22802734375, -3317.2275390625, -3221.22705078125, -3125.2265625, -3029.225830078125, -2933.225341796875, -2837.224853515625, -2741.224365234375, -2645.223876953125, -2549.223388671875, -2453.222900390625, -2357.22216796875, -2261.2216796875, -2165.22119140625, -2069.220703125, -1973.22021484375, -1877.2196044921875, -1781.2191162109375, -1685.218505859375, -1589.218017578125, -1493.217529296875, -1397.217041015625, -1301.2164306640625, -1205.2159423828125, -1109.2154541015625, -1013.2149047851562, -917.2144165039062, -821.2138671875, -725.21337890625, -629.2128295898438, -533.2122802734375, -437.2117919921875, -341.2112121582031, -245.210693359375, -149.2101593017578, -53.209625244140625, 42.7908935546875, 138.79141235351562, 234.79196166992188, 330.7924499511719, 426.7929992675781]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 10.0, 9.0, 15.0, 10.0, 15.0, 17.0, 17.0, 24.0, 27.0, 32.0, 33.0, 34.0, 40.0, 26.0, 40.0, 34.0, 44.0, 48.0, 41.0, 51.0, 39.0, 39.0, 36.0, 37.0, 40.0, 45.0, 24.0, 20.0, 30.0, 23.0, 22.0, 15.0, 11.0, 9.0, 9.0, 5.0, 8.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-530.5936889648438, -514.7981567382812, -499.0025939941406, -483.20703125, -467.4114990234375, -451.6159362792969, -435.82037353515625, -420.02484130859375, -404.22930908203125, -388.4337463378906, -372.6382141113281, -356.8426513671875, -341.047119140625, -325.2515563964844, -309.45599365234375, -293.66046142578125, -277.8648986816406, -262.0693359375, -246.2738037109375, -230.47824096679688, -214.68270874023438, -198.88714599609375, -183.0915985107422, -167.29605102539062, -151.50050354003906, -135.7049560546875, -119.90940856933594, -104.11385345458984, -88.31830596923828, -72.52275848388672, -56.727203369140625, -40.93165588378906, -25.1361083984375, -9.340559005737305, 6.454990386962891, 22.25054168701172, 38.04608917236328, 53.841636657714844, 69.63719177246094, 85.4327392578125, 101.22828674316406, 117.02383422851562, 132.8193817138672, 148.61492919921875, 164.41049194335938, 180.20602416992188, 196.0015869140625, 211.79713439941406, 227.59268188476562, 243.3882293701172, 259.18377685546875, 274.9793395996094, 290.7748718261719, 306.5704345703125, 322.365966796875, 338.1615295410156, 353.95709228515625, 369.7526550292969, 385.5481872558594, 401.34375, 417.1392822265625, 432.9348449707031, 448.73040771484375, 464.52593994140625, 480.32147216796875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 4.0, 5.0, 14.0, 14.0, 9.0, 12.0, 12.0, 17.0, 23.0, 19.0, 24.0, 24.0, 26.0, 37.0, 43.0, 33.0, 34.0, 41.0, 34.0, 39.0, 51.0, 32.0, 42.0, 38.0, 40.0, 45.0, 40.0, 33.0, 28.0, 32.0, 27.0, 17.0, 25.0, 18.0, 9.0, 10.0, 9.0, 5.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-81.375, -78.7626953125, -76.150390625, -73.5380859375, -70.92578125, -68.3134765625, -65.701171875, -63.0888671875, -60.4765625, -57.8642578125, -55.251953125, -52.6396484375, -50.02734375, -47.4150390625, -44.802734375, -42.1904296875, -39.578125, -36.9658203125, -34.353515625, -31.7412109375, -29.12890625, -26.5166015625, -23.904296875, -21.2919921875, -18.6796875, -16.0673828125, -13.455078125, -10.8427734375, -8.23046875, -5.6181640625, -3.005859375, -0.3935546875, 2.21875, 4.8310546875, 7.443359375, 10.0556640625, 12.66796875, 15.2802734375, 17.892578125, 20.5048828125, 23.1171875, 25.7294921875, 28.341796875, 30.9541015625, 33.56640625, 36.1787109375, 38.791015625, 41.4033203125, 44.015625, 46.6279296875, 49.240234375, 51.8525390625, 54.46484375, 57.0771484375, 59.689453125, 62.3017578125, 64.9140625, 67.5263671875, 70.138671875, 72.7509765625, 75.36328125, 77.9755859375, 80.587890625, 83.2001953125, 85.8125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 16.0, 13.0, 15.0, 28.0, 36.0, 60.0, 109.0, 110.0, 216.0, 372.0, 651.0, 1101.0, 2099.0, 3972.0, 7918.0, 16104.0, 33571.0, 74333.0, 181069.0, 405177.0, 180365.0, 74389.0, 34012.0, 16052.0, 7964.0, 3939.0, 2114.0, 1128.0, 626.0, 377.0, 213.0, 136.0, 93.0, 61.0, 31.0, 25.0, 22.0, 12.0, 7.0, 6.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.5706787109375, -10.235107421875, -9.8995361328125, -9.56396484375, -9.2283935546875, -8.892822265625, -8.5572509765625, -8.2216796875, -7.8861083984375, -7.550537109375, -7.2149658203125, -6.87939453125, -6.5438232421875, -6.208251953125, -5.8726806640625, -5.537109375, -5.2015380859375, -4.865966796875, -4.5303955078125, -4.19482421875, -3.8592529296875, -3.523681640625, -3.1881103515625, -2.8525390625, -2.5169677734375, -2.181396484375, -1.8458251953125, -1.51025390625, -1.1746826171875, -0.839111328125, -0.5035400390625, -0.16796875, 0.1676025390625, 0.503173828125, 0.8387451171875, 1.17431640625, 1.5098876953125, 1.845458984375, 2.1810302734375, 2.5166015625, 2.8521728515625, 3.187744140625, 3.5233154296875, 3.85888671875, 4.1944580078125, 4.530029296875, 4.8656005859375, 5.201171875, 5.5367431640625, 5.872314453125, 6.2078857421875, 6.54345703125, 6.8790283203125, 7.214599609375, 7.5501708984375, 7.8857421875, 8.2213134765625, 8.556884765625, 8.8924560546875, 9.22802734375, 9.5635986328125, 9.899169921875, 10.2347412109375, 10.5703125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 4.0, 1.0, 10.0, 5.0, 11.0, 9.0, 11.0, 15.0, 10.0, 21.0, 16.0, 28.0, 12.0, 24.0, 21.0, 40.0, 26.0, 19.0, 39.0, 35.0, 46.0, 39.0, 30.0, 1063.0, 41.0, 39.0, 48.0, 42.0, 41.0, 29.0, 28.0, 27.0, 30.0, 23.0, 21.0, 25.0, 15.0, 16.0, 11.0, 8.0, 14.0, 9.0, 8.0, 6.0, 5.0, 1.0, 6.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-61.125, -59.40478515625, -57.6845703125, -55.96435546875, -54.244140625, -52.52392578125, -50.8037109375, -49.08349609375, -47.36328125, -45.64306640625, -43.9228515625, -42.20263671875, -40.482421875, -38.76220703125, -37.0419921875, -35.32177734375, -33.6015625, -31.88134765625, -30.1611328125, -28.44091796875, -26.720703125, -25.00048828125, -23.2802734375, -21.56005859375, -19.83984375, -18.11962890625, -16.3994140625, -14.67919921875, -12.958984375, -11.23876953125, -9.5185546875, -7.79833984375, -6.078125, -4.35791015625, -2.6376953125, -0.91748046875, 0.802734375, 2.52294921875, 4.2431640625, 5.96337890625, 7.68359375, 9.40380859375, 11.1240234375, 12.84423828125, 14.564453125, 16.28466796875, 18.0048828125, 19.72509765625, 21.4453125, 23.16552734375, 24.8857421875, 26.60595703125, 28.326171875, 30.04638671875, 31.7666015625, 33.48681640625, 35.20703125, 36.92724609375, 38.6474609375, 40.36767578125, 42.087890625, 43.80810546875, 45.5283203125, 47.24853515625, 48.96875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 10.0, 12.0, 23.0, 29.0, 33.0, 70.0, 67.0, 137.0, 173.0, 279.0, 377.0, 549.0, 863.0, 1323.0, 1948.0, 3006.0, 4666.0, 7256.0, 11450.0, 18164.0, 29952.0, 50996.0, 89540.0, 172562.0, 1323332.0, 166077.0, 86488.0, 49299.0, 29167.0, 17767.0, 11082.0, 6975.0, 4547.0, 2973.0, 1944.0, 1323.0, 887.0, 609.0, 378.0, 238.0, 183.0, 117.0, 86.0, 61.0, 38.0, 21.0, 20.0, 13.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.3125, -4.17547607421875, -4.0384521484375, -3.90142822265625, -3.764404296875, -3.62738037109375, -3.4903564453125, -3.35333251953125, -3.21630859375, -3.07928466796875, -2.9422607421875, -2.80523681640625, -2.668212890625, -2.53118896484375, -2.3941650390625, -2.25714111328125, -2.1201171875, -1.98309326171875, -1.8460693359375, -1.70904541015625, -1.572021484375, -1.43499755859375, -1.2979736328125, -1.16094970703125, -1.02392578125, -0.88690185546875, -0.7498779296875, -0.61285400390625, -0.475830078125, -0.33880615234375, -0.2017822265625, -0.06475830078125, 0.072265625, 0.20928955078125, 0.3463134765625, 0.48333740234375, 0.620361328125, 0.75738525390625, 0.8944091796875, 1.03143310546875, 1.16845703125, 1.30548095703125, 1.4425048828125, 1.57952880859375, 1.716552734375, 1.85357666015625, 1.9906005859375, 2.12762451171875, 2.2646484375, 2.40167236328125, 2.5386962890625, 2.67572021484375, 2.812744140625, 2.94976806640625, 3.0867919921875, 3.22381591796875, 3.36083984375, 3.49786376953125, 3.6348876953125, 3.77191162109375, 3.908935546875, 4.04595947265625, 4.1829833984375, 4.32000732421875, 4.45703125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 11.0, 7.0, 11.0, 14.0, 12.0, 12.0, 11.0, 20.0, 24.0, 27.0, 32.0, 77.0, 147.0, 189.0, 118.0, 54.0, 41.0, 24.0, 25.0, 15.0, 15.0, 14.0, 5.0, 11.0, 10.0, 8.0, 11.0, 7.0, 4.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.251708984375, -0.24391746520996094, -0.23612594604492188, -0.2283344268798828, -0.22054290771484375, -0.2127513885498047, -0.20495986938476562, -0.19716835021972656, -0.1893768310546875, -0.18158531188964844, -0.17379379272460938, -0.1660022735595703, -0.15821075439453125, -0.1504192352294922, -0.14262771606445312, -0.13483619689941406, -0.127044677734375, -0.11925315856933594, -0.11146163940429688, -0.10367012023925781, -0.09587860107421875, -0.08808708190917969, -0.08029556274414062, -0.07250404357910156, -0.0647125244140625, -0.05692100524902344, -0.049129486083984375, -0.04133796691894531, -0.03354644775390625, -0.025754928588867188, -0.017963409423828125, -0.010171890258789062, -0.00238037109375, 0.0054111480712890625, 0.013202667236328125, 0.020994186401367188, 0.02878570556640625, 0.03657722473144531, 0.044368743896484375, 0.05216026306152344, 0.0599517822265625, 0.06774330139160156, 0.07553482055664062, 0.08332633972167969, 0.09111785888671875, 0.09890937805175781, 0.10670089721679688, 0.11449241638183594, 0.122283935546875, 0.13007545471191406, 0.13786697387695312, 0.1456584930419922, 0.15345001220703125, 0.1612415313720703, 0.16903305053710938, 0.17682456970214844, 0.1846160888671875, 0.19240760803222656, 0.20019912719726562, 0.2079906463623047, 0.21578216552734375, 0.2235736846923828, 0.23136520385742188, 0.23915672302246094, 0.2469482421875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 4.0, 7.0, 9.0, 9.0, 7.0, 14.0, 6.0, 13.0, 15.0, 18.0, 30.0, 46.0, 68.0, 103.0, 214.0, 1047083.0, 488.0, 123.0, 79.0, 38.0, 33.0, 20.0, 15.0, 11.0, 15.0, 10.0, 11.0, 6.0, 11.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.6796875, -7.44482421875, -7.2099609375, -6.97509765625, -6.740234375, -6.50537109375, -6.2705078125, -6.03564453125, -5.80078125, -5.56591796875, -5.3310546875, -5.09619140625, -4.861328125, -4.62646484375, -4.3916015625, -4.15673828125, -3.921875, -3.68701171875, -3.4521484375, -3.21728515625, -2.982421875, -2.74755859375, -2.5126953125, -2.27783203125, -2.04296875, -1.80810546875, -1.5732421875, -1.33837890625, -1.103515625, -0.86865234375, -0.6337890625, -0.39892578125, -0.1640625, 0.07080078125, 0.3056640625, 0.54052734375, 0.775390625, 1.01025390625, 1.2451171875, 1.47998046875, 1.71484375, 1.94970703125, 2.1845703125, 2.41943359375, 2.654296875, 2.88916015625, 3.1240234375, 3.35888671875, 3.59375, 3.82861328125, 4.0634765625, 4.29833984375, 4.533203125, 4.76806640625, 5.0029296875, 5.23779296875, 5.47265625, 5.70751953125, 5.9423828125, 6.17724609375, 6.412109375, 6.64697265625, 6.8818359375, 7.11669921875, 7.3515625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 49.0, 817.0, 140.0, 10.0, 1.0], "bins": [-1.6375054121017456, -1.6105188131332397, -1.5835323333740234, -1.5565457344055176, -1.5295592546463013, -1.5025726556777954, -1.475586175918579, -1.4485995769500732, -1.421613097190857, -1.394626498222351, -1.3676400184631348, -1.340653419494629, -1.3136669397354126, -1.2866803407669067, -1.2596938610076904, -1.2327072620391846, -1.2057206630706787, -1.1787340641021729, -1.1517475843429565, -1.1247609853744507, -1.0977745056152344, -1.0707879066467285, -1.0438014268875122, -1.0168148279190063, -0.98982834815979, -0.962841808795929, -0.9358552694320679, -0.9088687300682068, -0.8818821907043457, -0.8548956513404846, -0.8279091119766235, -0.8009225130081177, -0.7739360332489014, -0.7469494938850403, -0.7199629545211792, -0.6929764151573181, -0.665989875793457, -0.639003336429596, -0.6120167970657349, -0.585030198097229, -0.5580437183380127, -0.5310571789741516, -0.5040706396102905, -0.47708410024642944, -0.45009756088256836, -0.4231110215187073, -0.3961244523525238, -0.3691379129886627, -0.34215137362480164, -0.31516483426094055, -0.28817829489707947, -0.261191725730896, -0.2342052012681961, -0.20721866190433502, -0.18023210763931274, -0.15324556827545166, -0.12625902891159058, -0.09927248954772949, -0.07228594273328781, -0.04529939591884613, -0.018312856554985046, 0.008673682808876038, 0.035660237073898315, 0.0626467764377594, 0.08963332325220108]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 0.0, 5.0, 6.0, 6.0, 7.0, 5.0, 8.0, 11.0, 10.0, 11.0, 13.0, 13.0, 30.0, 22.0, 20.0, 26.0, 28.0, 43.0, 21.0, 38.0, 28.0, 41.0, 22.0, 42.0, 39.0, 48.0, 48.0, 53.0, 36.0, 31.0, 28.0, 29.0, 34.0, 26.0, 24.0, 32.0, 23.0, 15.0, 10.0, 12.0, 6.0, 10.0, 8.0, 6.0, 7.0, 7.0, 3.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.3662654161453247, -0.35448646545410156, -0.3427075147628784, -0.3309285640716553, -0.3191496431827545, -0.30737069249153137, -0.2955917418003082, -0.2838127911090851, -0.2720338702201843, -0.2602549195289612, -0.24847598373889923, -0.2366970330476761, -0.22491809725761414, -0.213139146566391, -0.20136019587516785, -0.1895812451839447, -0.17780229449272156, -0.1660233438014984, -0.15424440801143646, -0.14246545732021332, -0.13068652153015137, -0.11890757083892822, -0.10712862014770508, -0.09534967690706253, -0.08357073366641998, -0.07179179042577744, -0.06001284345984459, -0.04823389649391174, -0.036454953253269196, -0.024676010012626648, -0.012897059321403503, -0.0011181160807609558, 0.010660827159881592, 0.02243977226316929, 0.034218717366456985, 0.04599766433238983, 0.05777660757303238, 0.06955555081367493, 0.08133450150489807, 0.09311344474554062, 0.10489238798618317, 0.11667133122682571, 0.12845027446746826, 0.1402292251586914, 0.15200817584991455, 0.1637871116399765, 0.17556606233119965, 0.1873449981212616, 0.19912394881248474, 0.21090289950370789, 0.22268183529376984, 0.23446078598499298, 0.24623972177505493, 0.2580186724662781, 0.2697976231575012, 0.28157657384872437, 0.2933555245399475, 0.30513447523117065, 0.3169134259223938, 0.32869237661361694, 0.3404712975025177, 0.35225024819374084, 0.364029198884964, 0.37580814957618713, 0.3875870704650879]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 4.0, 5.0, 14.0, 14.0, 9.0, 12.0, 12.0, 17.0, 23.0, 19.0, 24.0, 24.0, 26.0, 37.0, 43.0, 33.0, 34.0, 41.0, 34.0, 39.0, 51.0, 32.0, 42.0, 38.0, 40.0, 45.0, 40.0, 33.0, 28.0, 32.0, 27.0, 17.0, 25.0, 18.0, 9.0, 10.0, 9.0, 5.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-81.375, -78.7626953125, -76.150390625, -73.5380859375, -70.92578125, -68.3134765625, -65.701171875, -63.0888671875, -60.4765625, -57.8642578125, -55.251953125, -52.6396484375, -50.02734375, -47.4150390625, -44.802734375, -42.1904296875, -39.578125, -36.9658203125, -34.353515625, -31.7412109375, -29.12890625, -26.5166015625, -23.904296875, -21.2919921875, -18.6796875, -16.0673828125, -13.455078125, -10.8427734375, -8.23046875, -5.6181640625, -3.005859375, -0.3935546875, 2.21875, 4.8310546875, 7.443359375, 10.0556640625, 12.66796875, 15.2802734375, 17.892578125, 20.5048828125, 23.1171875, 25.7294921875, 28.341796875, 30.9541015625, 33.56640625, 36.1787109375, 38.791015625, 41.4033203125, 44.015625, 46.6279296875, 49.240234375, 51.8525390625, 54.46484375, 57.0771484375, 59.689453125, 62.3017578125, 64.9140625, 67.5263671875, 70.138671875, 72.7509765625, 75.36328125, 77.9755859375, 80.587890625, 83.2001953125, 85.8125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 3.0, 4.0, 7.0, 8.0, 16.0, 10.0, 17.0, 24.0, 32.0, 43.0, 48.0, 74.0, 84.0, 146.0, 189.0, 278.0, 442.0, 669.0, 1092.0, 1963.0, 3368.0, 6643.0, 13776.0, 33703.0, 198790.0, 702714.0, 48399.0, 17717.0, 8137.0, 4159.0, 2256.0, 1321.0, 807.0, 512.0, 345.0, 231.0, 131.0, 130.0, 79.0, 46.0, 38.0, 26.0, 17.0, 15.0, 15.0, 13.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-189.0, -182.93359375, -176.8671875, -170.80078125, -164.734375, -158.66796875, -152.6015625, -146.53515625, -140.46875, -134.40234375, -128.3359375, -122.26953125, -116.203125, -110.13671875, -104.0703125, -98.00390625, -91.9375, -85.87109375, -79.8046875, -73.73828125, -67.671875, -61.60546875, -55.5390625, -49.47265625, -43.40625, -37.33984375, -31.2734375, -25.20703125, -19.140625, -13.07421875, -7.0078125, -0.94140625, 5.125, 11.19140625, 17.2578125, 23.32421875, 29.390625, 35.45703125, 41.5234375, 47.58984375, 53.65625, 59.72265625, 65.7890625, 71.85546875, 77.921875, 83.98828125, 90.0546875, 96.12109375, 102.1875, 108.25390625, 114.3203125, 120.38671875, 126.453125, 132.51953125, 138.5859375, 144.65234375, 150.71875, 156.78515625, 162.8515625, 168.91796875, 174.984375, 181.05078125, 187.1171875, 193.18359375, 199.25]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 7.0, 5.0, 9.0, 10.0, 13.0, 15.0, 16.0, 16.0, 26.0, 31.0, 27.0, 40.0, 46.0, 42.0, 51.0, 77.0, 89.0, 136.0, 1745.0, 125.0, 86.0, 51.0, 51.0, 44.0, 28.0, 41.0, 23.0, 22.0, 28.0, 26.0, 23.0, 15.0, 12.0, 13.0, 8.0, 13.0, 3.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-216.75, -209.09765625, -201.4453125, -193.79296875, -186.140625, -178.48828125, -170.8359375, -163.18359375, -155.53125, -147.87890625, -140.2265625, -132.57421875, -124.921875, -117.26953125, -109.6171875, -101.96484375, -94.3125, -86.66015625, -79.0078125, -71.35546875, -63.703125, -56.05078125, -48.3984375, -40.74609375, -33.09375, -25.44140625, -17.7890625, -10.13671875, -2.484375, 5.16796875, 12.8203125, 20.47265625, 28.125, 35.77734375, 43.4296875, 51.08203125, 58.734375, 66.38671875, 74.0390625, 81.69140625, 89.34375, 96.99609375, 104.6484375, 112.30078125, 119.953125, 127.60546875, 135.2578125, 142.91015625, 150.5625, 158.21484375, 165.8671875, 173.51953125, 181.171875, 188.82421875, 196.4765625, 204.12890625, 211.78125, 219.43359375, 227.0859375, 234.73828125, 242.390625, 250.04296875, 257.6953125, 265.34765625, 273.0]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 7.0, 12.0, 11.0, 10.0, 20.0, 15.0, 26.0, 39.0, 33.0, 42.0, 42.0, 76.0, 113.0, 243.0, 578.0, 1951.0, 10522.0, 144785.0, 2945198.0, 35287.0, 4638.0, 1143.0, 378.0, 154.0, 98.0, 58.0, 31.0, 37.0, 33.0, 15.0, 22.0, 18.0, 13.0, 11.0, 10.0, 8.0, 2.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-690.0, -669.8671875, -649.734375, -629.6015625, -609.46875, -589.3359375, -569.203125, -549.0703125, -528.9375, -508.8046875, -488.671875, -468.5390625, -448.40625, -428.2734375, -408.140625, -388.0078125, -367.875, -347.7421875, -327.609375, -307.4765625, -287.34375, -267.2109375, -247.078125, -226.9453125, -206.8125, -186.6796875, -166.546875, -146.4140625, -126.28125, -106.1484375, -86.015625, -65.8828125, -45.75, -25.6171875, -5.484375, 14.6484375, 34.78125, 54.9140625, 75.046875, 95.1796875, 115.3125, 135.4453125, 155.578125, 175.7109375, 195.84375, 215.9765625, 236.109375, 256.2421875, 276.375, 296.5078125, 316.640625, 336.7734375, 356.90625, 377.0390625, 397.171875, 417.3046875, 437.4375, 457.5703125, 477.703125, 497.8359375, 517.96875, 538.1015625, 558.234375, 578.3671875, 598.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [4.0, 8.0, 168.0, 778.0, 61.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-443.7018737792969, -311.68145751953125, -179.6610107421875, -47.640594482421875, 84.37985229492188, 216.40029907226562, 348.4206848144531, 480.4411315917969, 612.4615478515625, 744.4819946289062, 876.50244140625, 1008.5228271484375, 1140.543212890625, 1272.563720703125, 1404.5841064453125, 1536.6044921875, 1668.625, 1800.6453857421875, 1932.6658935546875, 2064.686279296875, 2196.706787109375, 2328.72705078125, 2460.74755859375, 2592.76806640625, 2724.78857421875, 2856.80908203125, 2988.829345703125, 3120.849853515625, 3252.870361328125, 3384.890625, 3516.9111328125, 3648.931640625, 3780.95166015625, 3912.97216796875, 4044.992431640625, 4177.0126953125, 4309.033203125, 4441.0537109375, 4573.07421875, 4705.0947265625, 4837.115234375, 4969.1357421875, 5101.15625, 5233.1767578125, 5365.19677734375, 5497.21728515625, 5629.23779296875, 5761.25830078125, 5893.2783203125, 6025.298828125, 6157.3193359375, 6289.33984375, 6421.35986328125, 6553.38037109375, 6685.40087890625, 6817.42138671875, 6949.44189453125, 7081.46240234375, 7213.48291015625, 7345.5029296875, 7477.5234375, 7609.5439453125, 7741.564453125, 7873.5849609375, 8005.60546875]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 7.0, 3.0, 1.0, 7.0, 11.0, 19.0, 14.0, 22.0, 26.0, 29.0, 29.0, 36.0, 36.0, 42.0, 42.0, 57.0, 50.0, 58.0, 42.0, 44.0, 40.0, 38.0, 43.0, 39.0, 40.0, 43.0, 27.0, 21.0, 21.0, 22.0, 23.0, 16.0, 17.0, 9.0, 6.0, 7.0, 6.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-713.80419921875, -690.6886596679688, -667.5730590820312, -644.45751953125, -621.3419799804688, -598.2264404296875, -575.11083984375, -551.9953002929688, -528.8797607421875, -505.7641906738281, -482.6486511230469, -459.5330810546875, -436.41754150390625, -413.3019714355469, -390.1864013671875, -367.07086181640625, -343.95526123046875, -320.8396911621094, -297.7241516113281, -274.60858154296875, -251.49302673339844, -228.37747192382812, -205.26190185546875, -182.14634704589844, -159.03079223632812, -135.9152374267578, -112.79967498779297, -89.68411254882812, -66.56855773925781, -43.4530029296875, -20.337432861328125, 2.7781219482421875, 25.8936767578125, 49.00923538208008, 72.12479400634766, 95.2403564453125, 118.35591125488281, 141.47146606445312, 164.5870361328125, 187.7025909423828, 210.81814575195312, 233.93370056152344, 257.04925537109375, 280.1648254394531, 303.2803955078125, 326.39593505859375, 349.5115051269531, 372.6270751953125, 395.74261474609375, 418.8581848144531, 441.9737243652344, 465.08929443359375, 488.204833984375, 511.3204040527344, 534.4359741210938, 557.551513671875, 580.6671142578125, 603.7826538085938, 626.8982543945312, 650.0137939453125, 673.1293334960938, 696.244873046875, 719.3604736328125, 742.4760131835938, 765.591552734375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 6.0, 6.0, 13.0, 11.0, 11.0, 14.0, 20.0, 25.0, 15.0, 31.0, 29.0, 31.0, 31.0, 47.0, 34.0, 32.0, 30.0, 48.0, 47.0, 37.0, 46.0, 37.0, 38.0, 38.0, 46.0, 29.0, 39.0, 32.0, 34.0, 16.0, 23.0, 8.0, 17.0, 13.0, 7.0, 9.0, 8.0, 5.0, 7.0, 11.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-91.125, -88.35546875, -85.5859375, -82.81640625, -80.046875, -77.27734375, -74.5078125, -71.73828125, -68.96875, -66.19921875, -63.4296875, -60.66015625, -57.890625, -55.12109375, -52.3515625, -49.58203125, -46.8125, -44.04296875, -41.2734375, -38.50390625, -35.734375, -32.96484375, -30.1953125, -27.42578125, -24.65625, -21.88671875, -19.1171875, -16.34765625, -13.578125, -10.80859375, -8.0390625, -5.26953125, -2.5, 0.26953125, 3.0390625, 5.80859375, 8.578125, 11.34765625, 14.1171875, 16.88671875, 19.65625, 22.42578125, 25.1953125, 27.96484375, 30.734375, 33.50390625, 36.2734375, 39.04296875, 41.8125, 44.58203125, 47.3515625, 50.12109375, 52.890625, 55.66015625, 58.4296875, 61.19921875, 63.96875, 66.73828125, 69.5078125, 72.27734375, 75.046875, 77.81640625, 80.5859375, 83.35546875, 86.125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 4.0, 16.0, 22.0, 24.0, 47.0, 55.0, 101.0, 110.0, 197.0, 297.0, 448.0, 637.0, 954.0, 1445.0, 2159.0, 3442.0, 5409.0, 9331.0, 16546.0, 34528.0, 152721.0, 1854082.0, 1878758.0, 155919.0, 35112.0, 16881.0, 9432.0, 5436.0, 3466.0, 2259.0, 1464.0, 935.0, 638.0, 419.0, 315.0, 216.0, 139.0, 75.0, 64.0, 46.0, 29.0, 34.0, 19.0, 14.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-145.75, -140.724609375, -135.69921875, -130.673828125, -125.6484375, -120.623046875, -115.59765625, -110.572265625, -105.546875, -100.521484375, -95.49609375, -90.470703125, -85.4453125, -80.419921875, -75.39453125, -70.369140625, -65.34375, -60.318359375, -55.29296875, -50.267578125, -45.2421875, -40.216796875, -35.19140625, -30.166015625, -25.140625, -20.115234375, -15.08984375, -10.064453125, -5.0390625, -0.013671875, 5.01171875, 10.037109375, 15.0625, 20.087890625, 25.11328125, 30.138671875, 35.1640625, 40.189453125, 45.21484375, 50.240234375, 55.265625, 60.291015625, 65.31640625, 70.341796875, 75.3671875, 80.392578125, 85.41796875, 90.443359375, 95.46875, 100.494140625, 105.51953125, 110.544921875, 115.5703125, 120.595703125, 125.62109375, 130.646484375, 135.671875, 140.697265625, 145.72265625, 150.748046875, 155.7734375, 160.798828125, 165.82421875, 170.849609375, 175.875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 10.0, 5.0, 14.0, 26.0, 28.0, 44.0, 63.0, 83.0, 185.0, 552.0, 1380.0, 945.0, 319.0, 159.0, 79.0, 56.0, 34.0, 26.0, 13.0, 10.0, 9.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.25, -193.73828125, -185.2265625, -176.71484375, -168.203125, -159.69140625, -151.1796875, -142.66796875, -134.15625, -125.64453125, -117.1328125, -108.62109375, -100.109375, -91.59765625, -83.0859375, -74.57421875, -66.0625, -57.55078125, -49.0390625, -40.52734375, -32.015625, -23.50390625, -14.9921875, -6.48046875, 2.03125, 10.54296875, 19.0546875, 27.56640625, 36.078125, 44.58984375, 53.1015625, 61.61328125, 70.125, 78.63671875, 87.1484375, 95.66015625, 104.171875, 112.68359375, 121.1953125, 129.70703125, 138.21875, 146.73046875, 155.2421875, 163.75390625, 172.265625, 180.77734375, 189.2890625, 197.80078125, 206.3125, 214.82421875, 223.3359375, 231.84765625, 240.359375, 248.87109375, 257.3828125, 265.89453125, 274.40625, 282.91796875, 291.4296875, 299.94140625, 308.453125, 316.96484375, 325.4765625, 333.98828125, 342.5]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 11.0, 19.0, 24.0, 35.0, 55.0, 91.0, 218.0, 417.0, 1060.0, 3720.0, 19249.0, 219922.0, 3872120.0, 64439.0, 9298.0, 2192.0, 730.0, 331.0, 135.0, 69.0, 45.0, 26.0, 25.0, 13.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-851.5, -829.828125, -808.15625, -786.484375, -764.8125, -743.140625, -721.46875, -699.796875, -678.125, -656.453125, -634.78125, -613.109375, -591.4375, -569.765625, -548.09375, -526.421875, -504.75, -483.078125, -461.40625, -439.734375, -418.0625, -396.390625, -374.71875, -353.046875, -331.375, -309.703125, -288.03125, -266.359375, -244.6875, -223.015625, -201.34375, -179.671875, -158.0, -136.328125, -114.65625, -92.984375, -71.3125, -49.640625, -27.96875, -6.296875, 15.375, 37.046875, 58.71875, 80.390625, 102.0625, 123.734375, 145.40625, 167.078125, 188.75, 210.421875, 232.09375, 253.765625, 275.4375, 297.109375, 318.78125, 340.453125, 362.125, 383.796875, 405.46875, 427.140625, 448.8125, 470.484375, 492.15625, 513.828125, 535.5]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 36.0, 191.0, 584.0, 153.0, 39.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3717.37109375, -3615.325927734375, -3513.280517578125, -3411.2353515625, -3309.190185546875, -3207.14501953125, -3105.099609375, -3003.054443359375, -2901.00927734375, -2798.964111328125, -2696.918701171875, -2594.87353515625, -2492.828369140625, -2390.783203125, -2288.73779296875, -2186.692626953125, -2084.647216796875, -1982.6019287109375, -1880.5567626953125, -1778.511474609375, -1676.46630859375, -1574.4210205078125, -1472.375732421875, -1370.33056640625, -1268.2852783203125, -1166.239990234375, -1064.19482421875, -962.1495361328125, -860.1043090820312, -758.05908203125, -656.0137939453125, -553.9685668945312, -451.923095703125, -349.87786865234375, -247.83261108398438, -145.787353515625, -43.74212646484375, 58.3031005859375, 160.348388671875, 262.39361572265625, 364.4388427734375, 466.48406982421875, 568.529296875, 670.5745849609375, 772.6198120117188, 874.6650390625, 976.7103271484375, 1078.755615234375, 1180.80078125, 1282.8460693359375, 1384.8912353515625, 1486.9365234375, 1588.981689453125, 1691.0269775390625, 1793.072265625, 1895.117431640625, 1997.1627197265625, 2099.2080078125, 2201.253173828125, 2303.29833984375, 2405.34375, 2507.388916015625, 2609.43408203125, 2711.4794921875, 2813.524658203125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 8.0, 8.0, 16.0, 21.0, 19.0, 24.0, 24.0, 32.0, 30.0, 45.0, 41.0, 38.0, 53.0, 55.0, 59.0, 52.0, 45.0, 50.0, 47.0, 44.0, 49.0, 45.0, 42.0, 26.0, 23.0, 25.0, 14.0, 12.0, 15.0, 10.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-652.7791748046875, -631.3751220703125, -609.9710693359375, -588.5670166015625, -567.1629638671875, -545.7589721679688, -524.3549194335938, -502.95086669921875, -481.54681396484375, -460.14276123046875, -438.73870849609375, -417.3346862792969, -395.9306335449219, -374.5265808105469, -353.12255859375, -331.718505859375, -310.314453125, -288.910400390625, -267.50634765625, -246.10232543945312, -224.69827270507812, -203.29421997070312, -181.8901824951172, -160.48614501953125, -139.08209228515625, -117.67804718017578, -96.27400207519531, -74.86995697021484, -53.465911865234375, -32.061866760253906, -10.657821655273438, 10.7462158203125, 32.15032958984375, 53.55437469482422, 74.95841979980469, 96.36246490478516, 117.76651000976562, 139.17056274414062, 160.57460021972656, 181.9786376953125, 203.3826904296875, 224.7867431640625, 246.19078063964844, 267.5948181152344, 288.9988708496094, 310.4029235839844, 331.80694580078125, 353.21099853515625, 374.61505126953125, 396.01910400390625, 417.42315673828125, 438.8271789550781, 460.2312316894531, 481.6352844238281, 503.039306640625, 524.443359375, 545.847412109375, 567.25146484375, 588.655517578125, 610.0595703125, 631.463623046875, 652.8676147460938, 674.2716674804688, 695.6757202148438, 717.0797729492188]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 1.0, 1.0, 4.0, 8.0, 5.0, 16.0, 11.0, 8.0, 13.0, 20.0, 23.0, 14.0, 23.0, 24.0, 39.0, 33.0, 21.0, 39.0, 37.0, 30.0, 33.0, 46.0, 41.0, 52.0, 44.0, 49.0, 36.0, 41.0, 45.0, 31.0, 30.0, 27.0, 18.0, 28.0, 23.0, 17.0, 14.0, 12.0, 12.0, 4.0, 6.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-93.1875, -90.4892578125, -87.791015625, -85.0927734375, -82.39453125, -79.6962890625, -76.998046875, -74.2998046875, -71.6015625, -68.9033203125, -66.205078125, -63.5068359375, -60.80859375, -58.1103515625, -55.412109375, -52.7138671875, -50.015625, -47.3173828125, -44.619140625, -41.9208984375, -39.22265625, -36.5244140625, -33.826171875, -31.1279296875, -28.4296875, -25.7314453125, -23.033203125, -20.3349609375, -17.63671875, -14.9384765625, -12.240234375, -9.5419921875, -6.84375, -4.1455078125, -1.447265625, 1.2509765625, 3.94921875, 6.6474609375, 9.345703125, 12.0439453125, 14.7421875, 17.4404296875, 20.138671875, 22.8369140625, 25.53515625, 28.2333984375, 30.931640625, 33.6298828125, 36.328125, 39.0263671875, 41.724609375, 44.4228515625, 47.12109375, 49.8193359375, 52.517578125, 55.2158203125, 57.9140625, 60.6123046875, 63.310546875, 66.0087890625, 68.70703125, 71.4052734375, 74.103515625, 76.8017578125, 79.5]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 17.0, 30.0, 38.0, 56.0, 94.0, 154.0, 258.0, 409.0, 604.0, 957.0, 1535.0, 2694.0, 4260.0, 7159.0, 12854.0, 22292.0, 41544.0, 78460.0, 165355.0, 348010.0, 178051.0, 83767.0, 43584.0, 23767.0, 13340.0, 7654.0, 4519.0, 2767.0, 1594.0, 1030.0, 637.0, 351.0, 269.0, 159.0, 106.0, 66.0, 37.0, 24.0, 20.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.557373046875, -8.29443359375, -8.031494140625, -7.7685546875, -7.505615234375, -7.24267578125, -6.979736328125, -6.716796875, -6.453857421875, -6.19091796875, -5.927978515625, -5.6650390625, -5.402099609375, -5.13916015625, -4.876220703125, -4.61328125, -4.350341796875, -4.08740234375, -3.824462890625, -3.5615234375, -3.298583984375, -3.03564453125, -2.772705078125, -2.509765625, -2.246826171875, -1.98388671875, -1.720947265625, -1.4580078125, -1.195068359375, -0.93212890625, -0.669189453125, -0.40625, -0.143310546875, 0.11962890625, 0.382568359375, 0.6455078125, 0.908447265625, 1.17138671875, 1.434326171875, 1.697265625, 1.960205078125, 2.22314453125, 2.486083984375, 2.7490234375, 3.011962890625, 3.27490234375, 3.537841796875, 3.80078125, 4.063720703125, 4.32666015625, 4.589599609375, 4.8525390625, 5.115478515625, 5.37841796875, 5.641357421875, 5.904296875, 6.167236328125, 6.43017578125, 6.693115234375, 6.9560546875, 7.218994140625, 7.48193359375, 7.744873046875, 8.0078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 1.0, 7.0, 5.0, 8.0, 6.0, 12.0, 14.0, 14.0, 15.0, 16.0, 24.0, 22.0, 20.0, 26.0, 28.0, 37.0, 51.0, 46.0, 51.0, 53.0, 1054.0, 41.0, 39.0, 40.0, 28.0, 35.0, 45.0, 36.0, 36.0, 28.0, 31.0, 27.0, 22.0, 11.0, 16.0, 12.0, 21.0, 8.0, 7.0, 10.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-62.375, -60.53515625, -58.6953125, -56.85546875, -55.015625, -53.17578125, -51.3359375, -49.49609375, -47.65625, -45.81640625, -43.9765625, -42.13671875, -40.296875, -38.45703125, -36.6171875, -34.77734375, -32.9375, -31.09765625, -29.2578125, -27.41796875, -25.578125, -23.73828125, -21.8984375, -20.05859375, -18.21875, -16.37890625, -14.5390625, -12.69921875, -10.859375, -9.01953125, -7.1796875, -5.33984375, -3.5, -1.66015625, 0.1796875, 2.01953125, 3.859375, 5.69921875, 7.5390625, 9.37890625, 11.21875, 13.05859375, 14.8984375, 16.73828125, 18.578125, 20.41796875, 22.2578125, 24.09765625, 25.9375, 27.77734375, 29.6171875, 31.45703125, 33.296875, 35.13671875, 36.9765625, 38.81640625, 40.65625, 42.49609375, 44.3359375, 46.17578125, 48.015625, 49.85546875, 51.6953125, 53.53515625, 55.375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 12.0, 13.0, 29.0, 45.0, 59.0, 71.0, 99.0, 144.0, 262.0, 382.0, 548.0, 826.0, 1263.0, 1870.0, 2833.0, 4537.0, 7079.0, 11156.0, 18440.0, 30898.0, 53315.0, 95519.0, 185217.0, 1323244.0, 157420.0, 83833.0, 47029.0, 26980.0, 16132.0, 9913.0, 6304.0, 3997.0, 2582.0, 1666.0, 1102.0, 789.0, 480.0, 305.0, 215.0, 157.0, 130.0, 72.0, 53.0, 41.0, 20.0, 16.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.4296875, -4.29290771484375, -4.1561279296875, -4.01934814453125, -3.882568359375, -3.74578857421875, -3.6090087890625, -3.47222900390625, -3.33544921875, -3.19866943359375, -3.0618896484375, -2.92510986328125, -2.788330078125, -2.65155029296875, -2.5147705078125, -2.37799072265625, -2.2412109375, -2.10443115234375, -1.9676513671875, -1.83087158203125, -1.694091796875, -1.55731201171875, -1.4205322265625, -1.28375244140625, -1.14697265625, -1.01019287109375, -0.8734130859375, -0.73663330078125, -0.599853515625, -0.46307373046875, -0.3262939453125, -0.18951416015625, -0.052734375, 0.08404541015625, 0.2208251953125, 0.35760498046875, 0.494384765625, 0.63116455078125, 0.7679443359375, 0.90472412109375, 1.04150390625, 1.17828369140625, 1.3150634765625, 1.45184326171875, 1.588623046875, 1.72540283203125, 1.8621826171875, 1.99896240234375, 2.1357421875, 2.27252197265625, 2.4093017578125, 2.54608154296875, 2.682861328125, 2.81964111328125, 2.9564208984375, 3.09320068359375, 3.22998046875, 3.36676025390625, 3.5035400390625, 3.64031982421875, 3.777099609375, 3.91387939453125, 4.0506591796875, 4.18743896484375, 4.32421875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 3.0, 1.0, 3.0, 7.0, 10.0, 6.0, 17.0, 17.0, 16.0, 22.0, 41.0, 45.0, 62.0, 88.0, 121.0, 129.0, 89.0, 72.0, 54.0, 34.0, 25.0, 20.0, 24.0, 16.0, 14.0, 8.0, 10.0, 10.0, 14.0, 2.0, 7.0, 4.0, 0.0, 2.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.272705078125, -0.2655525207519531, -0.25839996337890625, -0.2512474060058594, -0.2440948486328125, -0.23694229125976562, -0.22978973388671875, -0.22263717651367188, -0.215484619140625, -0.20833206176757812, -0.20117950439453125, -0.19402694702148438, -0.1868743896484375, -0.17972183227539062, -0.17256927490234375, -0.16541671752929688, -0.15826416015625, -0.15111160278320312, -0.14395904541015625, -0.13680648803710938, -0.1296539306640625, -0.12250137329101562, -0.11534881591796875, -0.10819625854492188, -0.101043701171875, -0.09389114379882812, -0.08673858642578125, -0.07958602905273438, -0.0724334716796875, -0.06528091430664062, -0.05812835693359375, -0.050975799560546875, -0.0438232421875, -0.036670684814453125, -0.02951812744140625, -0.022365570068359375, -0.0152130126953125, -0.008060455322265625, -0.00090789794921875, 0.006244659423828125, 0.013397216796875, 0.020549774169921875, 0.02770233154296875, 0.034854888916015625, 0.0420074462890625, 0.049160003662109375, 0.05631256103515625, 0.06346511840820312, 0.07061767578125, 0.07777023315429688, 0.08492279052734375, 0.09207534790039062, 0.0992279052734375, 0.10638046264648438, 0.11353302001953125, 0.12068557739257812, 0.127838134765625, 0.13499069213867188, 0.14214324951171875, 0.14929580688476562, 0.1564483642578125, 0.16360092163085938, 0.17075347900390625, 0.17790603637695312, 0.18505859375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 7.0, 5.0, 11.0, 9.0, 9.0, 12.0, 9.0, 22.0, 21.0, 23.0, 33.0, 43.0, 96.0, 124.0, 238.0, 1046916.0, 535.0, 145.0, 82.0, 60.0, 39.0, 24.0, 12.0, 19.0, 19.0, 2.0, 10.0, 8.0, 3.0, 0.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.4439697265625, -5.223876953125, -5.0037841796875, -4.78369140625, -4.5635986328125, -4.343505859375, -4.1234130859375, -3.9033203125, -3.6832275390625, -3.463134765625, -3.2430419921875, -3.02294921875, -2.8028564453125, -2.582763671875, -2.3626708984375, -2.142578125, -1.9224853515625, -1.702392578125, -1.4822998046875, -1.26220703125, -1.0421142578125, -0.822021484375, -0.6019287109375, -0.3818359375, -0.1617431640625, 0.058349609375, 0.2784423828125, 0.49853515625, 0.7186279296875, 0.938720703125, 1.1588134765625, 1.37890625, 1.5989990234375, 1.819091796875, 2.0391845703125, 2.25927734375, 2.4793701171875, 2.699462890625, 2.9195556640625, 3.1396484375, 3.3597412109375, 3.579833984375, 3.7999267578125, 4.02001953125, 4.2401123046875, 4.460205078125, 4.6802978515625, 4.900390625, 5.1204833984375, 5.340576171875, 5.5606689453125, 5.78076171875, 6.0008544921875, 6.220947265625, 6.4410400390625, 6.6611328125, 6.8812255859375, 7.101318359375, 7.3214111328125, 7.54150390625, 7.7615966796875, 7.981689453125, 8.2017822265625, 8.421875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 77.0, 912.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4252603054046631, -0.40330490469932556, -0.38134950399398804, -0.3593940734863281, -0.337438702583313, -0.3154832720756531, -0.29352787137031555, -0.271572470664978, -0.2496170699596405, -0.22766166925430298, -0.20570626854896545, -0.18375085294246674, -0.1617954522371292, -0.1398400515317917, -0.11788463592529297, -0.09592923521995544, -0.07397383451461792, -0.0520184300839901, -0.030063025653362274, -0.008107617497444153, 0.013847783207893372, 0.035803183913230896, 0.057758599519729614, 0.07971400022506714, 0.10166940093040466, 0.12362480163574219, 0.1455802023410797, 0.16753561794757843, 0.18949101865291595, 0.21144641935825348, 0.2334018349647522, 0.2553572356700897, 0.27731257677078247, 0.29926797747612, 0.3212233781814575, 0.34317880868911743, 0.36513417959213257, 0.3870896100997925, 0.40904501080513, 0.43100041151046753, 0.45295581221580505, 0.4749112129211426, 0.4968666136264801, 0.5188220143318176, 0.5407774448394775, 0.5627328157424927, 0.5846882462501526, 0.6066436767578125, 0.6285990476608276, 0.6505544781684875, 0.6725098490715027, 0.6944652795791626, 0.7164206504821777, 0.7383760809898376, 0.7603315114974976, 0.7822868824005127, 0.8042422533035278, 0.8261976838111877, 0.8481530547142029, 0.8701084852218628, 0.8920638561248779, 0.9140192866325378, 0.9359747171401978, 0.9579300880432129, 0.9798855185508728]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 10.0, 8.0, 6.0, 7.0, 6.0, 6.0, 17.0, 23.0, 21.0, 27.0, 21.0, 25.0, 28.0, 37.0, 47.0, 33.0, 52.0, 49.0, 47.0, 50.0, 46.0, 42.0, 52.0, 48.0, 50.0, 27.0, 37.0, 31.0, 28.0, 19.0, 14.0, 22.0, 15.0, 14.0, 12.0, 7.0, 10.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.17474377155303955, -0.16944855451583862, -0.1641533374786377, -0.15885813534259796, -0.15356291830539703, -0.1482677012681961, -0.14297249913215637, -0.13767728209495544, -0.13238206505775452, -0.1270868480205536, -0.12179163843393326, -0.11649642884731293, -0.111201211810112, -0.10590599477291107, -0.10061078518629074, -0.09531557559967041, -0.09002035856246948, -0.08472514152526855, -0.07942993193864822, -0.0741347223520279, -0.06883950531482697, -0.06354428827762604, -0.05824907869100571, -0.05295386537909508, -0.04765865206718445, -0.04236343875527382, -0.03706822544336319, -0.03177301213145256, -0.02647779881954193, -0.021182585507631302, -0.015887372195720673, -0.010592158883810043, -0.005296945571899414, -1.73225998878479e-06, 0.0052934810519218445, 0.010588694363832474, 0.015883907675743103, 0.021179120987653732, 0.02647433429956436, 0.03176954761147499, 0.03706476092338562, 0.04235997423529625, 0.04765518754720688, 0.05295040085911751, 0.05824561417102814, 0.06354083120822906, 0.0688360407948494, 0.07413125038146973, 0.07942646741867065, 0.08472168445587158, 0.09001689404249191, 0.09531210362911224, 0.10060732066631317, 0.1059025377035141, 0.11119774729013443, 0.11649295687675476, 0.12178817391395569, 0.12708339095115662, 0.13237860798835754, 0.13767381012439728, 0.1429690271615982, 0.14826424419879913, 0.15355944633483887, 0.1588546633720398, 0.16414988040924072]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 1.0, 1.0, 4.0, 8.0, 5.0, 16.0, 11.0, 8.0, 13.0, 20.0, 23.0, 14.0, 23.0, 24.0, 39.0, 33.0, 21.0, 39.0, 37.0, 30.0, 33.0, 46.0, 41.0, 52.0, 44.0, 49.0, 36.0, 41.0, 45.0, 31.0, 30.0, 27.0, 18.0, 28.0, 23.0, 17.0, 14.0, 12.0, 12.0, 4.0, 6.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-93.1875, -90.4892578125, -87.791015625, -85.0927734375, -82.39453125, -79.6962890625, -76.998046875, -74.2998046875, -71.6015625, -68.9033203125, -66.205078125, -63.5068359375, -60.80859375, -58.1103515625, -55.412109375, -52.7138671875, -50.015625, -47.3173828125, -44.619140625, -41.9208984375, -39.22265625, -36.5244140625, -33.826171875, -31.1279296875, -28.4296875, -25.7314453125, -23.033203125, -20.3349609375, -17.63671875, -14.9384765625, -12.240234375, -9.5419921875, -6.84375, -4.1455078125, -1.447265625, 1.2509765625, 3.94921875, 6.6474609375, 9.345703125, 12.0439453125, 14.7421875, 17.4404296875, 20.138671875, 22.8369140625, 25.53515625, 28.2333984375, 30.931640625, 33.6298828125, 36.328125, 39.0263671875, 41.724609375, 44.4228515625, 47.12109375, 49.8193359375, 52.517578125, 55.2158203125, 57.9140625, 60.6123046875, 63.310546875, 66.0087890625, 68.70703125, 71.4052734375, 74.103515625, 76.8017578125, 79.5]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 4.0, 5.0, 12.0, 21.0, 26.0, 30.0, 48.0, 78.0, 97.0, 170.0, 244.0, 353.0, 646.0, 876.0, 1414.0, 2242.0, 3693.0, 6348.0, 12036.0, 25753.0, 73105.0, 560481.0, 266587.0, 50310.0, 20151.0, 9832.0, 5404.0, 3096.0, 1951.0, 1284.0, 788.0, 514.0, 296.0, 203.0, 142.0, 116.0, 61.0, 33.0, 24.0, 20.0, 21.0, 10.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-155.375, -150.49609375, -145.6171875, -140.73828125, -135.859375, -130.98046875, -126.1015625, -121.22265625, -116.34375, -111.46484375, -106.5859375, -101.70703125, -96.828125, -91.94921875, -87.0703125, -82.19140625, -77.3125, -72.43359375, -67.5546875, -62.67578125, -57.796875, -52.91796875, -48.0390625, -43.16015625, -38.28125, -33.40234375, -28.5234375, -23.64453125, -18.765625, -13.88671875, -9.0078125, -4.12890625, 0.75, 5.62890625, 10.5078125, 15.38671875, 20.265625, 25.14453125, 30.0234375, 34.90234375, 39.78125, 44.66015625, 49.5390625, 54.41796875, 59.296875, 64.17578125, 69.0546875, 73.93359375, 78.8125, 83.69140625, 88.5703125, 93.44921875, 98.328125, 103.20703125, 108.0859375, 112.96484375, 117.84375, 122.72265625, 127.6015625, 132.48046875, 137.359375, 142.23828125, 147.1171875, 151.99609375, 156.875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 8.0, 9.0, 8.0, 19.0, 17.0, 23.0, 21.0, 44.0, 23.0, 30.0, 47.0, 43.0, 59.0, 69.0, 99.0, 137.0, 1586.0, 254.0, 107.0, 69.0, 63.0, 55.0, 37.0, 29.0, 27.0, 27.0, 22.0, 29.0, 11.0, 14.0, 17.0, 5.0, 14.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-261.5, -253.2734375, -245.046875, -236.8203125, -228.59375, -220.3671875, -212.140625, -203.9140625, -195.6875, -187.4609375, -179.234375, -171.0078125, -162.78125, -154.5546875, -146.328125, -138.1015625, -129.875, -121.6484375, -113.421875, -105.1953125, -96.96875, -88.7421875, -80.515625, -72.2890625, -64.0625, -55.8359375, -47.609375, -39.3828125, -31.15625, -22.9296875, -14.703125, -6.4765625, 1.75, 9.9765625, 18.203125, 26.4296875, 34.65625, 42.8828125, 51.109375, 59.3359375, 67.5625, 75.7890625, 84.015625, 92.2421875, 100.46875, 108.6953125, 116.921875, 125.1484375, 133.375, 141.6015625, 149.828125, 158.0546875, 166.28125, 174.5078125, 182.734375, 190.9609375, 199.1875, 207.4140625, 215.640625, 223.8671875, 232.09375, 240.3203125, 248.546875, 256.7734375, 265.0]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 4.0, 5.0, 9.0, 17.0, 26.0, 22.0, 52.0, 63.0, 103.0, 158.0, 309.0, 796.0, 2620.0, 12433.0, 138489.0, 2909835.0, 69081.0, 8333.0, 1914.0, 693.0, 305.0, 144.0, 100.0, 58.0, 40.0, 24.0, 11.0, 11.0, 12.0, 8.0, 4.0, 13.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-396.0, -382.96875, -369.9375, -356.90625, -343.875, -330.84375, -317.8125, -304.78125, -291.75, -278.71875, -265.6875, -252.65625, -239.625, -226.59375, -213.5625, -200.53125, -187.5, -174.46875, -161.4375, -148.40625, -135.375, -122.34375, -109.3125, -96.28125, -83.25, -70.21875, -57.1875, -44.15625, -31.125, -18.09375, -5.0625, 7.96875, 21.0, 34.03125, 47.0625, 60.09375, 73.125, 86.15625, 99.1875, 112.21875, 125.25, 138.28125, 151.3125, 164.34375, 177.375, 190.40625, 203.4375, 216.46875, 229.5, 242.53125, 255.5625, 268.59375, 281.625, 294.65625, 307.6875, 320.71875, 333.75, 346.78125, 359.8125, 372.84375, 385.875, 398.90625, 411.9375, 424.96875, 438.0]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 19.0, 61.0, 257.0, 455.0, 166.0, 50.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-286.64801025390625, -247.61993408203125, -208.5918731689453, -169.56381225585938, -130.53573608398438, -91.50765991210938, -52.47959899902344, -13.4515380859375, 25.5765380859375, 64.60460662841797, 103.63267517089844, 142.66073608398438, 181.68881225585938, 220.71688842773438, 259.74493408203125, 298.77301025390625, 337.80108642578125, 376.82916259765625, 415.85723876953125, 454.8852844238281, 493.9133605957031, 532.94140625, 571.969482421875, 610.99755859375, 650.025634765625, 689.0537109375, 728.081787109375, 767.10986328125, 806.137939453125, 845.166015625, 884.1940307617188, 923.2221069335938, 962.250244140625, 1001.2783203125, 1040.306396484375, 1079.33447265625, 1118.362548828125, 1157.390625, 1196.418701171875, 1235.44677734375, 1274.474853515625, 1313.5029296875, 1352.531005859375, 1391.55908203125, 1430.587158203125, 1469.615234375, 1508.643310546875, 1547.67138671875, 1586.6993408203125, 1625.7274169921875, 1664.7554931640625, 1703.7835693359375, 1742.8116455078125, 1781.8397216796875, 1820.8677978515625, 1859.895751953125, 1898.923828125, 1937.951904296875, 1976.97998046875, 2016.008056640625, 2055.0361328125, 2094.064208984375, 2133.09228515625, 2172.120361328125, 2211.1484375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 11.0, 8.0, 7.0, 8.0, 14.0, 13.0, 18.0, 24.0, 22.0, 19.0, 23.0, 27.0, 27.0, 43.0, 38.0, 44.0, 38.0, 36.0, 50.0, 48.0, 42.0, 48.0, 53.0, 39.0, 45.0, 32.0, 35.0, 30.0, 36.0, 21.0, 21.0, 12.0, 11.0, 15.0, 11.0, 8.0, 4.0, 10.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-546.4813842773438, -529.1879272460938, -511.8945007324219, -494.60107421875, -477.3076171875, -460.01416015625, -442.7207336425781, -425.42730712890625, -408.13385009765625, -390.84039306640625, -373.5469665527344, -356.2535400390625, -338.9600830078125, -321.6666259765625, -304.3731994628906, -287.07977294921875, -269.78631591796875, -252.4928741455078, -235.19943237304688, -217.90599060058594, -200.612548828125, -183.31910705566406, -166.02566528320312, -148.7322235107422, -131.43878173828125, -114.14533996582031, -96.85189819335938, -79.55845642089844, -62.2650146484375, -44.97157287597656, -27.678131103515625, -10.384689331054688, 6.90869140625, 24.202133178710938, 41.495574951171875, 58.78901672363281, 76.08245849609375, 93.37590026855469, 110.66934204101562, 127.96278381347656, 145.2562255859375, 162.54966735839844, 179.84310913085938, 197.1365509033203, 214.42999267578125, 231.7234344482422, 249.01687622070312, 266.310302734375, 283.603759765625, 300.897216796875, 318.1906433105469, 335.48406982421875, 352.77752685546875, 370.07098388671875, 387.3644104003906, 404.6578369140625, 421.9512939453125, 439.2447509765625, 456.5381774902344, 473.83160400390625, 491.12506103515625, 508.41851806640625, 525.7119140625, 543.00537109375, 560.298828125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 2.0, 7.0, 13.0, 17.0, 10.0, 18.0, 9.0, 14.0, 17.0, 22.0, 26.0, 27.0, 26.0, 37.0, 36.0, 35.0, 32.0, 46.0, 52.0, 31.0, 54.0, 40.0, 42.0, 35.0, 45.0, 34.0, 28.0, 27.0, 35.0, 36.0, 17.0, 17.0, 21.0, 18.0, 14.0, 10.0, 7.0, 9.0, 6.0, 3.0, 5.0, 5.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-87.9375, -85.1826171875, -82.427734375, -79.6728515625, -76.91796875, -74.1630859375, -71.408203125, -68.6533203125, -65.8984375, -63.1435546875, -60.388671875, -57.6337890625, -54.87890625, -52.1240234375, -49.369140625, -46.6142578125, -43.859375, -41.1044921875, -38.349609375, -35.5947265625, -32.83984375, -30.0849609375, -27.330078125, -24.5751953125, -21.8203125, -19.0654296875, -16.310546875, -13.5556640625, -10.80078125, -8.0458984375, -5.291015625, -2.5361328125, 0.21875, 2.9736328125, 5.728515625, 8.4833984375, 11.23828125, 13.9931640625, 16.748046875, 19.5029296875, 22.2578125, 25.0126953125, 27.767578125, 30.5224609375, 33.27734375, 36.0322265625, 38.787109375, 41.5419921875, 44.296875, 47.0517578125, 49.806640625, 52.5615234375, 55.31640625, 58.0712890625, 60.826171875, 63.5810546875, 66.3359375, 69.0908203125, 71.845703125, 74.6005859375, 77.35546875, 80.1103515625, 82.865234375, 85.6201171875, 88.375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 5.0, 9.0, 10.0, 18.0, 24.0, 41.0, 72.0, 102.0, 208.0, 433.0, 940.0, 2302.0, 6286.0, 20316.0, 244017.0, 3746782.0, 146295.0, 17162.0, 5508.0, 1981.0, 856.0, 368.0, 224.0, 120.0, 59.0, 33.0, 28.0, 16.0, 12.0, 10.0, 5.0, 2.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-281.0, -271.453125, -261.90625, -252.359375, -242.8125, -233.265625, -223.71875, -214.171875, -204.625, -195.078125, -185.53125, -175.984375, -166.4375, -156.890625, -147.34375, -137.796875, -128.25, -118.703125, -109.15625, -99.609375, -90.0625, -80.515625, -70.96875, -61.421875, -51.875, -42.328125, -32.78125, -23.234375, -13.6875, -4.140625, 5.40625, 14.953125, 24.5, 34.046875, 43.59375, 53.140625, 62.6875, 72.234375, 81.78125, 91.328125, 100.875, 110.421875, 119.96875, 129.515625, 139.0625, 148.609375, 158.15625, 167.703125, 177.25, 186.796875, 196.34375, 205.890625, 215.4375, 224.984375, 234.53125, 244.078125, 253.625, 263.171875, 272.71875, 282.265625, 291.8125, 301.359375, 310.90625, 320.453125, 330.0]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 5.0, 15.0, 9.0, 22.0, 14.0, 18.0, 32.0, 40.0, 56.0, 99.0, 192.0, 485.0, 1017.0, 1108.0, 467.0, 191.0, 80.0, 49.0, 38.0, 34.0, 19.0, 19.0, 9.0, 17.0, 5.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-201.875, -196.271484375, -190.66796875, -185.064453125, -179.4609375, -173.857421875, -168.25390625, -162.650390625, -157.046875, -151.443359375, -145.83984375, -140.236328125, -134.6328125, -129.029296875, -123.42578125, -117.822265625, -112.21875, -106.615234375, -101.01171875, -95.408203125, -89.8046875, -84.201171875, -78.59765625, -72.994140625, -67.390625, -61.787109375, -56.18359375, -50.580078125, -44.9765625, -39.373046875, -33.76953125, -28.166015625, -22.5625, -16.958984375, -11.35546875, -5.751953125, -0.1484375, 5.455078125, 11.05859375, 16.662109375, 22.265625, 27.869140625, 33.47265625, 39.076171875, 44.6796875, 50.283203125, 55.88671875, 61.490234375, 67.09375, 72.697265625, 78.30078125, 83.904296875, 89.5078125, 95.111328125, 100.71484375, 106.318359375, 111.921875, 117.525390625, 123.12890625, 128.732421875, 134.3359375, 139.939453125, 145.54296875, 151.146484375, 156.75]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 9.0, 21.0, 13.0, 28.0, 25.0, 55.0, 94.0, 192.0, 270.0, 481.0, 907.0, 1943.0, 3933.0, 9122.0, 23196.0, 77011.0, 1295854.0, 2645138.0, 90899.0, 26558.0, 9963.0, 4244.0, 2060.0, 990.0, 528.0, 284.0, 159.0, 103.0, 65.0, 37.0, 27.0, 18.0, 11.0, 15.0, 11.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-273.5, -264.96875, -256.4375, -247.90625, -239.375, -230.84375, -222.3125, -213.78125, -205.25, -196.71875, -188.1875, -179.65625, -171.125, -162.59375, -154.0625, -145.53125, -137.0, -128.46875, -119.9375, -111.40625, -102.875, -94.34375, -85.8125, -77.28125, -68.75, -60.21875, -51.6875, -43.15625, -34.625, -26.09375, -17.5625, -9.03125, -0.5, 8.03125, 16.5625, 25.09375, 33.625, 42.15625, 50.6875, 59.21875, 67.75, 76.28125, 84.8125, 93.34375, 101.875, 110.40625, 118.9375, 127.46875, 136.0, 144.53125, 153.0625, 161.59375, 170.125, 178.65625, 187.1875, 195.71875, 204.25, 212.78125, 221.3125, 229.84375, 238.375, 246.90625, 255.4375, 263.96875, 272.5]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 13.0, 27.0, 57.0, 152.0, 364.0, 261.0, 90.0, 26.0, 11.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2300.016845703125, -2253.71630859375, -2207.415771484375, -2161.114990234375, -2114.814453125, -2068.513916015625, -2022.21337890625, -1975.9127197265625, -1929.612060546875, -1883.3115234375, -1837.0108642578125, -1790.7103271484375, -1744.40966796875, -1698.109130859375, -1651.80859375, -1605.5079345703125, -1559.2073974609375, -1512.9068603515625, -1466.606201171875, -1420.3056640625, -1374.0050048828125, -1327.7044677734375, -1281.40380859375, -1235.103271484375, -1188.802734375, -1142.502197265625, -1096.2015380859375, -1049.9010009765625, -1003.600341796875, -957.2998046875, -910.9992065429688, -864.6986083984375, -818.3980712890625, -772.0974731445312, -725.796875, -679.496337890625, -633.1956787109375, -586.8951416015625, -540.5945434570312, -494.2939453125, -447.99334716796875, -401.6927490234375, -355.39215087890625, -309.0915832519531, -262.7909851074219, -216.49038696289062, -170.1898193359375, -123.88922119140625, -77.588623046875, -31.28803253173828, 15.012557983398438, 61.313140869140625, 107.61373901367188, 153.91433715820312, 200.21490478515625, 246.5155029296875, 292.81610107421875, 339.11669921875, 385.41729736328125, 431.7178649902344, 478.0184631347656, 524.319091796875, 570.61962890625, 616.9202270507812, 663.2208251953125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 8.0, 10.0, 11.0, 19.0, 15.0, 15.0, 23.0, 21.0, 21.0, 29.0, 37.0, 27.0, 35.0, 47.0, 40.0, 36.0, 27.0, 40.0, 53.0, 49.0, 34.0, 42.0, 37.0, 25.0, 34.0, 20.0, 27.0, 34.0, 19.0, 30.0, 21.0, 26.0, 12.0, 16.0, 13.0, 7.0, 4.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-371.20050048828125, -358.5307922363281, -345.861083984375, -333.19140625, -320.5216979980469, -307.85198974609375, -295.1822814941406, -282.5125732421875, -269.8428955078125, -257.1731872558594, -244.5034942626953, -231.8337860107422, -219.16409301757812, -206.494384765625, -193.82467651367188, -181.1549835205078, -168.4852752685547, -155.81556701660156, -143.1458740234375, -130.47616577148438, -117.80647277832031, -105.13676452636719, -92.4670639038086, -79.79736328125, -67.1276626586914, -54.45796203613281, -41.78826141357422, -29.11855697631836, -16.448856353759766, -3.779155731201172, 8.890548706054688, 21.56024932861328, 34.229949951171875, 46.89965057373047, 59.56935119628906, 72.23905944824219, 84.90875244140625, 97.57846069335938, 110.24816131591797, 122.91786193847656, 135.58755493164062, 148.25726318359375, 160.9269561767578, 173.59666442871094, 186.266357421875, 198.93606567382812, 211.60577392578125, 224.2754669189453, 236.94517517089844, 249.61488342285156, 262.2845764160156, 274.95428466796875, 287.6239929199219, 300.2936706542969, 312.96337890625, 325.6330871582031, 338.30279541015625, 350.9725036621094, 363.6422119140625, 376.3118896484375, 388.9815979003906, 401.65130615234375, 414.3210144042969, 426.99072265625, 439.660400390625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 8.0, 9.0, 7.0, 18.0, 17.0, 19.0, 26.0, 20.0, 31.0, 35.0, 27.0, 41.0, 40.0, 20.0, 39.0, 42.0, 52.0, 39.0, 40.0, 42.0, 44.0, 40.0, 42.0, 46.0, 41.0, 37.0, 19.0, 21.0, 23.0, 22.0, 17.0, 13.0, 13.0, 10.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.4375, -87.58984375, -84.7421875, -81.89453125, -79.046875, -76.19921875, -73.3515625, -70.50390625, -67.65625, -64.80859375, -61.9609375, -59.11328125, -56.265625, -53.41796875, -50.5703125, -47.72265625, -44.875, -42.02734375, -39.1796875, -36.33203125, -33.484375, -30.63671875, -27.7890625, -24.94140625, -22.09375, -19.24609375, -16.3984375, -13.55078125, -10.703125, -7.85546875, -5.0078125, -2.16015625, 0.6875, 3.53515625, 6.3828125, 9.23046875, 12.078125, 14.92578125, 17.7734375, 20.62109375, 23.46875, 26.31640625, 29.1640625, 32.01171875, 34.859375, 37.70703125, 40.5546875, 43.40234375, 46.25, 49.09765625, 51.9453125, 54.79296875, 57.640625, 60.48828125, 63.3359375, 66.18359375, 69.03125, 71.87890625, 74.7265625, 77.57421875, 80.421875, 83.26953125, 86.1171875, 88.96484375, 91.8125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 17.0, 23.0, 28.0, 34.0, 56.0, 94.0, 122.0, 214.0, 324.0, 521.0, 810.0, 1203.0, 1920.0, 3054.0, 4856.0, 7692.0, 12304.0, 20375.0, 34086.0, 61466.0, 114575.0, 237093.0, 262322.0, 125301.0, 65900.0, 36663.0, 21859.0, 13485.0, 7942.0, 5147.0, 3218.0, 2101.0, 1286.0, 896.0, 540.0, 379.0, 218.0, 130.0, 93.0, 69.0, 50.0, 22.0, 23.0, 11.0, 10.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.1171875, -7.8717041015625, -7.626220703125, -7.3807373046875, -7.13525390625, -6.8897705078125, -6.644287109375, -6.3988037109375, -6.1533203125, -5.9078369140625, -5.662353515625, -5.4168701171875, -5.17138671875, -4.9259033203125, -4.680419921875, -4.4349365234375, -4.189453125, -3.9439697265625, -3.698486328125, -3.4530029296875, -3.20751953125, -2.9620361328125, -2.716552734375, -2.4710693359375, -2.2255859375, -1.9801025390625, -1.734619140625, -1.4891357421875, -1.24365234375, -0.9981689453125, -0.752685546875, -0.5072021484375, -0.26171875, -0.0162353515625, 0.229248046875, 0.4747314453125, 0.72021484375, 0.9656982421875, 1.211181640625, 1.4566650390625, 1.7021484375, 1.9476318359375, 2.193115234375, 2.4385986328125, 2.68408203125, 2.9295654296875, 3.175048828125, 3.4205322265625, 3.666015625, 3.9114990234375, 4.156982421875, 4.4024658203125, 4.64794921875, 4.8934326171875, 5.138916015625, 5.3843994140625, 5.6298828125, 5.8753662109375, 6.120849609375, 6.3663330078125, 6.61181640625, 6.8572998046875, 7.102783203125, 7.3482666015625, 7.59375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 6.0, 5.0, 12.0, 11.0, 8.0, 12.0, 20.0, 19.0, 19.0, 22.0, 25.0, 32.0, 22.0, 39.0, 38.0, 54.0, 44.0, 42.0, 39.0, 33.0, 1063.0, 45.0, 49.0, 45.0, 30.0, 35.0, 37.0, 33.0, 30.0, 19.0, 22.0, 19.0, 11.0, 10.0, 11.0, 13.0, 7.0, 14.0, 9.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-60.59375, -58.7763671875, -56.958984375, -55.1416015625, -53.32421875, -51.5068359375, -49.689453125, -47.8720703125, -46.0546875, -44.2373046875, -42.419921875, -40.6025390625, -38.78515625, -36.9677734375, -35.150390625, -33.3330078125, -31.515625, -29.6982421875, -27.880859375, -26.0634765625, -24.24609375, -22.4287109375, -20.611328125, -18.7939453125, -16.9765625, -15.1591796875, -13.341796875, -11.5244140625, -9.70703125, -7.8896484375, -6.072265625, -4.2548828125, -2.4375, -0.6201171875, 1.197265625, 3.0146484375, 4.83203125, 6.6494140625, 8.466796875, 10.2841796875, 12.1015625, 13.9189453125, 15.736328125, 17.5537109375, 19.37109375, 21.1884765625, 23.005859375, 24.8232421875, 26.640625, 28.4580078125, 30.275390625, 32.0927734375, 33.91015625, 35.7275390625, 37.544921875, 39.3623046875, 41.1796875, 42.9970703125, 44.814453125, 46.6318359375, 48.44921875, 50.2666015625, 52.083984375, 53.9013671875, 55.71875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 7.0, 6.0, 6.0, 18.0, 17.0, 20.0, 36.0, 57.0, 81.0, 99.0, 174.0, 229.0, 311.0, 424.0, 613.0, 898.0, 1307.0, 1912.0, 2749.0, 4239.0, 6307.0, 9602.0, 14833.0, 24322.0, 39304.0, 64923.0, 114380.0, 267275.0, 1221058.0, 129491.0, 73452.0, 43275.0, 26725.0, 16532.0, 10800.0, 7172.0, 4597.0, 3148.0, 2102.0, 1453.0, 988.0, 661.0, 442.0, 321.0, 234.0, 157.0, 110.0, 78.0, 69.0, 38.0, 26.0, 14.0, 15.0, 11.0, 8.0, 8.0, 2.0, 2.0, 2.0, 3.0], "bins": [-4.1015625, -3.97381591796875, -3.8460693359375, -3.71832275390625, -3.590576171875, -3.46282958984375, -3.3350830078125, -3.20733642578125, -3.07958984375, -2.95184326171875, -2.8240966796875, -2.69635009765625, -2.568603515625, -2.44085693359375, -2.3131103515625, -2.18536376953125, -2.0576171875, -1.92987060546875, -1.8021240234375, -1.67437744140625, -1.546630859375, -1.41888427734375, -1.2911376953125, -1.16339111328125, -1.03564453125, -0.90789794921875, -0.7801513671875, -0.65240478515625, -0.524658203125, -0.39691162109375, -0.2691650390625, -0.14141845703125, -0.013671875, 0.11407470703125, 0.2418212890625, 0.36956787109375, 0.497314453125, 0.62506103515625, 0.7528076171875, 0.88055419921875, 1.00830078125, 1.13604736328125, 1.2637939453125, 1.39154052734375, 1.519287109375, 1.64703369140625, 1.7747802734375, 1.90252685546875, 2.0302734375, 2.15802001953125, 2.2857666015625, 2.41351318359375, 2.541259765625, 2.66900634765625, 2.7967529296875, 2.92449951171875, 3.05224609375, 3.17999267578125, 3.3077392578125, 3.43548583984375, 3.563232421875, 3.69097900390625, 3.8187255859375, 3.94647216796875, 4.07421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 6.0, 5.0, 8.0, 11.0, 8.0, 11.0, 12.0, 22.0, 12.0, 21.0, 29.0, 39.0, 66.0, 84.0, 109.0, 140.0, 85.0, 74.0, 55.0, 30.0, 33.0, 29.0, 15.0, 12.0, 13.0, 8.0, 8.0, 10.0, 6.0, 8.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1943359375, -0.18828773498535156, -0.18223953247070312, -0.1761913299560547, -0.17014312744140625, -0.1640949249267578, -0.15804672241210938, -0.15199851989746094, -0.1459503173828125, -0.13990211486816406, -0.13385391235351562, -0.1278057098388672, -0.12175750732421875, -0.11570930480957031, -0.10966110229492188, -0.10361289978027344, -0.097564697265625, -0.09151649475097656, -0.08546829223632812, -0.07942008972167969, -0.07337188720703125, -0.06732368469238281, -0.061275482177734375, -0.05522727966308594, -0.0491790771484375, -0.04313087463378906, -0.037082672119140625, -0.031034469604492188, -0.02498626708984375, -0.018938064575195312, -0.012889862060546875, -0.0068416595458984375, -0.00079345703125, 0.0052547454833984375, 0.011302947998046875, 0.017351150512695312, 0.02339935302734375, 0.029447555541992188, 0.035495758056640625, 0.04154396057128906, 0.0475921630859375, 0.05364036560058594, 0.059688568115234375, 0.06573677062988281, 0.07178497314453125, 0.07783317565917969, 0.08388137817382812, 0.08992958068847656, 0.095977783203125, 0.10202598571777344, 0.10807418823242188, 0.11412239074707031, 0.12017059326171875, 0.1262187957763672, 0.13226699829101562, 0.13831520080566406, 0.1443634033203125, 0.15041160583496094, 0.15645980834960938, 0.1625080108642578, 0.16855621337890625, 0.1746044158935547, 0.18065261840820312, 0.18670082092285156, 0.1927490234375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 5.0, 6.0, 7.0, 14.0, 11.0, 13.0, 17.0, 28.0, 40.0, 39.0, 86.0, 127.0, 289.0, 1046346.0, 995.0, 178.0, 96.0, 58.0, 34.0, 24.0, 21.0, 18.0, 13.0, 8.0, 11.0, 10.0, 5.0, 6.0, 5.0, 2.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.12890625, -5.9359130859375, -5.742919921875, -5.5499267578125, -5.35693359375, -5.1639404296875, -4.970947265625, -4.7779541015625, -4.5849609375, -4.3919677734375, -4.198974609375, -4.0059814453125, -3.81298828125, -3.6199951171875, -3.427001953125, -3.2340087890625, -3.041015625, -2.8480224609375, -2.655029296875, -2.4620361328125, -2.26904296875, -2.0760498046875, -1.883056640625, -1.6900634765625, -1.4970703125, -1.3040771484375, -1.111083984375, -0.9180908203125, -0.72509765625, -0.5321044921875, -0.339111328125, -0.1461181640625, 0.046875, 0.2398681640625, 0.432861328125, 0.6258544921875, 0.81884765625, 1.0118408203125, 1.204833984375, 1.3978271484375, 1.5908203125, 1.7838134765625, 1.976806640625, 2.1697998046875, 2.36279296875, 2.5557861328125, 2.748779296875, 2.9417724609375, 3.134765625, 3.3277587890625, 3.520751953125, 3.7137451171875, 3.90673828125, 4.0997314453125, 4.292724609375, 4.4857177734375, 4.6787109375, 4.8717041015625, 5.064697265625, 5.2576904296875, 5.45068359375, 5.6436767578125, 5.836669921875, 6.0296630859375, 6.22265625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 34.0, 987.0], "bins": [-4.7409892082214355, -4.66603946685791, -4.591089725494385, -4.516139984130859, -4.441190242767334, -4.366240501403809, -4.291290760040283, -4.216341018676758, -4.141390800476074, -4.066441059112549, -3.9914913177490234, -3.916541576385498, -3.8415918350219727, -3.766641855239868, -3.6916921138763428, -3.6167423725128174, -3.541792869567871, -3.4668431282043457, -3.3918933868408203, -3.316943645477295, -3.2419939041137695, -3.167043924331665, -3.0920941829681396, -3.0171444416046143, -2.942194700241089, -2.8672449588775635, -2.792295217514038, -2.7173454761505127, -2.642395496368408, -2.567445755004883, -2.4924960136413574, -2.417546272277832, -2.3425967693328857, -2.2676470279693604, -2.192697286605835, -2.1177475452423096, -2.042797565460205, -1.9678479433059692, -1.8928980827331543, -1.817948341369629, -1.7429986000061035, -1.6680488586425781, -1.5930991172790527, -1.5181492567062378, -1.4431995153427124, -1.368249773979187, -1.293299913406372, -1.2183501720428467, -1.1434004306793213, -1.068450689315796, -0.9935008883476257, -0.9185510873794556, -0.8436013460159302, -0.7686516046524048, -0.6937018036842346, -0.6187520027160645, -0.5438022017478943, -0.4688524305820465, -0.39390265941619873, -0.31895288825035095, -0.24400311708450317, -0.1690533459186554, -0.09410357475280762, -0.01915377378463745, 0.055795956403017044]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 7.0, 12.0, 12.0, 5.0, 8.0, 13.0, 12.0, 17.0, 16.0, 28.0, 25.0, 23.0, 32.0, 37.0, 31.0, 39.0, 34.0, 41.0, 36.0, 49.0, 42.0, 29.0, 34.0, 42.0, 40.0, 40.0, 30.0, 23.0, 31.0, 25.0, 28.0, 27.0, 17.0, 21.0, 12.0, 11.0, 12.0, 9.0, 5.0, 7.0, 4.0, 11.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.284653902053833, -0.2759450376033783, -0.26723620295524597, -0.25852733850479126, -0.24981847405433655, -0.24110962450504303, -0.2324007749557495, -0.2236919105052948, -0.2149830460548401, -0.20627419650554657, -0.19756533205509186, -0.18885648250579834, -0.18014761805534363, -0.1714387685060501, -0.1627299189567566, -0.15402105450630188, -0.14531220495700836, -0.13660335540771484, -0.12789449095726013, -0.11918564140796661, -0.1104767769575119, -0.10176792740821838, -0.09305907040834427, -0.08435021340847015, -0.07564135640859604, -0.06693249940872192, -0.05822364240884781, -0.04951478913426399, -0.04080593213438988, -0.03209707513451576, -0.023388221859931946, -0.01467936486005783, -0.005970507860183716, 0.0027383482083678246, 0.011447204276919365, 0.02015605941414833, 0.028864916414022446, 0.03757377341389656, 0.04628262668848038, 0.05499148368835449, 0.06370034068822861, 0.07240919768810272, 0.08111805468797684, 0.08982691168785095, 0.09853576123714447, 0.10724462568759918, 0.1159534752368927, 0.12466233223676682, 0.13337118923664093, 0.14208003878593445, 0.15078890323638916, 0.15949775278568268, 0.1682066172361374, 0.1769154667854309, 0.18562433123588562, 0.19433318078517914, 0.20304203033447266, 0.21175087988376617, 0.2204597443342209, 0.2291685938835144, 0.23787745833396912, 0.24658630788326263, 0.25529515743255615, 0.26400402188301086, 0.2727128863334656]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 8.0, 9.0, 7.0, 18.0, 17.0, 19.0, 26.0, 20.0, 31.0, 35.0, 27.0, 41.0, 40.0, 20.0, 39.0, 42.0, 52.0, 39.0, 40.0, 42.0, 44.0, 40.0, 42.0, 46.0, 41.0, 37.0, 19.0, 21.0, 23.0, 22.0, 17.0, 13.0, 13.0, 10.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.4375, -87.58984375, -84.7421875, -81.89453125, -79.046875, -76.19921875, -73.3515625, -70.50390625, -67.65625, -64.80859375, -61.9609375, -59.11328125, -56.265625, -53.41796875, -50.5703125, -47.72265625, -44.875, -42.02734375, -39.1796875, -36.33203125, -33.484375, -30.63671875, -27.7890625, -24.94140625, -22.09375, -19.24609375, -16.3984375, -13.55078125, -10.703125, -7.85546875, -5.0078125, -2.16015625, 0.6875, 3.53515625, 6.3828125, 9.23046875, 12.078125, 14.92578125, 17.7734375, 20.62109375, 23.46875, 26.31640625, 29.1640625, 32.01171875, 34.859375, 37.70703125, 40.5546875, 43.40234375, 46.25, 49.09765625, 51.9453125, 54.79296875, 57.640625, 60.48828125, 63.3359375, 66.18359375, 69.03125, 71.87890625, 74.7265625, 77.57421875, 80.421875, 83.26953125, 86.1171875, 88.96484375, 91.8125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 9.0, 4.0, 12.0, 12.0, 17.0, 52.0, 48.0, 55.0, 106.0, 151.0, 217.0, 374.0, 614.0, 953.0, 1819.0, 3428.0, 7156.0, 16571.0, 48190.0, 289335.0, 567470.0, 71461.0, 22025.0, 8979.0, 4228.0, 2191.0, 1174.0, 704.0, 404.0, 250.0, 164.0, 121.0, 74.0, 53.0, 26.0, 29.0, 15.0, 18.0, 11.0, 9.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-171.0, -165.509765625, -160.01953125, -154.529296875, -149.0390625, -143.548828125, -138.05859375, -132.568359375, -127.078125, -121.587890625, -116.09765625, -110.607421875, -105.1171875, -99.626953125, -94.13671875, -88.646484375, -83.15625, -77.666015625, -72.17578125, -66.685546875, -61.1953125, -55.705078125, -50.21484375, -44.724609375, -39.234375, -33.744140625, -28.25390625, -22.763671875, -17.2734375, -11.783203125, -6.29296875, -0.802734375, 4.6875, 10.177734375, 15.66796875, 21.158203125, 26.6484375, 32.138671875, 37.62890625, 43.119140625, 48.609375, 54.099609375, 59.58984375, 65.080078125, 70.5703125, 76.060546875, 81.55078125, 87.041015625, 92.53125, 98.021484375, 103.51171875, 109.001953125, 114.4921875, 119.982421875, 125.47265625, 130.962890625, 136.453125, 141.943359375, 147.43359375, 152.923828125, 158.4140625, 163.904296875, 169.39453125, 174.884765625, 180.375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 5.0, 12.0, 12.0, 16.0, 10.0, 12.0, 19.0, 32.0, 33.0, 33.0, 34.0, 23.0, 33.0, 44.0, 64.0, 77.0, 161.0, 1651.0, 271.0, 83.0, 52.0, 47.0, 45.0, 27.0, 31.0, 30.0, 26.0, 27.0, 25.0, 10.0, 15.0, 21.0, 13.0, 13.0, 11.0, 8.0, 3.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.875, -178.900390625, -171.92578125, -164.951171875, -157.9765625, -151.001953125, -144.02734375, -137.052734375, -130.078125, -123.103515625, -116.12890625, -109.154296875, -102.1796875, -95.205078125, -88.23046875, -81.255859375, -74.28125, -67.306640625, -60.33203125, -53.357421875, -46.3828125, -39.408203125, -32.43359375, -25.458984375, -18.484375, -11.509765625, -4.53515625, 2.439453125, 9.4140625, 16.388671875, 23.36328125, 30.337890625, 37.3125, 44.287109375, 51.26171875, 58.236328125, 65.2109375, 72.185546875, 79.16015625, 86.134765625, 93.109375, 100.083984375, 107.05859375, 114.033203125, 121.0078125, 127.982421875, 134.95703125, 141.931640625, 148.90625, 155.880859375, 162.85546875, 169.830078125, 176.8046875, 183.779296875, 190.75390625, 197.728515625, 204.703125, 211.677734375, 218.65234375, 225.626953125, 232.6015625, 239.576171875, 246.55078125, 253.525390625, 260.5]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 12.0, 7.0, 11.0, 21.0, 23.0, 31.0, 42.0, 62.0, 83.0, 102.0, 174.0, 282.0, 710.0, 2642.0, 14221.0, 228770.0, 2848540.0, 41891.0, 5616.0, 1270.0, 487.0, 231.0, 125.0, 84.0, 70.0, 49.0, 39.0, 23.0, 18.0, 11.0, 19.0, 7.0, 6.0, 11.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-372.25, -360.3359375, -348.421875, -336.5078125, -324.59375, -312.6796875, -300.765625, -288.8515625, -276.9375, -265.0234375, -253.109375, -241.1953125, -229.28125, -217.3671875, -205.453125, -193.5390625, -181.625, -169.7109375, -157.796875, -145.8828125, -133.96875, -122.0546875, -110.140625, -98.2265625, -86.3125, -74.3984375, -62.484375, -50.5703125, -38.65625, -26.7421875, -14.828125, -2.9140625, 9.0, 20.9140625, 32.828125, 44.7421875, 56.65625, 68.5703125, 80.484375, 92.3984375, 104.3125, 116.2265625, 128.140625, 140.0546875, 151.96875, 163.8828125, 175.796875, 187.7109375, 199.625, 211.5390625, 223.453125, 235.3671875, 247.28125, 259.1953125, 271.109375, 283.0234375, 294.9375, 306.8515625, 318.765625, 330.6796875, 342.59375, 354.5078125, 366.421875, 378.3359375, 390.25]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 58.0, 154.0, 375.0, 310.0, 89.0, 16.0, 4.0, 2.0], "bins": [-1590.63232421875, -1563.561279296875, -1536.4903564453125, -1509.4193115234375, -1482.348388671875, -1455.27734375, -1428.2064208984375, -1401.1353759765625, -1374.064453125, -1346.993408203125, -1319.9224853515625, -1292.8514404296875, -1265.780517578125, -1238.70947265625, -1211.6385498046875, -1184.5675048828125, -1157.49658203125, -1130.425537109375, -1103.3546142578125, -1076.2835693359375, -1049.212646484375, -1022.1416625976562, -995.0706787109375, -967.9996337890625, -940.9285888671875, -913.8576049804688, -886.78662109375, -859.7156372070312, -832.6446533203125, -805.5736694335938, -778.502685546875, -751.431640625, -724.3607177734375, -697.2897338867188, -670.21875, -643.1477661132812, -616.0767822265625, -589.0057983398438, -561.934814453125, -534.86376953125, -507.7928161621094, -480.7218322753906, -453.6508483886719, -426.579833984375, -399.50885009765625, -372.4378662109375, -345.36688232421875, -318.2958984375, -291.22491455078125, -264.1539306640625, -237.08294677734375, -210.01194763183594, -182.9409637451172, -155.86997985839844, -128.79898071289062, -101.72799682617188, -74.65701293945312, -47.58602523803711, -20.515037536621094, 6.5559539794921875, 33.62693786621094, 60.69792175292969, 87.7689208984375, 114.83990478515625, 141.910888671875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 9.0, 8.0, 4.0, 21.0, 18.0, 25.0, 12.0, 26.0, 20.0, 23.0, 22.0, 29.0, 34.0, 28.0, 33.0, 32.0, 45.0, 41.0, 31.0, 33.0, 43.0, 39.0, 42.0, 44.0, 49.0, 33.0, 33.0, 26.0, 21.0, 25.0, 21.0, 25.0, 12.0, 9.0, 10.0, 10.0, 8.0, 15.0, 8.0, 8.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-394.71240234375, -381.53668212890625, -368.3609619140625, -355.18524169921875, -342.009521484375, -328.83380126953125, -315.6580810546875, -302.48236083984375, -289.306640625, -276.13092041015625, -262.9552001953125, -249.77947998046875, -236.603759765625, -223.42803955078125, -210.25233459472656, -197.0766143798828, -183.90090942382812, -170.72518920898438, -157.54946899414062, -144.37374877929688, -131.19802856445312, -118.0223159790039, -104.84660339355469, -91.67088317871094, -78.49516296386719, -65.31944274902344, -52.14372634887695, -38.96800994873047, -25.79228973388672, -12.616569519042969, 0.55914306640625, 13.73486328125, 26.910552978515625, 40.086273193359375, 53.26198959350586, 66.43770599365234, 79.6134262084961, 92.78914642333984, 105.96485900878906, 119.14057922363281, 132.31629943847656, 145.4920196533203, 158.66773986816406, 171.84344482421875, 185.0191650390625, 198.19488525390625, 211.37060546875, 224.54632568359375, 237.7220458984375, 250.89776611328125, 264.073486328125, 277.24920654296875, 290.4249267578125, 303.60064697265625, 316.7763671875, 329.95208740234375, 343.1278076171875, 356.30352783203125, 369.479248046875, 382.65496826171875, 395.8306884765625, 409.00640869140625, 422.18212890625, 435.35784912109375, 448.5335388183594]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 7.0, 11.0, 20.0, 12.0, 16.0, 25.0, 27.0, 25.0, 32.0, 35.0, 29.0, 28.0, 44.0, 31.0, 55.0, 55.0, 31.0, 49.0, 44.0, 41.0, 51.0, 36.0, 43.0, 36.0, 28.0, 22.0, 31.0, 20.0, 21.0, 24.0, 14.0, 12.0, 6.0, 4.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.625, -90.6845703125, -87.744140625, -84.8037109375, -81.86328125, -78.9228515625, -75.982421875, -73.0419921875, -70.1015625, -67.1611328125, -64.220703125, -61.2802734375, -58.33984375, -55.3994140625, -52.458984375, -49.5185546875, -46.578125, -43.6376953125, -40.697265625, -37.7568359375, -34.81640625, -31.8759765625, -28.935546875, -25.9951171875, -23.0546875, -20.1142578125, -17.173828125, -14.2333984375, -11.29296875, -8.3525390625, -5.412109375, -2.4716796875, 0.46875, 3.4091796875, 6.349609375, 9.2900390625, 12.23046875, 15.1708984375, 18.111328125, 21.0517578125, 23.9921875, 26.9326171875, 29.873046875, 32.8134765625, 35.75390625, 38.6943359375, 41.634765625, 44.5751953125, 47.515625, 50.4560546875, 53.396484375, 56.3369140625, 59.27734375, 62.2177734375, 65.158203125, 68.0986328125, 71.0390625, 73.9794921875, 76.919921875, 79.8603515625, 82.80078125, 85.7412109375, 88.681640625, 91.6220703125, 94.5625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 5.0, 4.0, 10.0, 9.0, 18.0, 29.0, 31.0, 50.0, 69.0, 112.0, 136.0, 274.0, 525.0, 4027.0, 4182422.0, 5312.0, 487.0, 213.0, 156.0, 87.0, 55.0, 67.0, 43.0, 25.0, 16.0, 13.0, 10.0, 10.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2194.0, -2117.09375, -2040.1875, -1963.28125, -1886.375, -1809.46875, -1732.5625, -1655.65625, -1578.75, -1501.84375, -1424.9375, -1348.03125, -1271.125, -1194.21875, -1117.3125, -1040.40625, -963.5, -886.59375, -809.6875, -732.78125, -655.875, -578.96875, -502.0625, -425.15625, -348.25, -271.34375, -194.4375, -117.53125, -40.625, 36.28125, 113.1875, 190.09375, 267.0, 343.90625, 420.8125, 497.71875, 574.625, 651.53125, 728.4375, 805.34375, 882.25, 959.15625, 1036.0625, 1112.96875, 1189.875, 1266.78125, 1343.6875, 1420.59375, 1497.5, 1574.40625, 1651.3125, 1728.21875, 1805.125, 1882.03125, 1958.9375, 2035.84375, 2112.75, 2189.65625, 2266.5625, 2343.46875, 2420.375, 2497.28125, 2574.1875, 2651.09375, 2728.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 7.0, 7.0, 10.0, 10.0, 8.0, 17.0, 9.0, 16.0, 20.0, 30.0, 24.0, 42.0, 53.0, 75.0, 111.0, 231.0, 435.0, 942.0, 923.0, 433.0, 207.0, 140.0, 72.0, 53.0, 43.0, 32.0, 31.0, 20.0, 22.0, 8.0, 9.0, 10.0, 5.0, 3.0, 2.0, 3.0, 7.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-124.6875, -120.2333984375, -115.779296875, -111.3251953125, -106.87109375, -102.4169921875, -97.962890625, -93.5087890625, -89.0546875, -84.6005859375, -80.146484375, -75.6923828125, -71.23828125, -66.7841796875, -62.330078125, -57.8759765625, -53.421875, -48.9677734375, -44.513671875, -40.0595703125, -35.60546875, -31.1513671875, -26.697265625, -22.2431640625, -17.7890625, -13.3349609375, -8.880859375, -4.4267578125, 0.02734375, 4.4814453125, 8.935546875, 13.3896484375, 17.84375, 22.2978515625, 26.751953125, 31.2060546875, 35.66015625, 40.1142578125, 44.568359375, 49.0224609375, 53.4765625, 57.9306640625, 62.384765625, 66.8388671875, 71.29296875, 75.7470703125, 80.201171875, 84.6552734375, 89.109375, 93.5634765625, 98.017578125, 102.4716796875, 106.92578125, 111.3798828125, 115.833984375, 120.2880859375, 124.7421875, 129.1962890625, 133.650390625, 138.1044921875, 142.55859375, 147.0126953125, 151.466796875, 155.9208984375, 160.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 15.0, 9.0, 14.0, 15.0, 21.0, 21.0, 24.0, 29.0, 42.0, 43.0, 63.0, 126.0, 661.0, 6183.0, 149271.0, 4006633.0, 28338.0, 2024.0, 328.0, 120.0, 48.0, 36.0, 33.0, 35.0, 25.0, 19.0, 13.0, 8.0, 12.0, 10.0, 9.0, 5.0, 9.0, 5.0, 6.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-828.0, -802.34375, -776.6875, -751.03125, -725.375, -699.71875, -674.0625, -648.40625, -622.75, -597.09375, -571.4375, -545.78125, -520.125, -494.46875, -468.8125, -443.15625, -417.5, -391.84375, -366.1875, -340.53125, -314.875, -289.21875, -263.5625, -237.90625, -212.25, -186.59375, -160.9375, -135.28125, -109.625, -83.96875, -58.3125, -32.65625, -7.0, 18.65625, 44.3125, 69.96875, 95.625, 121.28125, 146.9375, 172.59375, 198.25, 223.90625, 249.5625, 275.21875, 300.875, 326.53125, 352.1875, 377.84375, 403.5, 429.15625, 454.8125, 480.46875, 506.125, 531.78125, 557.4375, 583.09375, 608.75, 634.40625, 660.0625, 685.71875, 711.375, 737.03125, 762.6875, 788.34375, 814.0]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 38.0, 133.0, 379.0, 321.0, 110.0, 19.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-642.8279418945312, -588.6417846679688, -534.4556884765625, -480.26953125, -426.0834045410156, -371.89727783203125, -317.71112060546875, -263.5249938964844, -209.3388671875, -155.15274047851562, -100.96659851074219, -46.78045654296875, 7.405670166015625, 61.591796875, 115.7779541015625, 169.96408081054688, 224.15020751953125, 278.3363342285156, 332.5224609375, 386.7086181640625, 440.8947448730469, 495.08087158203125, 549.2670288085938, 603.453125, 657.6392822265625, 711.825439453125, 766.0115356445312, 820.1976928710938, 874.3837890625, 928.5699462890625, 982.756103515625, 1036.9422607421875, 1091.12841796875, 1145.3145751953125, 1199.500732421875, 1253.686767578125, 1307.8729248046875, 1362.05908203125, 1416.2452392578125, 1470.431396484375, 1524.617431640625, 1578.8035888671875, 1632.98974609375, 1687.17578125, 1741.3619384765625, 1795.548095703125, 1849.7342529296875, 1903.92041015625, 1958.1065673828125, 2012.292724609375, 2066.478759765625, 2120.6650390625, 2174.85107421875, 2229.037109375, 2283.223388671875, 2337.409423828125, 2391.595703125, 2445.78173828125, 2499.968017578125, 2554.154052734375, 2608.34033203125, 2662.5263671875, 2716.71240234375, 2770.898681640625, 2825.084716796875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 2.0, 2.0, 8.0, 6.0, 19.0, 17.0, 17.0, 21.0, 26.0, 16.0, 25.0, 19.0, 26.0, 33.0, 32.0, 45.0, 38.0, 37.0, 45.0, 43.0, 38.0, 34.0, 31.0, 41.0, 33.0, 40.0, 30.0, 24.0, 32.0, 23.0, 28.0, 21.0, 19.0, 18.0, 22.0, 17.0, 14.0, 10.0, 11.0, 4.0, 6.0, 11.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-382.009033203125, -370.2220458984375, -358.4350891113281, -346.6481018066406, -334.86114501953125, -323.07415771484375, -311.28717041015625, -299.5002136230469, -287.7132568359375, -275.92626953125, -264.1393127441406, -252.35232543945312, -240.56536865234375, -228.77838134765625, -216.9914093017578, -205.20443725585938, -193.41744995117188, -181.63047790527344, -169.843505859375, -158.0565185546875, -146.26956176757812, -134.48257446289062, -122.69560241699219, -110.90863037109375, -99.12165832519531, -87.33468627929688, -75.54771423339844, -63.76073455810547, -51.97376251220703, -40.186790466308594, -28.399810791015625, -16.612838745117188, -4.82586669921875, 6.96110725402832, 18.74808120727539, 30.535057067871094, 42.32202911376953, 54.10900115966797, 65.89598083496094, 77.68295288085938, 89.46992492675781, 101.25689697265625, 113.04386901855469, 124.83084869384766, 136.61782836914062, 148.40478515625, 160.1917724609375, 171.97874450683594, 183.76571655273438, 195.5526885986328, 207.33966064453125, 219.12664794921875, 230.91360473632812, 242.70059204101562, 254.48756408691406, 266.2745361328125, 278.0615234375, 289.8485107421875, 301.6354675292969, 313.4224548339844, 325.20941162109375, 336.99639892578125, 348.78338623046875, 360.5703430175781, 372.3572998046875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 12.0, 9.0, 10.0, 20.0, 25.0, 19.0, 30.0, 19.0, 21.0, 31.0, 31.0, 38.0, 38.0, 33.0, 45.0, 41.0, 43.0, 47.0, 34.0, 44.0, 50.0, 50.0, 26.0, 33.0, 31.0, 40.0, 29.0, 32.0, 15.0, 25.0, 17.0, 11.0, 17.0, 6.0, 4.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.25, -92.4873046875, -89.724609375, -86.9619140625, -84.19921875, -81.4365234375, -78.673828125, -75.9111328125, -73.1484375, -70.3857421875, -67.623046875, -64.8603515625, -62.09765625, -59.3349609375, -56.572265625, -53.8095703125, -51.046875, -48.2841796875, -45.521484375, -42.7587890625, -39.99609375, -37.2333984375, -34.470703125, -31.7080078125, -28.9453125, -26.1826171875, -23.419921875, -20.6572265625, -17.89453125, -15.1318359375, -12.369140625, -9.6064453125, -6.84375, -4.0810546875, -1.318359375, 1.4443359375, 4.20703125, 6.9697265625, 9.732421875, 12.4951171875, 15.2578125, 18.0205078125, 20.783203125, 23.5458984375, 26.30859375, 29.0712890625, 31.833984375, 34.5966796875, 37.359375, 40.1220703125, 42.884765625, 45.6474609375, 48.41015625, 51.1728515625, 53.935546875, 56.6982421875, 59.4609375, 62.2236328125, 64.986328125, 67.7490234375, 70.51171875, 73.2744140625, 76.037109375, 78.7998046875, 81.5625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 10.0, 15.0, 16.0, 19.0, 21.0, 49.0, 54.0, 92.0, 103.0, 202.0, 265.0, 428.0, 648.0, 1047.0, 1738.0, 3312.0, 6485.0, 14010.0, 32193.0, 86415.0, 286110.0, 416961.0, 120368.0, 42906.0, 17552.0, 7996.0, 3993.0, 2116.0, 1217.0, 771.0, 489.0, 293.0, 217.0, 130.0, 105.0, 71.0, 47.0, 29.0, 14.0, 12.0, 14.0, 7.0, 12.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.01318359375, -15.4638671875, -14.91455078125, -14.365234375, -13.81591796875, -13.2666015625, -12.71728515625, -12.16796875, -11.61865234375, -11.0693359375, -10.52001953125, -9.970703125, -9.42138671875, -8.8720703125, -8.32275390625, -7.7734375, -7.22412109375, -6.6748046875, -6.12548828125, -5.576171875, -5.02685546875, -4.4775390625, -3.92822265625, -3.37890625, -2.82958984375, -2.2802734375, -1.73095703125, -1.181640625, -0.63232421875, -0.0830078125, 0.46630859375, 1.015625, 1.56494140625, 2.1142578125, 2.66357421875, 3.212890625, 3.76220703125, 4.3115234375, 4.86083984375, 5.41015625, 5.95947265625, 6.5087890625, 7.05810546875, 7.607421875, 8.15673828125, 8.7060546875, 9.25537109375, 9.8046875, 10.35400390625, 10.9033203125, 11.45263671875, 12.001953125, 12.55126953125, 13.1005859375, 13.64990234375, 14.19921875, 14.74853515625, 15.2978515625, 15.84716796875, 16.396484375, 16.94580078125, 17.4951171875, 18.04443359375, 18.59375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 1.0, 5.0, 7.0, 10.0, 7.0, 9.0, 11.0, 22.0, 20.0, 20.0, 25.0, 25.0, 32.0, 39.0, 32.0, 27.0, 47.0, 38.0, 38.0, 44.0, 1079.0, 38.0, 42.0, 45.0, 30.0, 40.0, 38.0, 31.0, 27.0, 45.0, 28.0, 12.0, 21.0, 14.0, 18.0, 14.0, 4.0, 5.0, 11.0, 14.0, 8.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-58.21875, -56.4453125, -54.671875, -52.8984375, -51.125, -49.3515625, -47.578125, -45.8046875, -44.03125, -42.2578125, -40.484375, -38.7109375, -36.9375, -35.1640625, -33.390625, -31.6171875, -29.84375, -28.0703125, -26.296875, -24.5234375, -22.75, -20.9765625, -19.203125, -17.4296875, -15.65625, -13.8828125, -12.109375, -10.3359375, -8.5625, -6.7890625, -5.015625, -3.2421875, -1.46875, 0.3046875, 2.078125, 3.8515625, 5.625, 7.3984375, 9.171875, 10.9453125, 12.71875, 14.4921875, 16.265625, 18.0390625, 19.8125, 21.5859375, 23.359375, 25.1328125, 26.90625, 28.6796875, 30.453125, 32.2265625, 34.0, 35.7734375, 37.546875, 39.3203125, 41.09375, 42.8671875, 44.640625, 46.4140625, 48.1875, 49.9609375, 51.734375, 53.5078125, 55.28125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 3.0, 6.0, 9.0, 12.0, 18.0, 14.0, 22.0, 42.0, 39.0, 62.0, 82.0, 122.0, 160.0, 238.0, 354.0, 492.0, 743.0, 1131.0, 1896.0, 2801.0, 4409.0, 7450.0, 11833.0, 19614.0, 33589.0, 57523.0, 101384.0, 193150.0, 1299189.0, 153821.0, 85347.0, 48671.0, 28431.0, 16917.0, 10226.0, 6048.0, 3910.0, 2419.0, 1635.0, 1065.0, 718.0, 474.0, 323.0, 263.0, 152.0, 105.0, 56.0, 55.0, 29.0, 25.0, 13.0, 14.0, 10.0, 7.0, 9.0, 5.0, 5.0, 1.0, 2.0, 3.0], "bins": [-4.91015625, -4.75836181640625, -4.6065673828125, -4.45477294921875, -4.302978515625, -4.15118408203125, -3.9993896484375, -3.84759521484375, -3.69580078125, -3.54400634765625, -3.3922119140625, -3.24041748046875, -3.088623046875, -2.93682861328125, -2.7850341796875, -2.63323974609375, -2.4814453125, -2.32965087890625, -2.1778564453125, -2.02606201171875, -1.874267578125, -1.72247314453125, -1.5706787109375, -1.41888427734375, -1.26708984375, -1.11529541015625, -0.9635009765625, -0.81170654296875, -0.659912109375, -0.50811767578125, -0.3563232421875, -0.20452880859375, -0.052734375, 0.09906005859375, 0.2508544921875, 0.40264892578125, 0.554443359375, 0.70623779296875, 0.8580322265625, 1.00982666015625, 1.16162109375, 1.31341552734375, 1.4652099609375, 1.61700439453125, 1.768798828125, 1.92059326171875, 2.0723876953125, 2.22418212890625, 2.3759765625, 2.52777099609375, 2.6795654296875, 2.83135986328125, 2.983154296875, 3.13494873046875, 3.2867431640625, 3.43853759765625, 3.59033203125, 3.74212646484375, 3.8939208984375, 4.04571533203125, 4.197509765625, 4.34930419921875, 4.5010986328125, 4.65289306640625, 4.8046875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 3.0, 8.0, 7.0, 8.0, 5.0, 8.0, 9.0, 15.0, 9.0, 19.0, 20.0, 21.0, 34.0, 53.0, 80.0, 97.0, 111.0, 136.0, 93.0, 50.0, 41.0, 27.0, 32.0, 21.0, 12.0, 13.0, 9.0, 7.0, 7.0, 6.0, 7.0, 2.0, 2.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2410888671875, -0.23300743103027344, -0.22492599487304688, -0.2168445587158203, -0.20876312255859375, -0.2006816864013672, -0.19260025024414062, -0.18451881408691406, -0.1764373779296875, -0.16835594177246094, -0.16027450561523438, -0.1521930694580078, -0.14411163330078125, -0.1360301971435547, -0.12794876098632812, -0.11986732482910156, -0.111785888671875, -0.10370445251464844, -0.09562301635742188, -0.08754158020019531, -0.07946014404296875, -0.07137870788574219, -0.06329727172851562, -0.05521583557128906, -0.0471343994140625, -0.03905296325683594, -0.030971527099609375, -0.022890090942382812, -0.01480865478515625, -0.0067272186279296875, 0.001354217529296875, 0.009435653686523438, 0.01751708984375, 0.025598526000976562, 0.033679962158203125, 0.04176139831542969, 0.04984283447265625, 0.05792427062988281, 0.06600570678710938, 0.07408714294433594, 0.0821685791015625, 0.09025001525878906, 0.09833145141601562, 0.10641288757324219, 0.11449432373046875, 0.12257575988769531, 0.13065719604492188, 0.13873863220214844, 0.146820068359375, 0.15490150451660156, 0.16298294067382812, 0.1710643768310547, 0.17914581298828125, 0.1872272491455078, 0.19530868530273438, 0.20339012145996094, 0.2114715576171875, 0.21955299377441406, 0.22763442993164062, 0.2357158660888672, 0.24379730224609375, 0.2518787384033203, 0.2599601745605469, 0.26804161071777344, 0.276123046875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 7.0, 5.0, 2.0, 5.0, 8.0, 13.0, 13.0, 15.0, 16.0, 28.0, 38.0, 52.0, 63.0, 118.0, 232.0, 718.0, 980269.0, 65759.0, 589.0, 212.0, 114.0, 57.0, 52.0, 39.0, 20.0, 15.0, 13.0, 16.0, 9.0, 9.0, 13.0, 8.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.7578125, -9.478515625, -9.19921875, -8.919921875, -8.640625, -8.361328125, -8.08203125, -7.802734375, -7.5234375, -7.244140625, -6.96484375, -6.685546875, -6.40625, -6.126953125, -5.84765625, -5.568359375, -5.2890625, -5.009765625, -4.73046875, -4.451171875, -4.171875, -3.892578125, -3.61328125, -3.333984375, -3.0546875, -2.775390625, -2.49609375, -2.216796875, -1.9375, -1.658203125, -1.37890625, -1.099609375, -0.8203125, -0.541015625, -0.26171875, 0.017578125, 0.296875, 0.576171875, 0.85546875, 1.134765625, 1.4140625, 1.693359375, 1.97265625, 2.251953125, 2.53125, 2.810546875, 3.08984375, 3.369140625, 3.6484375, 3.927734375, 4.20703125, 4.486328125, 4.765625, 5.044921875, 5.32421875, 5.603515625, 5.8828125, 6.162109375, 6.44140625, 6.720703125, 7.0, 7.279296875, 7.55859375, 7.837890625, 8.1171875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 942.0, 72.0, 3.0, 1.0], "bins": [-13.160978317260742, -12.94421672821045, -12.727455139160156, -12.51069450378418, -12.293932914733887, -12.077171325683594, -11.8604097366333, -11.643648147583008, -11.426886558532715, -11.210124969482422, -10.993363380432129, -10.776601791381836, -10.55984115600586, -10.343079566955566, -10.126317977905273, -9.90955638885498, -9.692795753479004, -9.476034164428711, -9.259272575378418, -9.042510986328125, -8.825750350952148, -8.608988761901855, -8.392227172851562, -8.17546558380127, -7.958703994750977, -7.741942405700684, -7.525181293487549, -7.308419704437256, -7.091658115386963, -6.874897003173828, -6.658135414123535, -6.441373825073242, -6.224612236022949, -6.007850646972656, -5.7910895347595215, -5.5743279457092285, -5.3575663566589355, -5.140805244445801, -4.924043655395508, -4.707282066345215, -4.49052095413208, -4.273759365081787, -4.056998252868652, -3.8402366638183594, -3.6234753131866455, -3.4067139625549316, -3.1899523735046387, -2.973191022872925, -2.756429672241211, -2.539668321609497, -2.322906732559204, -2.1061453819274902, -1.8893840312957764, -1.672622561454773, -1.4558610916137695, -1.2390997409820557, -1.0223382711410522, -0.8055768609046936, -0.588815450668335, -0.37205398082733154, -0.1552925705909729, 0.06146883964538574, 0.27823030948638916, 0.494991660118103, 0.7117531299591064]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 4.0, 7.0, 8.0, 9.0, 11.0, 10.0, 9.0, 9.0, 12.0, 15.0, 22.0, 16.0, 24.0, 36.0, 31.0, 27.0, 25.0, 39.0, 45.0, 32.0, 31.0, 38.0, 38.0, 33.0, 31.0, 34.0, 49.0, 35.0, 29.0, 30.0, 29.0, 29.0, 27.0, 15.0, 15.0, 23.0, 23.0, 20.0, 11.0, 13.0, 6.0, 14.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2085365653038025, -0.20219039916992188, -0.19584421813488007, -0.18949805200099945, -0.18315188586711884, -0.17680570483207703, -0.1704595386981964, -0.1641133725643158, -0.15776720643043518, -0.15142104029655457, -0.14507485926151276, -0.13872869312763214, -0.13238252699375153, -0.12603634595870972, -0.1196901798248291, -0.11334401369094849, -0.10699783265590668, -0.10065165907144547, -0.09430549293756485, -0.08795931935310364, -0.08161315321922302, -0.07526697963476181, -0.0689208060503006, -0.06257463991641998, -0.05622846633195877, -0.04988229647278786, -0.04353612661361694, -0.03718995302915573, -0.030843783169984818, -0.024497613310813904, -0.01815143972635269, -0.011805269867181778, -0.005459100008010864, 0.000887070782482624, 0.007233241572976112, 0.013579413294792175, 0.01992558315396309, 0.026271753013134003, 0.032617926597595215, 0.03896409645676613, 0.04531026631593704, 0.051656436175107956, 0.05800260603427887, 0.06434877961874008, 0.0706949532032013, 0.07704111933708191, 0.08338729292154312, 0.08973346650600433, 0.09607963263988495, 0.10242580622434616, 0.10877197235822678, 0.11511814594268799, 0.1214643120765686, 0.12781047821044922, 0.13415665924549103, 0.14050282537937164, 0.14684900641441345, 0.15319517254829407, 0.15954135358333588, 0.1658875197172165, 0.1722336858510971, 0.17857986688613892, 0.18492603302001953, 0.19127219915390015, 0.19761836528778076]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 12.0, 9.0, 10.0, 20.0, 25.0, 19.0, 30.0, 19.0, 21.0, 31.0, 31.0, 38.0, 38.0, 33.0, 45.0, 40.0, 44.0, 47.0, 34.0, 44.0, 50.0, 50.0, 26.0, 33.0, 31.0, 40.0, 29.0, 32.0, 15.0, 25.0, 17.0, 10.0, 18.0, 6.0, 4.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.25, -92.4873046875, -89.724609375, -86.9619140625, -84.19921875, -81.4365234375, -78.673828125, -75.9111328125, -73.1484375, -70.3857421875, -67.623046875, -64.8603515625, -62.09765625, -59.3349609375, -56.572265625, -53.8095703125, -51.046875, -48.2841796875, -45.521484375, -42.7587890625, -39.99609375, -37.2333984375, -34.470703125, -31.7080078125, -28.9453125, -26.1826171875, -23.419921875, -20.6572265625, -17.89453125, -15.1318359375, -12.369140625, -9.6064453125, -6.84375, -4.0810546875, -1.318359375, 1.4443359375, 4.20703125, 6.9697265625, 9.732421875, 12.4951171875, 15.2578125, 18.0205078125, 20.783203125, 23.5458984375, 26.30859375, 29.0712890625, 31.833984375, 34.5966796875, 37.359375, 40.1220703125, 42.884765625, 45.6474609375, 48.41015625, 51.1728515625, 53.935546875, 56.6982421875, 59.4609375, 62.2236328125, 64.986328125, 67.7490234375, 70.51171875, 73.2744140625, 76.037109375, 78.7998046875, 81.5625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 5.0, 14.0, 17.0, 16.0, 21.0, 42.0, 61.0, 75.0, 81.0, 144.0, 207.0, 273.0, 447.0, 609.0, 820.0, 1203.0, 1859.0, 2831.0, 4859.0, 8870.0, 18755.0, 45502.0, 136400.0, 461342.0, 239423.0, 69548.0, 26452.0, 12027.0, 6153.0, 3668.0, 2152.0, 1469.0, 925.0, 679.0, 454.0, 344.0, 243.0, 141.0, 128.0, 90.0, 58.0, 38.0, 34.0, 19.0, 17.0, 11.0, 8.0, 10.0, 6.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-131.125, -127.1162109375, -123.107421875, -119.0986328125, -115.08984375, -111.0810546875, -107.072265625, -103.0634765625, -99.0546875, -95.0458984375, -91.037109375, -87.0283203125, -83.01953125, -79.0107421875, -75.001953125, -70.9931640625, -66.984375, -62.9755859375, -58.966796875, -54.9580078125, -50.94921875, -46.9404296875, -42.931640625, -38.9228515625, -34.9140625, -30.9052734375, -26.896484375, -22.8876953125, -18.87890625, -14.8701171875, -10.861328125, -6.8525390625, -2.84375, 1.1650390625, 5.173828125, 9.1826171875, 13.19140625, 17.2001953125, 21.208984375, 25.2177734375, 29.2265625, 33.2353515625, 37.244140625, 41.2529296875, 45.26171875, 49.2705078125, 53.279296875, 57.2880859375, 61.296875, 65.3056640625, 69.314453125, 73.3232421875, 77.33203125, 81.3408203125, 85.349609375, 89.3583984375, 93.3671875, 97.3759765625, 101.384765625, 105.3935546875, 109.40234375, 113.4111328125, 117.419921875, 121.4287109375, 125.4375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 6.0, 9.0, 10.0, 16.0, 19.0, 26.0, 34.0, 31.0, 37.0, 40.0, 66.0, 68.0, 102.0, 231.0, 1567.0, 252.0, 109.0, 65.0, 75.0, 49.0, 43.0, 43.0, 32.0, 25.0, 21.0, 17.0, 4.0, 9.0, 7.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-261.5, -253.234375, -244.96875, -236.703125, -228.4375, -220.171875, -211.90625, -203.640625, -195.375, -187.109375, -178.84375, -170.578125, -162.3125, -154.046875, -145.78125, -137.515625, -129.25, -120.984375, -112.71875, -104.453125, -96.1875, -87.921875, -79.65625, -71.390625, -63.125, -54.859375, -46.59375, -38.328125, -30.0625, -21.796875, -13.53125, -5.265625, 3.0, 11.265625, 19.53125, 27.796875, 36.0625, 44.328125, 52.59375, 60.859375, 69.125, 77.390625, 85.65625, 93.921875, 102.1875, 110.453125, 118.71875, 126.984375, 135.25, 143.515625, 151.78125, 160.046875, 168.3125, 176.578125, 184.84375, 193.109375, 201.375, 209.640625, 217.90625, 226.171875, 234.4375, 242.703125, 250.96875, 259.234375, 267.5]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 9.0, 8.0, 12.0, 13.0, 17.0, 29.0, 25.0, 47.0, 75.0, 128.0, 208.0, 424.0, 1340.0, 75354.0, 3063374.0, 3221.0, 661.0, 298.0, 152.0, 106.0, 53.0, 40.0, 23.0, 22.0, 7.0, 19.0, 18.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1222.0, -1188.25, -1154.5, -1120.75, -1087.0, -1053.25, -1019.5, -985.75, -952.0, -918.25, -884.5, -850.75, -817.0, -783.25, -749.5, -715.75, -682.0, -648.25, -614.5, -580.75, -547.0, -513.25, -479.5, -445.75, -412.0, -378.25, -344.5, -310.75, -277.0, -243.25, -209.5, -175.75, -142.0, -108.25, -74.5, -40.75, -7.0, 26.75, 60.5, 94.25, 128.0, 161.75, 195.5, 229.25, 263.0, 296.75, 330.5, 364.25, 398.0, 431.75, 465.5, 499.25, 533.0, 566.75, 600.5, 634.25, 668.0, 701.75, 735.5, 769.25, 803.0, 836.75, 870.5, 904.25, 938.0]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 15.0, 506.0, 486.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7437.69970703125, -7272.3701171875, -7107.0400390625, -6941.71044921875, -6776.380859375, -6611.05126953125, -6445.72119140625, -6280.3916015625, -6115.06201171875, -5949.732421875, -5784.40234375, -5619.07275390625, -5453.7431640625, -5288.41357421875, -5123.08349609375, -4957.75390625, -4792.423828125, -4627.09423828125, -4461.76416015625, -4296.4345703125, -4131.10498046875, -3965.775146484375, -3800.4453125, -3635.11572265625, -3469.7861328125, -3304.456298828125, -3139.126708984375, -2973.796875, -2808.46728515625, -2643.137451171875, -2477.8076171875, -2312.47802734375, -2147.1484375, -1981.8187255859375, -1816.489013671875, -1651.1591796875, -1485.82958984375, -1320.499755859375, -1155.1700439453125, -989.84033203125, -824.5106201171875, -659.180908203125, -493.8511657714844, -328.52142333984375, -163.19171142578125, 2.13800048828125, 167.4677734375, 332.7974853515625, 498.127197265625, 663.4569091796875, 828.78662109375, 994.1163940429688, 1159.446044921875, 1324.77587890625, 1490.1055908203125, 1655.435302734375, 1820.7650146484375, 1986.0947265625, 2151.424560546875, 2316.754150390625, 2482.083984375, 2647.41357421875, 2812.743408203125, 2978.0732421875, 3143.40283203125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 11.0, 6.0, 5.0, 11.0, 10.0, 13.0, 16.0, 21.0, 21.0, 24.0, 25.0, 20.0, 25.0, 32.0, 40.0, 35.0, 41.0, 29.0, 38.0, 44.0, 33.0, 50.0, 43.0, 33.0, 29.0, 33.0, 35.0, 36.0, 24.0, 29.0, 29.0, 19.0, 26.0, 17.0, 17.0, 8.0, 14.0, 15.0, 13.0, 5.0, 2.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-535.8380737304688, -517.5827026367188, -499.3272705078125, -481.0718688964844, -462.81646728515625, -444.5610656738281, -426.3056640625, -408.05029296875, -389.79486083984375, -371.5394592285156, -353.2840576171875, -335.0286560058594, -316.77325439453125, -298.5178527832031, -280.262451171875, -262.007080078125, -243.75167846679688, -225.49627685546875, -207.24087524414062, -188.9854736328125, -170.73007202148438, -152.47467041015625, -134.2192840576172, -115.96388244628906, -97.70848083496094, -79.45307922363281, -61.19768142700195, -42.942283630371094, -24.68688201904297, -6.431480407714844, 11.82391357421875, 30.079315185546875, 48.334716796875, 66.59011840820312, 84.84552001953125, 103.10091400146484, 121.35631561279297, 139.61172485351562, 157.8671112060547, 176.1225128173828, 194.37791442871094, 212.63331604003906, 230.8887176513672, 249.14410400390625, 267.3995056152344, 285.6549072265625, 303.9103088378906, 322.16571044921875, 340.4211120605469, 358.676513671875, 376.9319152832031, 395.18731689453125, 413.4427185058594, 431.6981201171875, 449.9534912109375, 468.20892333984375, 486.46429443359375, 504.7196960449219, 522.97509765625, 541.23046875, 559.4859008789062, 577.7412719726562, 595.9967041015625, 614.2520751953125, 632.5075073242188]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 4.0, 6.0, 7.0, 7.0, 17.0, 11.0, 17.0, 16.0, 22.0, 19.0, 27.0, 30.0, 23.0, 33.0, 38.0, 46.0, 40.0, 42.0, 52.0, 41.0, 42.0, 42.0, 42.0, 39.0, 45.0, 38.0, 36.0, 33.0, 33.0, 29.0, 31.0, 20.0, 13.0, 10.0, 9.0, 2.0, 11.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-105.9375, -102.9794921875, -100.021484375, -97.0634765625, -94.10546875, -91.1474609375, -88.189453125, -85.2314453125, -82.2734375, -79.3154296875, -76.357421875, -73.3994140625, -70.44140625, -67.4833984375, -64.525390625, -61.5673828125, -58.609375, -55.6513671875, -52.693359375, -49.7353515625, -46.77734375, -43.8193359375, -40.861328125, -37.9033203125, -34.9453125, -31.9873046875, -29.029296875, -26.0712890625, -23.11328125, -20.1552734375, -17.197265625, -14.2392578125, -11.28125, -8.3232421875, -5.365234375, -2.4072265625, 0.55078125, 3.5087890625, 6.466796875, 9.4248046875, 12.3828125, 15.3408203125, 18.298828125, 21.2568359375, 24.21484375, 27.1728515625, 30.130859375, 33.0888671875, 36.046875, 39.0048828125, 41.962890625, 44.9208984375, 47.87890625, 50.8369140625, 53.794921875, 56.7529296875, 59.7109375, 62.6689453125, 65.626953125, 68.5849609375, 71.54296875, 74.5009765625, 77.458984375, 80.4169921875, 83.375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 5.0, 18.0, 19.0, 25.0, 33.0, 35.0, 49.0, 65.0, 83.0, 111.0, 142.0, 214.0, 295.0, 385.0, 570.0, 843.0, 1390.0, 2484.0, 4912.0, 11313.0, 32341.0, 253419.0, 3061812.0, 737988.0, 56047.0, 15364.0, 6402.0, 3013.0, 1652.0, 951.0, 653.0, 444.0, 292.0, 225.0, 156.0, 117.0, 100.0, 65.0, 51.0, 48.0, 38.0, 27.0, 14.0, 16.0, 9.0, 12.0, 6.0, 9.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-225.375, -218.02734375, -210.6796875, -203.33203125, -195.984375, -188.63671875, -181.2890625, -173.94140625, -166.59375, -159.24609375, -151.8984375, -144.55078125, -137.203125, -129.85546875, -122.5078125, -115.16015625, -107.8125, -100.46484375, -93.1171875, -85.76953125, -78.421875, -71.07421875, -63.7265625, -56.37890625, -49.03125, -41.68359375, -34.3359375, -26.98828125, -19.640625, -12.29296875, -4.9453125, 2.40234375, 9.75, 17.09765625, 24.4453125, 31.79296875, 39.140625, 46.48828125, 53.8359375, 61.18359375, 68.53125, 75.87890625, 83.2265625, 90.57421875, 97.921875, 105.26953125, 112.6171875, 119.96484375, 127.3125, 134.66015625, 142.0078125, 149.35546875, 156.703125, 164.05078125, 171.3984375, 178.74609375, 186.09375, 193.44140625, 200.7890625, 208.13671875, 215.484375, 222.83203125, 230.1796875, 237.52734375, 244.875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 8.0, 8.0, 12.0, 8.0, 15.0, 29.0, 45.0, 32.0, 83.0, 75.0, 133.0, 200.0, 272.0, 513.0, 833.0, 719.0, 367.0, 209.0, 146.0, 87.0, 72.0, 52.0, 31.0, 18.0, 27.0, 18.0, 18.0, 12.0, 8.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-248.125, -242.3203125, -236.515625, -230.7109375, -224.90625, -219.1015625, -213.296875, -207.4921875, -201.6875, -195.8828125, -190.078125, -184.2734375, -178.46875, -172.6640625, -166.859375, -161.0546875, -155.25, -149.4453125, -143.640625, -137.8359375, -132.03125, -126.2265625, -120.421875, -114.6171875, -108.8125, -103.0078125, -97.203125, -91.3984375, -85.59375, -79.7890625, -73.984375, -68.1796875, -62.375, -56.5703125, -50.765625, -44.9609375, -39.15625, -33.3515625, -27.546875, -21.7421875, -15.9375, -10.1328125, -4.328125, 1.4765625, 7.28125, 13.0859375, 18.890625, 24.6953125, 30.5, 36.3046875, 42.109375, 47.9140625, 53.71875, 59.5234375, 65.328125, 71.1328125, 76.9375, 82.7421875, 88.546875, 94.3515625, 100.15625, 105.9609375, 111.765625, 117.5703125, 123.375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 11.0, 13.0, 31.0, 37.0, 41.0, 66.0, 95.0, 177.0, 259.0, 487.0, 1051.0, 2492.0, 7180.0, 26244.0, 147579.0, 3316645.0, 609627.0, 60918.0, 13768.0, 4241.0, 1632.0, 705.0, 355.0, 217.0, 141.0, 82.0, 71.0, 29.0, 18.0, 26.0, 14.0, 8.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.25, -241.10546875, -230.9609375, -220.81640625, -210.671875, -200.52734375, -190.3828125, -180.23828125, -170.09375, -159.94921875, -149.8046875, -139.66015625, -129.515625, -119.37109375, -109.2265625, -99.08203125, -88.9375, -78.79296875, -68.6484375, -58.50390625, -48.359375, -38.21484375, -28.0703125, -17.92578125, -7.78125, 2.36328125, 12.5078125, 22.65234375, 32.796875, 42.94140625, 53.0859375, 63.23046875, 73.375, 83.51953125, 93.6640625, 103.80859375, 113.953125, 124.09765625, 134.2421875, 144.38671875, 154.53125, 164.67578125, 174.8203125, 184.96484375, 195.109375, 205.25390625, 215.3984375, 225.54296875, 235.6875, 245.83203125, 255.9765625, 266.12109375, 276.265625, 286.41015625, 296.5546875, 306.69921875, 316.84375, 326.98828125, 337.1328125, 347.27734375, 357.421875, 367.56640625, 377.7109375, 387.85546875, 398.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 23.0, 949.0, 40.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15112.060546875, -14787.337890625, -14462.6162109375, -14137.8935546875, -13813.1708984375, -13488.44921875, -13163.7265625, -12839.00390625, -12514.28125, -12189.55859375, -11864.8369140625, -11540.1142578125, -11215.3916015625, -10890.669921875, -10565.947265625, -10241.224609375, -9916.5029296875, -9591.7802734375, -9267.05859375, -8942.3359375, -8617.61328125, -8292.890625, -7968.1689453125, -7643.4462890625, -7318.72412109375, -6994.001953125, -6669.279296875, -6344.55712890625, -6019.8349609375, -5695.1123046875, -5370.39013671875, -5045.66796875, -4720.9462890625, -4396.22412109375, -4071.50146484375, -3746.779296875, -3422.056884765625, -3097.33447265625, -2772.6123046875, -2447.889892578125, -2123.16748046875, -1798.445068359375, -1473.7227783203125, -1149.00048828125, -824.278076171875, -499.5556640625, -174.8333740234375, 149.888916015625, 474.611328125, 799.3336791992188, 1124.0560302734375, 1448.7783203125, 1773.500732421875, 2098.22314453125, 2422.9453125, 2747.667724609375, 3072.39013671875, 3397.112548828125, 3721.8349609375, 4046.55712890625, 4371.279296875, 4696.001953125, 5020.72412109375, 5345.4462890625, 5670.1689453125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 9.0, 15.0, 11.0, 16.0, 20.0, 19.0, 29.0, 34.0, 34.0, 42.0, 44.0, 48.0, 55.0, 51.0, 45.0, 47.0, 57.0, 52.0, 58.0, 46.0, 45.0, 41.0, 31.0, 21.0, 35.0, 22.0, 16.0, 12.0, 8.0, 6.0, 8.0, 10.0, 4.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-706.4814453125, -682.6838989257812, -658.8864135742188, -635.0888671875, -611.2913208007812, -587.4937744140625, -563.6962890625, -539.8987426757812, -516.1011962890625, -492.3036804199219, -468.5061340332031, -444.7086181640625, -420.91107177734375, -397.1135559082031, -373.3160400390625, -349.51849365234375, -325.7209777832031, -301.9234619140625, -278.12591552734375, -254.32839965820312, -230.53085327148438, -206.73333740234375, -182.93580627441406, -159.13827514648438, -135.3407440185547, -111.543212890625, -87.74568176269531, -63.948158264160156, -40.15062713623047, -16.35309600830078, 7.444427490234375, 31.241958618164062, 55.03948974609375, 78.83702087402344, 102.63455200195312, 126.43207550048828, 150.2296142578125, 174.02713012695312, 197.8246612548828, 221.6221923828125, 245.4197235107422, 269.2172546386719, 293.0147705078125, 316.81231689453125, 340.6098327636719, 364.4073791503906, 388.20489501953125, 412.00244140625, 435.7999572753906, 459.59747314453125, 483.39501953125, 507.1925354003906, 530.9900512695312, 554.78759765625, 578.5851440429688, 602.3826904296875, 626.18017578125, 649.9777221679688, 673.7752075195312, 697.57275390625, 721.3703002929688, 745.1678466796875, 768.96533203125, 792.7628784179688, 816.5604248046875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 5.0, 15.0, 9.0, 17.0, 14.0, 16.0, 24.0, 25.0, 25.0, 32.0, 32.0, 28.0, 30.0, 36.0, 30.0, 39.0, 39.0, 57.0, 51.0, 35.0, 38.0, 39.0, 31.0, 42.0, 36.0, 37.0, 38.0, 23.0, 26.0, 16.0, 23.0, 20.0, 14.0, 11.0, 15.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-82.625, -80.39697265625, -78.1689453125, -75.94091796875, -73.712890625, -71.48486328125, -69.2568359375, -67.02880859375, -64.80078125, -62.57275390625, -60.3447265625, -58.11669921875, -55.888671875, -53.66064453125, -51.4326171875, -49.20458984375, -46.9765625, -44.74853515625, -42.5205078125, -40.29248046875, -38.064453125, -35.83642578125, -33.6083984375, -31.38037109375, -29.15234375, -26.92431640625, -24.6962890625, -22.46826171875, -20.240234375, -18.01220703125, -15.7841796875, -13.55615234375, -11.328125, -9.10009765625, -6.8720703125, -4.64404296875, -2.416015625, -0.18798828125, 2.0400390625, 4.26806640625, 6.49609375, 8.72412109375, 10.9521484375, 13.18017578125, 15.408203125, 17.63623046875, 19.8642578125, 22.09228515625, 24.3203125, 26.54833984375, 28.7763671875, 31.00439453125, 33.232421875, 35.46044921875, 37.6884765625, 39.91650390625, 42.14453125, 44.37255859375, 46.6005859375, 48.82861328125, 51.056640625, 53.28466796875, 55.5126953125, 57.74072265625, 59.96875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 9.0, 7.0, 11.0, 13.0, 26.0, 36.0, 63.0, 84.0, 152.0, 211.0, 338.0, 604.0, 1002.0, 1877.0, 3580.0, 7079.0, 14327.0, 31103.0, 70644.0, 171128.0, 402917.0, 197137.0, 79163.0, 34501.0, 15822.0, 7877.0, 3993.0, 2046.0, 1131.0, 653.0, 343.0, 243.0, 122.0, 105.0, 59.0, 45.0, 28.0, 25.0, 12.0, 13.0, 8.0, 4.0, 4.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.7784423828125, -10.447509765625, -10.1165771484375, -9.78564453125, -9.4547119140625, -9.123779296875, -8.7928466796875, -8.4619140625, -8.1309814453125, -7.800048828125, -7.4691162109375, -7.13818359375, -6.8072509765625, -6.476318359375, -6.1453857421875, -5.814453125, -5.4835205078125, -5.152587890625, -4.8216552734375, -4.49072265625, -4.1597900390625, -3.828857421875, -3.4979248046875, -3.1669921875, -2.8360595703125, -2.505126953125, -2.1741943359375, -1.84326171875, -1.5123291015625, -1.181396484375, -0.8504638671875, -0.51953125, -0.1885986328125, 0.142333984375, 0.4732666015625, 0.80419921875, 1.1351318359375, 1.466064453125, 1.7969970703125, 2.1279296875, 2.4588623046875, 2.789794921875, 3.1207275390625, 3.45166015625, 3.7825927734375, 4.113525390625, 4.4444580078125, 4.775390625, 5.1063232421875, 5.437255859375, 5.7681884765625, 6.09912109375, 6.4300537109375, 6.760986328125, 7.0919189453125, 7.4228515625, 7.7537841796875, 8.084716796875, 8.4156494140625, 8.74658203125, 9.0775146484375, 9.408447265625, 9.7393798828125, 10.0703125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 3.0, 7.0, 3.0, 6.0, 11.0, 17.0, 11.0, 9.0, 21.0, 23.0, 28.0, 33.0, 33.0, 36.0, 28.0, 42.0, 35.0, 49.0, 45.0, 1075.0, 44.0, 39.0, 40.0, 37.0, 37.0, 42.0, 37.0, 41.0, 33.0, 26.0, 21.0, 24.0, 14.0, 26.0, 14.0, 12.0, 10.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-56.4375, -54.90234375, -53.3671875, -51.83203125, -50.296875, -48.76171875, -47.2265625, -45.69140625, -44.15625, -42.62109375, -41.0859375, -39.55078125, -38.015625, -36.48046875, -34.9453125, -33.41015625, -31.875, -30.33984375, -28.8046875, -27.26953125, -25.734375, -24.19921875, -22.6640625, -21.12890625, -19.59375, -18.05859375, -16.5234375, -14.98828125, -13.453125, -11.91796875, -10.3828125, -8.84765625, -7.3125, -5.77734375, -4.2421875, -2.70703125, -1.171875, 0.36328125, 1.8984375, 3.43359375, 4.96875, 6.50390625, 8.0390625, 9.57421875, 11.109375, 12.64453125, 14.1796875, 15.71484375, 17.25, 18.78515625, 20.3203125, 21.85546875, 23.390625, 24.92578125, 26.4609375, 27.99609375, 29.53125, 31.06640625, 32.6015625, 34.13671875, 35.671875, 37.20703125, 38.7421875, 40.27734375, 41.8125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 4.0, 24.0, 24.0, 31.0, 46.0, 83.0, 122.0, 191.0, 266.0, 444.0, 710.0, 1137.0, 1928.0, 3276.0, 5739.0, 9898.0, 17266.0, 30489.0, 56623.0, 109590.0, 264809.0, 1299797.0, 138404.0, 70135.0, 37591.0, 20596.0, 11440.0, 6646.0, 3804.0, 2267.0, 1362.0, 900.0, 556.0, 317.0, 196.0, 141.0, 95.0, 54.0, 44.0, 24.0, 13.0, 15.0, 10.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.087158203125, -3.95166015625, -3.816162109375, -3.6806640625, -3.545166015625, -3.40966796875, -3.274169921875, -3.138671875, -3.003173828125, -2.86767578125, -2.732177734375, -2.5966796875, -2.461181640625, -2.32568359375, -2.190185546875, -2.0546875, -1.919189453125, -1.78369140625, -1.648193359375, -1.5126953125, -1.377197265625, -1.24169921875, -1.106201171875, -0.970703125, -0.835205078125, -0.69970703125, -0.564208984375, -0.4287109375, -0.293212890625, -0.15771484375, -0.022216796875, 0.11328125, 0.248779296875, 0.38427734375, 0.519775390625, 0.6552734375, 0.790771484375, 0.92626953125, 1.061767578125, 1.197265625, 1.332763671875, 1.46826171875, 1.603759765625, 1.7392578125, 1.874755859375, 2.01025390625, 2.145751953125, 2.28125, 2.416748046875, 2.55224609375, 2.687744140625, 2.8232421875, 2.958740234375, 3.09423828125, 3.229736328125, 3.365234375, 3.500732421875, 3.63623046875, 3.771728515625, 3.9072265625, 4.042724609375, 4.17822265625, 4.313720703125, 4.44921875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 17.0, 17.0, 14.0, 23.0, 27.0, 39.0, 64.0, 89.0, 115.0, 187.0, 100.0, 75.0, 49.0, 31.0, 35.0, 19.0, 11.0, 20.0, 7.0, 16.0, 8.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3916015625, -0.37979888916015625, -0.3679962158203125, -0.35619354248046875, -0.344390869140625, -0.33258819580078125, -0.3207855224609375, -0.30898284912109375, -0.29718017578125, -0.28537750244140625, -0.2735748291015625, -0.26177215576171875, -0.249969482421875, -0.23816680908203125, -0.2263641357421875, -0.21456146240234375, -0.2027587890625, -0.19095611572265625, -0.1791534423828125, -0.16735076904296875, -0.155548095703125, -0.14374542236328125, -0.1319427490234375, -0.12014007568359375, -0.10833740234375, -0.09653472900390625, -0.0847320556640625, -0.07292938232421875, -0.061126708984375, -0.04932403564453125, -0.0375213623046875, -0.02571868896484375, -0.013916015625, -0.00211334228515625, 0.0096893310546875, 0.02149200439453125, 0.033294677734375, 0.04509735107421875, 0.0569000244140625, 0.06870269775390625, 0.08050537109375, 0.09230804443359375, 0.1041107177734375, 0.11591339111328125, 0.127716064453125, 0.13951873779296875, 0.1513214111328125, 0.16312408447265625, 0.1749267578125, 0.18672943115234375, 0.1985321044921875, 0.21033477783203125, 0.222137451171875, 0.23394012451171875, 0.2457427978515625, 0.25754547119140625, 0.26934814453125, 0.28115081787109375, 0.2929534912109375, 0.30475616455078125, 0.316558837890625, 0.32836151123046875, 0.3401641845703125, 0.35196685791015625, 0.36376953125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 7.0, 1.0, 10.0, 8.0, 11.0, 13.0, 18.0, 17.0, 39.0, 41.0, 47.0, 83.0, 128.0, 242.0, 691.0, 1043321.0, 2965.0, 392.0, 183.0, 100.0, 52.0, 46.0, 32.0, 29.0, 18.0, 17.0, 11.0, 8.0, 9.0, 5.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.95703125, -7.69854736328125, -7.4400634765625, -7.18157958984375, -6.923095703125, -6.66461181640625, -6.4061279296875, -6.14764404296875, -5.88916015625, -5.63067626953125, -5.3721923828125, -5.11370849609375, -4.855224609375, -4.59674072265625, -4.3382568359375, -4.07977294921875, -3.8212890625, -3.56280517578125, -3.3043212890625, -3.04583740234375, -2.787353515625, -2.52886962890625, -2.2703857421875, -2.01190185546875, -1.75341796875, -1.49493408203125, -1.2364501953125, -0.97796630859375, -0.719482421875, -0.46099853515625, -0.2025146484375, 0.05596923828125, 0.314453125, 0.57293701171875, 0.8314208984375, 1.08990478515625, 1.348388671875, 1.60687255859375, 1.8653564453125, 2.12384033203125, 2.38232421875, 2.64080810546875, 2.8992919921875, 3.15777587890625, 3.416259765625, 3.67474365234375, 3.9332275390625, 4.19171142578125, 4.4501953125, 4.70867919921875, 4.9671630859375, 5.22564697265625, 5.484130859375, 5.74261474609375, 6.0010986328125, 6.25958251953125, 6.51806640625, 6.77655029296875, 7.0350341796875, 7.29351806640625, 7.552001953125, 7.81048583984375, 8.0689697265625, 8.32745361328125, 8.5859375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 918.0, 96.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7686578035354614, -0.6809415817260742, -0.5932254195213318, -0.5055092573165894, -0.41779303550720215, -0.33007684350013733, -0.2423606514930725, -0.15464448928833008, -0.06692826747894287, 0.020787924528121948, 0.10850411653518677, 0.1962203085422516, 0.2839365005493164, 0.3716526925563812, 0.45936888456344604, 0.5470850467681885, 0.6348012685775757, 0.7225174903869629, 0.8102336525917053, 0.8979498147964478, 0.985666036605835, 1.0733822584152222, 1.1610984802246094, 1.248814582824707, 1.3365308046340942, 1.4242470264434814, 1.511963129043579, 1.5996793508529663, 1.6873955726623535, 1.7751117944717407, 1.862828016281128, 1.9505441188812256, 2.0382604598999023, 2.1259765625, 2.2136929035186768, 2.3014090061187744, 2.389125347137451, 2.476841449737549, 2.5645575523376465, 2.652273654937744, 2.739989995956421, 2.8277060985565186, 2.9154224395751953, 3.003138542175293, 3.0908546447753906, 3.1785709857940674, 3.266287088394165, 3.354003429412842, 3.4417195320129395, 3.529435634613037, 3.617151975631714, 3.7048680782318115, 3.7925844192504883, 3.880300521850586, 3.9680166244506836, 4.055732727050781, 4.143448829650879, 4.231164932250977, 4.318881034851074, 4.40659761428833, 4.494313716888428, 4.582029819488525, 4.669745922088623, 4.757462024688721, 4.845178604125977]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 4.0, 5.0, 5.0, 9.0, 8.0, 14.0, 13.0, 13.0, 9.0, 17.0, 19.0, 17.0, 24.0, 23.0, 29.0, 38.0, 33.0, 34.0, 38.0, 23.0, 39.0, 32.0, 47.0, 33.0, 40.0, 41.0, 39.0, 32.0, 30.0, 34.0, 37.0, 36.0, 17.0, 24.0, 23.0, 23.0, 22.0, 14.0, 16.0, 8.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2980431914329529, -0.2886809706687927, -0.2793187201023102, -0.26995649933815, -0.2605942487716675, -0.2512320280075073, -0.24186980724334717, -0.23250757157802582, -0.22314533591270447, -0.21378310024738312, -0.20442086458206177, -0.1950586438179016, -0.18569640815258026, -0.1763341724872589, -0.16697195172309875, -0.1576097160577774, -0.14824748039245605, -0.1388852447271347, -0.12952300906181335, -0.1201607882976532, -0.11079855263233185, -0.1014363169670105, -0.09207408875226974, -0.08271186053752899, -0.07334962487220764, -0.06398738920688629, -0.05462516099214554, -0.04526292905211449, -0.035900697112083435, -0.026538465172052383, -0.017176233232021332, -0.007814005017280579, 0.0015482306480407715, 0.010910462588071823, 0.020272694528102875, 0.029634926468133926, 0.03899715840816498, 0.04835939034819603, 0.05772162228822708, 0.06708385050296783, 0.07644608616828918, 0.08580832183361053, 0.09517055004835129, 0.10453277826309204, 0.11389501392841339, 0.12325724959373474, 0.1326194703578949, 0.14198170602321625, 0.1513439416885376, 0.16070617735385895, 0.1700684130191803, 0.17943063378334045, 0.1887928694486618, 0.19815510511398315, 0.2075173258781433, 0.21687956154346466, 0.226241797208786, 0.23560403287410736, 0.2449662685394287, 0.25432848930358887, 0.263690710067749, 0.27305296063423157, 0.2824151813983917, 0.29177743196487427, 0.3011396527290344]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 5.0, 14.0, 10.0, 17.0, 13.0, 17.0, 23.0, 25.0, 26.0, 32.0, 31.0, 28.0, 30.0, 37.0, 30.0, 38.0, 40.0, 56.0, 51.0, 36.0, 37.0, 39.0, 32.0, 41.0, 36.0, 38.0, 37.0, 24.0, 26.0, 16.0, 22.0, 21.0, 14.0, 11.0, 15.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-82.6875, -80.45849609375, -78.2294921875, -76.00048828125, -73.771484375, -71.54248046875, -69.3134765625, -67.08447265625, -64.85546875, -62.62646484375, -60.3974609375, -58.16845703125, -55.939453125, -53.71044921875, -51.4814453125, -49.25244140625, -47.0234375, -44.79443359375, -42.5654296875, -40.33642578125, -38.107421875, -35.87841796875, -33.6494140625, -31.42041015625, -29.19140625, -26.96240234375, -24.7333984375, -22.50439453125, -20.275390625, -18.04638671875, -15.8173828125, -13.58837890625, -11.359375, -9.13037109375, -6.9013671875, -4.67236328125, -2.443359375, -0.21435546875, 2.0146484375, 4.24365234375, 6.47265625, 8.70166015625, 10.9306640625, 13.15966796875, 15.388671875, 17.61767578125, 19.8466796875, 22.07568359375, 24.3046875, 26.53369140625, 28.7626953125, 30.99169921875, 33.220703125, 35.44970703125, 37.6787109375, 39.90771484375, 42.13671875, 44.36572265625, 46.5947265625, 48.82373046875, 51.052734375, 53.28173828125, 55.5107421875, 57.73974609375, 59.96875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 8.0, 5.0, 8.0, 14.0, 14.0, 26.0, 40.0, 65.0, 73.0, 116.0, 181.0, 282.0, 443.0, 678.0, 1058.0, 1631.0, 2831.0, 5212.0, 10155.0, 25920.0, 103156.0, 636477.0, 193538.0, 38183.0, 13455.0, 6196.0, 3331.0, 2046.0, 1233.0, 743.0, 496.0, 320.0, 205.0, 145.0, 75.0, 72.0, 39.0, 26.0, 22.0, 13.0, 7.0, 7.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.625, -145.546875, -140.46875, -135.390625, -130.3125, -125.234375, -120.15625, -115.078125, -110.0, -104.921875, -99.84375, -94.765625, -89.6875, -84.609375, -79.53125, -74.453125, -69.375, -64.296875, -59.21875, -54.140625, -49.0625, -43.984375, -38.90625, -33.828125, -28.75, -23.671875, -18.59375, -13.515625, -8.4375, -3.359375, 1.71875, 6.796875, 11.875, 16.953125, 22.03125, 27.109375, 32.1875, 37.265625, 42.34375, 47.421875, 52.5, 57.578125, 62.65625, 67.734375, 72.8125, 77.890625, 82.96875, 88.046875, 93.125, 98.203125, 103.28125, 108.359375, 113.4375, 118.515625, 123.59375, 128.671875, 133.75, 138.828125, 143.90625, 148.984375, 154.0625, 159.140625, 164.21875, 169.296875, 174.375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 4.0, 8.0, 5.0, 6.0, 15.0, 10.0, 16.0, 22.0, 26.0, 28.0, 37.0, 32.0, 36.0, 59.0, 55.0, 84.0, 126.0, 231.0, 1493.0, 230.0, 99.0, 64.0, 64.0, 43.0, 25.0, 32.0, 32.0, 35.0, 26.0, 17.0, 16.0, 9.0, 10.0, 11.0, 8.0, 6.0, 8.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-151.875, -147.041015625, -142.20703125, -137.373046875, -132.5390625, -127.705078125, -122.87109375, -118.037109375, -113.203125, -108.369140625, -103.53515625, -98.701171875, -93.8671875, -89.033203125, -84.19921875, -79.365234375, -74.53125, -69.697265625, -64.86328125, -60.029296875, -55.1953125, -50.361328125, -45.52734375, -40.693359375, -35.859375, -31.025390625, -26.19140625, -21.357421875, -16.5234375, -11.689453125, -6.85546875, -2.021484375, 2.8125, 7.646484375, 12.48046875, 17.314453125, 22.1484375, 26.982421875, 31.81640625, 36.650390625, 41.484375, 46.318359375, 51.15234375, 55.986328125, 60.8203125, 65.654296875, 70.48828125, 75.322265625, 80.15625, 84.990234375, 89.82421875, 94.658203125, 99.4921875, 104.326171875, 109.16015625, 113.994140625, 118.828125, 123.662109375, 128.49609375, 133.330078125, 138.1640625, 142.998046875, 147.83203125, 152.666015625, 157.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 10.0, 6.0, 13.0, 12.0, 17.0, 12.0, 26.0, 27.0, 47.0, 89.0, 132.0, 207.0, 381.0, 819.0, 3999.0, 2874594.0, 261210.0, 2529.0, 662.0, 328.0, 193.0, 122.0, 80.0, 50.0, 31.0, 24.0, 23.0, 13.0, 13.0, 12.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-688.5, -669.3203125, -650.140625, -630.9609375, -611.78125, -592.6015625, -573.421875, -554.2421875, -535.0625, -515.8828125, -496.703125, -477.5234375, -458.34375, -439.1640625, -419.984375, -400.8046875, -381.625, -362.4453125, -343.265625, -324.0859375, -304.90625, -285.7265625, -266.546875, -247.3671875, -228.1875, -209.0078125, -189.828125, -170.6484375, -151.46875, -132.2890625, -113.109375, -93.9296875, -74.75, -55.5703125, -36.390625, -17.2109375, 1.96875, 21.1484375, 40.328125, 59.5078125, 78.6875, 97.8671875, 117.046875, 136.2265625, 155.40625, 174.5859375, 193.765625, 212.9453125, 232.125, 251.3046875, 270.484375, 289.6640625, 308.84375, 328.0234375, 347.203125, 366.3828125, 385.5625, 404.7421875, 423.921875, 443.1015625, 462.28125, 481.4609375, 500.640625, 519.8203125, 539.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 13.0, 37.0, 64.0, 123.0, 189.0, 198.0, 163.0, 113.0, 55.0, 24.0, 13.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-305.8585510253906, -281.7736511230469, -257.6887512207031, -233.60385131835938, -209.51895141601562, -185.43405151367188, -161.34913635253906, -137.2642364501953, -113.17933654785156, -89.09443664550781, -65.00953674316406, -40.92462921142578, -16.83972930908203, 7.245170593261719, 31.330078125, 55.41497802734375, 79.4998779296875, 103.58477783203125, 127.669677734375, 151.75457763671875, 175.8394775390625, 199.92437744140625, 224.00929260253906, 248.0941925048828, 272.1790771484375, 296.26397705078125, 320.348876953125, 344.43377685546875, 368.5186767578125, 392.60357666015625, 416.6884765625, 440.77337646484375, 464.85833740234375, 488.9432373046875, 513.0281372070312, 537.113037109375, 561.1979370117188, 585.2828369140625, 609.3677368164062, 633.45263671875, 657.5375366210938, 681.6224365234375, 705.7073364257812, 729.792236328125, 753.8771362304688, 777.9620361328125, 802.0469360351562, 826.1318359375, 850.216796875, 874.3016967773438, 898.3865966796875, 922.4714965820312, 946.556396484375, 970.6412963867188, 994.7261962890625, 1018.8110961914062, 1042.89599609375, 1066.98095703125, 1091.0657958984375, 1115.1507568359375, 1139.235595703125, 1163.320556640625, 1187.4053955078125, 1211.4903564453125, 1235.5751953125]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 8.0, 5.0, 8.0, 6.0, 11.0, 8.0, 14.0, 13.0, 12.0, 18.0, 24.0, 24.0, 25.0, 21.0, 29.0, 31.0, 27.0, 29.0, 26.0, 35.0, 35.0, 28.0, 33.0, 37.0, 37.0, 31.0, 40.0, 41.0, 33.0, 22.0, 30.0, 30.0, 33.0, 29.0, 24.0, 20.0, 15.0, 14.0, 10.0, 18.0, 5.0, 12.0, 11.0, 11.0, 4.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-398.1130065917969, -385.73126220703125, -373.3495178222656, -360.9677734375, -348.5860290527344, -336.20428466796875, -323.82257080078125, -311.4407958984375, -299.05908203125, -286.6773376464844, -274.29559326171875, -261.9138488769531, -249.5321044921875, -237.15036010742188, -224.7686309814453, -212.3868865966797, -200.005126953125, -187.62338256835938, -175.24163818359375, -162.85989379882812, -150.4781494140625, -138.09640502929688, -125.71467590332031, -113.33293151855469, -100.95118713378906, -88.56944274902344, -76.18769836425781, -63.80596160888672, -51.424217224121094, -39.04247283935547, -26.660736083984375, -14.27899169921875, -1.897216796875, 10.484525680541992, 22.866268157958984, 35.248008728027344, 47.62975311279297, 60.011497497558594, 72.39323425292969, 84.77497863769531, 97.15672302246094, 109.53846740722656, 121.92021179199219, 134.30194091796875, 146.68368530273438, 159.0654296875, 171.44717407226562, 183.82891845703125, 196.21066284179688, 208.5924072265625, 220.97415161132812, 233.35589599609375, 245.73764038085938, 258.119384765625, 270.5010986328125, 282.88287353515625, 295.26458740234375, 307.6463317871094, 320.028076171875, 332.4098205566406, 344.79156494140625, 357.1733093261719, 369.5550537109375, 381.936767578125, 394.31854248046875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 5.0, 11.0, 7.0, 10.0, 13.0, 13.0, 25.0, 17.0, 26.0, 28.0, 31.0, 30.0, 28.0, 32.0, 37.0, 36.0, 35.0, 36.0, 38.0, 48.0, 43.0, 50.0, 36.0, 48.0, 48.0, 40.0, 30.0, 24.0, 29.0, 20.0, 26.0, 11.0, 16.0, 11.0, 15.0, 15.0, 8.0, 4.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-82.25, -79.916015625, -77.58203125, -75.248046875, -72.9140625, -70.580078125, -68.24609375, -65.912109375, -63.578125, -61.244140625, -58.91015625, -56.576171875, -54.2421875, -51.908203125, -49.57421875, -47.240234375, -44.90625, -42.572265625, -40.23828125, -37.904296875, -35.5703125, -33.236328125, -30.90234375, -28.568359375, -26.234375, -23.900390625, -21.56640625, -19.232421875, -16.8984375, -14.564453125, -12.23046875, -9.896484375, -7.5625, -5.228515625, -2.89453125, -0.560546875, 1.7734375, 4.107421875, 6.44140625, 8.775390625, 11.109375, 13.443359375, 15.77734375, 18.111328125, 20.4453125, 22.779296875, 25.11328125, 27.447265625, 29.78125, 32.115234375, 34.44921875, 36.783203125, 39.1171875, 41.451171875, 43.78515625, 46.119140625, 48.453125, 50.787109375, 53.12109375, 55.455078125, 57.7890625, 60.123046875, 62.45703125, 64.791015625, 67.125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 6.0, 10.0, 14.0, 19.0, 29.0, 37.0, 44.0, 69.0, 95.0, 125.0, 156.0, 250.0, 328.0, 451.0, 601.0, 909.0, 1376.0, 2177.0, 4059.0, 9696.0, 42482.0, 1251510.0, 2754236.0, 99393.0, 13505.0, 5112.0, 2593.0, 1586.0, 1025.0, 675.0, 458.0, 319.0, 241.0, 180.0, 127.0, 108.0, 65.0, 52.0, 44.0, 26.0, 26.0, 17.0, 12.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-220.25, -212.9453125, -205.640625, -198.3359375, -191.03125, -183.7265625, -176.421875, -169.1171875, -161.8125, -154.5078125, -147.203125, -139.8984375, -132.59375, -125.2890625, -117.984375, -110.6796875, -103.375, -96.0703125, -88.765625, -81.4609375, -74.15625, -66.8515625, -59.546875, -52.2421875, -44.9375, -37.6328125, -30.328125, -23.0234375, -15.71875, -8.4140625, -1.109375, 6.1953125, 13.5, 20.8046875, 28.109375, 35.4140625, 42.71875, 50.0234375, 57.328125, 64.6328125, 71.9375, 79.2421875, 86.546875, 93.8515625, 101.15625, 108.4609375, 115.765625, 123.0703125, 130.375, 137.6796875, 144.984375, 152.2890625, 159.59375, 166.8984375, 174.203125, 181.5078125, 188.8125, 196.1171875, 203.421875, 210.7265625, 218.03125, 225.3359375, 232.640625, 239.9453125, 247.25]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 9.0, 24.0, 25.0, 27.0, 53.0, 80.0, 111.0, 202.0, 339.0, 561.0, 798.0, 687.0, 429.0, 245.0, 159.0, 98.0, 52.0, 41.0, 30.0, 28.0, 19.0, 14.0, 5.0, 11.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-186.625, -181.267578125, -175.91015625, -170.552734375, -165.1953125, -159.837890625, -154.48046875, -149.123046875, -143.765625, -138.408203125, -133.05078125, -127.693359375, -122.3359375, -116.978515625, -111.62109375, -106.263671875, -100.90625, -95.548828125, -90.19140625, -84.833984375, -79.4765625, -74.119140625, -68.76171875, -63.404296875, -58.046875, -52.689453125, -47.33203125, -41.974609375, -36.6171875, -31.259765625, -25.90234375, -20.544921875, -15.1875, -9.830078125, -4.47265625, 0.884765625, 6.2421875, 11.599609375, 16.95703125, 22.314453125, 27.671875, 33.029296875, 38.38671875, 43.744140625, 49.1015625, 54.458984375, 59.81640625, 65.173828125, 70.53125, 75.888671875, 81.24609375, 86.603515625, 91.9609375, 97.318359375, 102.67578125, 108.033203125, 113.390625, 118.748046875, 124.10546875, 129.462890625, 134.8203125, 140.177734375, 145.53515625, 150.892578125, 156.25]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 7.0, 7.0, 2.0, 21.0, 24.0, 29.0, 37.0, 58.0, 96.0, 206.0, 435.0, 1120.0, 4830.0, 55006.0, 3883271.0, 235823.0, 10322.0, 1863.0, 585.0, 259.0, 116.0, 54.0, 46.0, 24.0, 16.0, 9.0, 6.0, 4.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-416.25, -402.68359375, -389.1171875, -375.55078125, -361.984375, -348.41796875, -334.8515625, -321.28515625, -307.71875, -294.15234375, -280.5859375, -267.01953125, -253.453125, -239.88671875, -226.3203125, -212.75390625, -199.1875, -185.62109375, -172.0546875, -158.48828125, -144.921875, -131.35546875, -117.7890625, -104.22265625, -90.65625, -77.08984375, -63.5234375, -49.95703125, -36.390625, -22.82421875, -9.2578125, 4.30859375, 17.875, 31.44140625, 45.0078125, 58.57421875, 72.140625, 85.70703125, 99.2734375, 112.83984375, 126.40625, 139.97265625, 153.5390625, 167.10546875, 180.671875, 194.23828125, 207.8046875, 221.37109375, 234.9375, 248.50390625, 262.0703125, 275.63671875, 289.203125, 302.76953125, 316.3359375, 329.90234375, 343.46875, 357.03515625, 370.6015625, 384.16796875, 397.734375, 411.30078125, 424.8671875, 438.43359375, 452.0]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 89.0, 807.0, 112.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7563.4990234375, -7419.3623046875, -7275.2255859375, -7131.0888671875, -6986.9521484375, -6842.8154296875, -6698.6787109375, -6554.54150390625, -6410.40478515625, -6266.26806640625, -6122.13134765625, -5977.99462890625, -5833.85791015625, -5689.720703125, -5545.583984375, -5401.447265625, -5257.310546875, -5113.173828125, -4969.037109375, -4824.900390625, -4680.763671875, -4536.626953125, -4392.490234375, -4248.35302734375, -4104.216796875, -3960.080078125, -3815.943359375, -3671.806640625, -3527.669677734375, -3383.532958984375, -3239.396240234375, -3095.259521484375, -2951.123046875, -2806.986328125, -2662.849609375, -2518.712890625, -2374.575927734375, -2230.439208984375, -2086.302490234375, -1942.165771484375, -1798.02880859375, -1653.89208984375, -1509.7552490234375, -1365.6185302734375, -1221.481689453125, -1077.344970703125, -933.208251953125, -789.0714721679688, -644.9346923828125, -500.79791259765625, -356.6611633300781, -212.5244140625, -68.38763427734375, 75.7491455078125, 219.8858642578125, 364.02264404296875, 508.159423828125, 652.2962036132812, 796.4329833984375, 940.5697021484375, 1084.70654296875, 1228.84326171875, 1372.97998046875, 1517.11669921875, 1661.2535400390625]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 9.0, 11.0, 12.0, 9.0, 11.0, 13.0, 21.0, 26.0, 22.0, 19.0, 38.0, 38.0, 34.0, 37.0, 35.0, 39.0, 31.0, 39.0, 52.0, 45.0, 42.0, 30.0, 41.0, 50.0, 41.0, 30.0, 34.0, 32.0, 27.0, 24.0, 21.0, 11.0, 16.0, 12.0, 11.0, 12.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-407.47088623046875, -393.225341796875, -378.97979736328125, -364.7342529296875, -350.48870849609375, -336.2431640625, -321.99761962890625, -307.7520751953125, -293.50653076171875, -279.260986328125, -265.01544189453125, -250.7698974609375, -236.52435302734375, -222.27880859375, -208.03326416015625, -193.7877197265625, -179.54217529296875, -165.296630859375, -151.05108642578125, -136.8055419921875, -122.55999755859375, -108.314453125, -94.06890869140625, -79.8233642578125, -65.57781982421875, -51.332275390625, -37.08673095703125, -22.8411865234375, -8.59564208984375, 5.64990234375, 19.89544677734375, 34.1409912109375, 48.38653564453125, 62.632080078125, 76.87762451171875, 91.1231689453125, 105.36871337890625, 119.6142578125, 133.85980224609375, 148.1053466796875, 162.35089111328125, 176.596435546875, 190.84197998046875, 205.0875244140625, 219.33306884765625, 233.57861328125, 247.82415771484375, 262.0697021484375, 276.31524658203125, 290.560791015625, 304.80633544921875, 319.0518798828125, 333.29742431640625, 347.54296875, 361.78851318359375, 376.0340576171875, 390.27960205078125, 404.525146484375, 418.77069091796875, 433.0162353515625, 447.26177978515625, 461.50732421875, 475.75286865234375, 489.9984130859375, 504.24395751953125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 7.0, 3.0, 11.0, 4.0, 8.0, 13.0, 20.0, 23.0, 17.0, 20.0, 32.0, 29.0, 30.0, 44.0, 35.0, 36.0, 38.0, 39.0, 45.0, 44.0, 51.0, 44.0, 43.0, 31.0, 35.0, 54.0, 32.0, 30.0, 23.0, 31.0, 20.0, 24.0, 17.0, 14.0, 9.0, 15.0, 10.0, 11.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-78.1875, -76.1728515625, -74.158203125, -72.1435546875, -70.12890625, -68.1142578125, -66.099609375, -64.0849609375, -62.0703125, -60.0556640625, -58.041015625, -56.0263671875, -54.01171875, -51.9970703125, -49.982421875, -47.9677734375, -45.953125, -43.9384765625, -41.923828125, -39.9091796875, -37.89453125, -35.8798828125, -33.865234375, -31.8505859375, -29.8359375, -27.8212890625, -25.806640625, -23.7919921875, -21.77734375, -19.7626953125, -17.748046875, -15.7333984375, -13.71875, -11.7041015625, -9.689453125, -7.6748046875, -5.66015625, -3.6455078125, -1.630859375, 0.3837890625, 2.3984375, 4.4130859375, 6.427734375, 8.4423828125, 10.45703125, 12.4716796875, 14.486328125, 16.5009765625, 18.515625, 20.5302734375, 22.544921875, 24.5595703125, 26.57421875, 28.5888671875, 30.603515625, 32.6181640625, 34.6328125, 36.6474609375, 38.662109375, 40.6767578125, 42.69140625, 44.7060546875, 46.720703125, 48.7353515625, 50.75]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 7.0, 9.0, 7.0, 10.0, 28.0, 34.0, 45.0, 42.0, 77.0, 79.0, 90.0, 121.0, 116.0, 167.0, 238.0, 335.0, 540.0, 727.0, 1030.0, 1510.0, 2204.0, 3388.0, 5485.0, 8962.0, 15228.0, 28408.0, 55066.0, 115054.0, 246496.0, 284436.0, 135364.0, 64928.0, 32773.0, 17624.0, 10060.0, 6096.0, 3816.0, 2466.0, 1664.0, 1106.0, 776.0, 485.0, 359.0, 261.0, 177.0, 134.0, 121.0, 75.0, 72.0, 69.0, 46.0, 50.0, 40.0, 26.0, 15.0, 11.0, 8.0, 2.0, 3.0, 2.0, 3.0], "bins": [-9.0859375, -8.802978515625, -8.52001953125, -8.237060546875, -7.9541015625, -7.671142578125, -7.38818359375, -7.105224609375, -6.822265625, -6.539306640625, -6.25634765625, -5.973388671875, -5.6904296875, -5.407470703125, -5.12451171875, -4.841552734375, -4.55859375, -4.275634765625, -3.99267578125, -3.709716796875, -3.4267578125, -3.143798828125, -2.86083984375, -2.577880859375, -2.294921875, -2.011962890625, -1.72900390625, -1.446044921875, -1.1630859375, -0.880126953125, -0.59716796875, -0.314208984375, -0.03125, 0.251708984375, 0.53466796875, 0.817626953125, 1.1005859375, 1.383544921875, 1.66650390625, 1.949462890625, 2.232421875, 2.515380859375, 2.79833984375, 3.081298828125, 3.3642578125, 3.647216796875, 3.93017578125, 4.213134765625, 4.49609375, 4.779052734375, 5.06201171875, 5.344970703125, 5.6279296875, 5.910888671875, 6.19384765625, 6.476806640625, 6.759765625, 7.042724609375, 7.32568359375, 7.608642578125, 7.8916015625, 8.174560546875, 8.45751953125, 8.740478515625, 9.0234375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 15.0, 11.0, 21.0, 18.0, 15.0, 14.0, 31.0, 31.0, 38.0, 34.0, 37.0, 41.0, 42.0, 56.0, 52.0, 1055.0, 28.0, 44.0, 56.0, 36.0, 50.0, 32.0, 31.0, 37.0, 36.0, 28.0, 29.0, 16.0, 8.0, 16.0, 11.0, 5.0, 9.0, 10.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.875, -45.51708984375, -44.1591796875, -42.80126953125, -41.443359375, -40.08544921875, -38.7275390625, -37.36962890625, -36.01171875, -34.65380859375, -33.2958984375, -31.93798828125, -30.580078125, -29.22216796875, -27.8642578125, -26.50634765625, -25.1484375, -23.79052734375, -22.4326171875, -21.07470703125, -19.716796875, -18.35888671875, -17.0009765625, -15.64306640625, -14.28515625, -12.92724609375, -11.5693359375, -10.21142578125, -8.853515625, -7.49560546875, -6.1376953125, -4.77978515625, -3.421875, -2.06396484375, -0.7060546875, 0.65185546875, 2.009765625, 3.36767578125, 4.7255859375, 6.08349609375, 7.44140625, 8.79931640625, 10.1572265625, 11.51513671875, 12.873046875, 14.23095703125, 15.5888671875, 16.94677734375, 18.3046875, 19.66259765625, 21.0205078125, 22.37841796875, 23.736328125, 25.09423828125, 26.4521484375, 27.81005859375, 29.16796875, 30.52587890625, 31.8837890625, 33.24169921875, 34.599609375, 35.95751953125, 37.3154296875, 38.67333984375, 40.03125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 12.0, 9.0, 8.0, 25.0, 31.0, 36.0, 61.0, 61.0, 110.0, 135.0, 244.0, 306.0, 454.0, 667.0, 1022.0, 1488.0, 2271.0, 3574.0, 5533.0, 8908.0, 14313.0, 23785.0, 40462.0, 70034.0, 128069.0, 1243730.0, 279828.0, 114518.0, 63064.0, 36465.0, 21717.0, 13101.0, 8179.0, 5048.0, 3310.0, 2151.0, 1344.0, 953.0, 637.0, 431.0, 311.0, 226.0, 161.0, 91.0, 72.0, 61.0, 36.0, 23.0, 15.0, 10.0, 9.0, 8.0, 7.0, 3.0, 0.0, 2.0, 3.0], "bins": [-4.44140625, -4.30645751953125, -4.1715087890625, -4.03656005859375, -3.901611328125, -3.76666259765625, -3.6317138671875, -3.49676513671875, -3.36181640625, -3.22686767578125, -3.0919189453125, -2.95697021484375, -2.822021484375, -2.68707275390625, -2.5521240234375, -2.41717529296875, -2.2822265625, -2.14727783203125, -2.0123291015625, -1.87738037109375, -1.742431640625, -1.60748291015625, -1.4725341796875, -1.33758544921875, -1.20263671875, -1.06768798828125, -0.9327392578125, -0.79779052734375, -0.662841796875, -0.52789306640625, -0.3929443359375, -0.25799560546875, -0.123046875, 0.01190185546875, 0.1468505859375, 0.28179931640625, 0.416748046875, 0.55169677734375, 0.6866455078125, 0.82159423828125, 0.95654296875, 1.09149169921875, 1.2264404296875, 1.36138916015625, 1.496337890625, 1.63128662109375, 1.7662353515625, 1.90118408203125, 2.0361328125, 2.17108154296875, 2.3060302734375, 2.44097900390625, 2.575927734375, 2.71087646484375, 2.8458251953125, 2.98077392578125, 3.11572265625, 3.25067138671875, 3.3856201171875, 3.52056884765625, 3.655517578125, 3.79046630859375, 3.9254150390625, 4.06036376953125, 4.1953125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 7.0, 5.0, 7.0, 8.0, 7.0, 11.0, 17.0, 30.0, 17.0, 24.0, 48.0, 89.0, 176.0, 203.0, 103.0, 59.0, 37.0, 24.0, 15.0, 22.0, 16.0, 10.0, 5.0, 11.0, 5.0, 9.0, 10.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2418212890625, -0.23378944396972656, -0.22575759887695312, -0.2177257537841797, -0.20969390869140625, -0.2016620635986328, -0.19363021850585938, -0.18559837341308594, -0.1775665283203125, -0.16953468322753906, -0.16150283813476562, -0.1534709930419922, -0.14543914794921875, -0.1374073028564453, -0.12937545776367188, -0.12134361267089844, -0.113311767578125, -0.10527992248535156, -0.09724807739257812, -0.08921623229980469, -0.08118438720703125, -0.07315254211425781, -0.06512069702148438, -0.05708885192871094, -0.0490570068359375, -0.04102516174316406, -0.032993316650390625, -0.024961471557617188, -0.01692962646484375, -0.008897781372070312, -0.000865936279296875, 0.0071659088134765625, 0.01519775390625, 0.023229598999023438, 0.031261444091796875, 0.03929328918457031, 0.04732513427734375, 0.05535697937011719, 0.06338882446289062, 0.07142066955566406, 0.0794525146484375, 0.08748435974121094, 0.09551620483398438, 0.10354804992675781, 0.11157989501953125, 0.11961174011230469, 0.12764358520507812, 0.13567543029785156, 0.143707275390625, 0.15173912048339844, 0.15977096557617188, 0.1678028106689453, 0.17583465576171875, 0.1838665008544922, 0.19189834594726562, 0.19993019104003906, 0.2079620361328125, 0.21599388122558594, 0.22402572631835938, 0.2320575714111328, 0.24008941650390625, 0.2481212615966797, 0.2561531066894531, 0.26418495178222656, 0.272216796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 15.0, 10.0, 14.0, 13.0, 29.0, 33.0, 41.0, 73.0, 101.0, 184.0, 440.0, 5432.0, 1040902.0, 601.0, 232.0, 125.0, 78.0, 56.0, 31.0, 30.0, 19.0, 14.0, 8.0, 13.0, 9.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.79296875, -6.59417724609375, -6.3953857421875, -6.19659423828125, -5.997802734375, -5.79901123046875, -5.6002197265625, -5.40142822265625, -5.20263671875, -5.00384521484375, -4.8050537109375, -4.60626220703125, -4.407470703125, -4.20867919921875, -4.0098876953125, -3.81109619140625, -3.6123046875, -3.41351318359375, -3.2147216796875, -3.01593017578125, -2.817138671875, -2.61834716796875, -2.4195556640625, -2.22076416015625, -2.02197265625, -1.82318115234375, -1.6243896484375, -1.42559814453125, -1.226806640625, -1.02801513671875, -0.8292236328125, -0.63043212890625, -0.431640625, -0.23284912109375, -0.0340576171875, 0.16473388671875, 0.363525390625, 0.56231689453125, 0.7611083984375, 0.95989990234375, 1.15869140625, 1.35748291015625, 1.5562744140625, 1.75506591796875, 1.953857421875, 2.15264892578125, 2.3514404296875, 2.55023193359375, 2.7490234375, 2.94781494140625, 3.1466064453125, 3.34539794921875, 3.544189453125, 3.74298095703125, 3.9417724609375, 4.14056396484375, 4.33935546875, 4.53814697265625, 4.7369384765625, 4.93572998046875, 5.134521484375, 5.33331298828125, 5.5321044921875, 5.73089599609375, 5.9296875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1010.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1715028285980225, -0.9954726696014404, -0.8194425106048584, -0.6434123516082764, -0.46738219261169434, -0.2913520336151123, -0.11532187461853027, 0.06070828437805176, 0.2367384433746338, 0.4127686023712158, 0.5887987613677979, 0.7648289203643799, 0.9408590793609619, 1.116889238357544, 1.292919397354126, 1.468949556350708, 1.64497971534729, 1.821009874343872, 1.997040033340454, 2.173070192337036, 2.349100351333618, 2.5251305103302, 2.7011606693267822, 2.8771908283233643, 3.0532209873199463, 3.2292511463165283, 3.4052813053131104, 3.5813114643096924, 3.7573416233062744, 3.9333717823028564, 4.109401702880859, 4.285431861877441, 4.461462020874023, 4.6374921798706055, 4.8135223388671875, 4.9895524978637695, 5.165582656860352, 5.341612815856934, 5.517642974853516, 5.693673133850098, 5.86970329284668, 6.045733451843262, 6.221763610839844, 6.397793769836426, 6.573823928833008, 6.74985408782959, 6.925884246826172, 7.101914405822754, 7.277944564819336, 7.453974723815918, 7.6300048828125, 7.806035041809082, 7.982065200805664, 8.158095359802246, 8.334125518798828, 8.51015567779541, 8.686185836791992, 8.862215995788574, 9.038246154785156, 9.214276313781738, 9.39030647277832, 9.566336631774902, 9.742366790771484, 9.918396949768066, 10.094427108764648]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 13.0, 11.0, 14.0, 11.0, 15.0, 25.0, 24.0, 32.0, 41.0, 35.0, 27.0, 51.0, 62.0, 52.0, 47.0, 71.0, 64.0, 55.0, 43.0, 45.0, 51.0, 39.0, 28.0, 20.0, 20.0, 22.0, 20.0, 9.0, 19.0, 13.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.6530327796936035, -0.6372945308685303, -0.6215563416481018, -0.6058180928230286, -0.5900799036026001, -0.5743416547775269, -0.5586034655570984, -0.5428652167320251, -0.5271270275115967, -0.5113887786865234, -0.49565058946609497, -0.4799123704433441, -0.46417415142059326, -0.44843590259552, -0.43269768357276917, -0.4169594645500183, -0.40122121572494507, -0.3854829967021942, -0.36974477767944336, -0.3540065586566925, -0.33826833963394165, -0.3225300908088684, -0.30679187178611755, -0.2910536527633667, -0.27531543374061584, -0.259577214717865, -0.24383899569511414, -0.2281007617712021, -0.21236254274845123, -0.19662432372570038, -0.18088608980178833, -0.16514787077903748, -0.14940959215164185, -0.133671373128891, -0.11793314665555954, -0.10219492018222809, -0.08645670115947723, -0.07071848213672638, -0.05498025566339493, -0.03924202919006348, -0.023503810167312622, -0.007765587419271469, 0.007972635328769684, 0.023710858076810837, 0.03944908082485199, 0.055187299847602844, 0.0709255263209343, 0.08666375279426575, 0.1024019718170166, 0.11814019083976746, 0.1338784098625183, 0.14961664378643036, 0.1653548628091812, 0.18109308183193207, 0.19683131575584412, 0.21256953477859497, 0.22830775380134583, 0.24404597282409668, 0.25978419184684753, 0.2755224108695984, 0.29126065969467163, 0.3069988489151001, 0.32273709774017334, 0.3384753167629242, 0.35421353578567505]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 7.0, 3.0, 11.0, 4.0, 8.0, 13.0, 21.0, 21.0, 18.0, 21.0, 30.0, 30.0, 31.0, 43.0, 34.0, 37.0, 39.0, 39.0, 45.0, 43.0, 51.0, 44.0, 43.0, 31.0, 36.0, 53.0, 32.0, 30.0, 23.0, 31.0, 18.0, 26.0, 17.0, 14.0, 9.0, 15.0, 10.0, 11.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-78.1875, -76.1728515625, -74.158203125, -72.1435546875, -70.12890625, -68.1142578125, -66.099609375, -64.0849609375, -62.0703125, -60.0556640625, -58.041015625, -56.0263671875, -54.01171875, -51.9970703125, -49.982421875, -47.9677734375, -45.953125, -43.9384765625, -41.923828125, -39.9091796875, -37.89453125, -35.8798828125, -33.865234375, -31.8505859375, -29.8359375, -27.8212890625, -25.806640625, -23.7919921875, -21.77734375, -19.7626953125, -17.748046875, -15.7333984375, -13.71875, -11.7041015625, -9.689453125, -7.6748046875, -5.66015625, -3.6455078125, -1.630859375, 0.3837890625, 2.3984375, 4.4130859375, 6.427734375, 8.4423828125, 10.45703125, 12.4716796875, 14.486328125, 16.5009765625, 18.515625, 20.5302734375, 22.544921875, 24.5595703125, 26.57421875, 28.5888671875, 30.603515625, 32.6181640625, 34.6328125, 36.6474609375, 38.662109375, 40.6767578125, 42.69140625, 44.7060546875, 46.720703125, 48.7353515625, 50.75]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 4.0, 7.0, 10.0, 14.0, 11.0, 30.0, 33.0, 58.0, 54.0, 90.0, 168.0, 266.0, 319.0, 695.0, 982.0, 1802.0, 3291.0, 7633.0, 21774.0, 87888.0, 518826.0, 318682.0, 57274.0, 15851.0, 6064.0, 2847.0, 1482.0, 848.0, 524.0, 347.0, 206.0, 132.0, 115.0, 59.0, 46.0, 33.0, 27.0, 17.0, 14.0, 12.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0], "bins": [-126.375, -123.123046875, -119.87109375, -116.619140625, -113.3671875, -110.115234375, -106.86328125, -103.611328125, -100.359375, -97.107421875, -93.85546875, -90.603515625, -87.3515625, -84.099609375, -80.84765625, -77.595703125, -74.34375, -71.091796875, -67.83984375, -64.587890625, -61.3359375, -58.083984375, -54.83203125, -51.580078125, -48.328125, -45.076171875, -41.82421875, -38.572265625, -35.3203125, -32.068359375, -28.81640625, -25.564453125, -22.3125, -19.060546875, -15.80859375, -12.556640625, -9.3046875, -6.052734375, -2.80078125, 0.451171875, 3.703125, 6.955078125, 10.20703125, 13.458984375, 16.7109375, 19.962890625, 23.21484375, 26.466796875, 29.71875, 32.970703125, 36.22265625, 39.474609375, 42.7265625, 45.978515625, 49.23046875, 52.482421875, 55.734375, 58.986328125, 62.23828125, 65.490234375, 68.7421875, 71.994140625, 75.24609375, 78.498046875, 81.75]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 7.0, 10.0, 10.0, 16.0, 11.0, 14.0, 18.0, 21.0, 25.0, 28.0, 30.0, 27.0, 50.0, 51.0, 80.0, 92.0, 140.0, 251.0, 1466.0, 163.0, 99.0, 74.0, 52.0, 29.0, 49.0, 36.0, 34.0, 26.0, 25.0, 18.0, 17.0, 10.0, 9.0, 16.0, 7.0, 3.0, 3.0, 5.0, 2.0, 3.0, 5.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-143.75, -139.5546875, -135.359375, -131.1640625, -126.96875, -122.7734375, -118.578125, -114.3828125, -110.1875, -105.9921875, -101.796875, -97.6015625, -93.40625, -89.2109375, -85.015625, -80.8203125, -76.625, -72.4296875, -68.234375, -64.0390625, -59.84375, -55.6484375, -51.453125, -47.2578125, -43.0625, -38.8671875, -34.671875, -30.4765625, -26.28125, -22.0859375, -17.890625, -13.6953125, -9.5, -5.3046875, -1.109375, 3.0859375, 7.28125, 11.4765625, 15.671875, 19.8671875, 24.0625, 28.2578125, 32.453125, 36.6484375, 40.84375, 45.0390625, 49.234375, 53.4296875, 57.625, 61.8203125, 66.015625, 70.2109375, 74.40625, 78.6015625, 82.796875, 86.9921875, 91.1875, 95.3828125, 99.578125, 103.7734375, 107.96875, 112.1640625, 116.359375, 120.5546875, 124.75]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 8.0, 3.0, 4.0, 4.0, 14.0, 9.0, 13.0, 21.0, 24.0, 25.0, 36.0, 50.0, 73.0, 98.0, 101.0, 196.0, 328.0, 615.0, 1424.0, 16065.0, 3061029.0, 61551.0, 2108.0, 700.0, 386.0, 236.0, 154.0, 110.0, 73.0, 48.0, 44.0, 41.0, 21.0, 17.0, 18.0, 12.0, 15.0, 12.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-306.75, -297.0546875, -287.359375, -277.6640625, -267.96875, -258.2734375, -248.578125, -238.8828125, -229.1875, -219.4921875, -209.796875, -200.1015625, -190.40625, -180.7109375, -171.015625, -161.3203125, -151.625, -141.9296875, -132.234375, -122.5390625, -112.84375, -103.1484375, -93.453125, -83.7578125, -74.0625, -64.3671875, -54.671875, -44.9765625, -35.28125, -25.5859375, -15.890625, -6.1953125, 3.5, 13.1953125, 22.890625, 32.5859375, 42.28125, 51.9765625, 61.671875, 71.3671875, 81.0625, 90.7578125, 100.453125, 110.1484375, 119.84375, 129.5390625, 139.234375, 148.9296875, 158.625, 168.3203125, 178.015625, 187.7109375, 197.40625, 207.1015625, 216.796875, 226.4921875, 236.1875, 245.8828125, 255.578125, 265.2734375, 274.96875, 284.6640625, 294.359375, 304.0546875, 313.75]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 22.0, 307.0, 622.0, 59.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.9183349609375, -450.8454895019531, -395.77264404296875, -340.6998291015625, -285.6269836425781, -230.55413818359375, -175.4813232421875, -120.40847778320312, -65.33563232421875, -10.262794494628906, 44.81004333496094, 99.88287353515625, 154.95571899414062, 210.028564453125, 265.10137939453125, 320.1742248535156, 375.2470703125, 430.3199157714844, 485.39276123046875, 540.465576171875, 595.5384521484375, 650.6112670898438, 705.68408203125, 760.7569580078125, 815.8297729492188, 870.902587890625, 925.9754638671875, 981.0482788085938, 1036.12109375, 1091.1939697265625, 1146.266845703125, 1201.339599609375, 1256.412353515625, 1311.4852294921875, 1366.5579833984375, 1421.630859375, 1476.7037353515625, 1531.776611328125, 1586.849365234375, 1641.9222412109375, 1696.9951171875, 1752.0679931640625, 1807.1407470703125, 1862.213623046875, 1917.2864990234375, 1972.359375, 2027.43212890625, 2082.5048828125, 2137.57763671875, 2192.650390625, 2247.723388671875, 2302.796142578125, 2357.868896484375, 2412.94189453125, 2468.0146484375, 2523.08740234375, 2578.160400390625, 2633.233154296875, 2688.30615234375, 2743.37890625, 2798.45166015625, 2853.524658203125, 2908.597412109375, 2963.670166015625, 3018.7431640625]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 6.0, 5.0, 5.0, 11.0, 14.0, 14.0, 12.0, 12.0, 14.0, 15.0, 14.0, 29.0, 29.0, 32.0, 39.0, 30.0, 40.0, 45.0, 35.0, 43.0, 35.0, 33.0, 42.0, 49.0, 37.0, 37.0, 39.0, 35.0, 24.0, 24.0, 26.0, 28.0, 14.0, 24.0, 17.0, 15.0, 11.0, 13.0, 10.0, 8.0, 7.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-378.24462890625, -367.5784912109375, -356.912353515625, -346.2462158203125, -335.580078125, -324.9139404296875, -314.247802734375, -303.5816955566406, -292.9155578613281, -282.2494201660156, -271.5832824707031, -260.9171447753906, -250.2510223388672, -239.5848846435547, -228.9187469482422, -218.25262451171875, -207.5864715576172, -196.9203338623047, -186.2541961669922, -175.58807373046875, -164.92193603515625, -154.25579833984375, -143.58966064453125, -132.92352294921875, -122.25739288330078, -111.59125518798828, -100.92512512207031, -90.25898742675781, -79.59284973144531, -68.92671966552734, -58.260581970214844, -47.594451904296875, -36.928314208984375, -26.26218032836914, -15.596044540405273, -4.929908752441406, 5.736225128173828, 16.402359008789062, 27.068496704101562, 37.73462677001953, 48.40076446533203, 59.066898345947266, 69.7330322265625, 80.399169921875, 91.0653076171875, 101.73143768310547, 112.39757537841797, 123.06370544433594, 133.72984313964844, 144.39598083496094, 155.06211853027344, 165.72824096679688, 176.39437866210938, 187.06051635742188, 197.72665405273438, 208.39279174804688, 219.05892944335938, 229.72506713867188, 240.39120483398438, 251.05734252929688, 261.7234802246094, 272.38958740234375, 283.05572509765625, 293.72186279296875, 304.38800048828125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 4.0, 12.0, 12.0, 15.0, 13.0, 12.0, 26.0, 17.0, 23.0, 29.0, 20.0, 40.0, 39.0, 38.0, 39.0, 36.0, 51.0, 35.0, 46.0, 45.0, 44.0, 32.0, 26.0, 38.0, 33.0, 31.0, 35.0, 35.0, 25.0, 28.0, 13.0, 19.0, 15.0, 12.0, 10.0, 7.0, 7.0, 8.0, 6.0, 4.0, 3.0, 4.0, 3.0, 5.0], "bins": [-79.625, -77.56005859375, -75.4951171875, -73.43017578125, -71.365234375, -69.30029296875, -67.2353515625, -65.17041015625, -63.10546875, -61.04052734375, -58.9755859375, -56.91064453125, -54.845703125, -52.78076171875, -50.7158203125, -48.65087890625, -46.5859375, -44.52099609375, -42.4560546875, -40.39111328125, -38.326171875, -36.26123046875, -34.1962890625, -32.13134765625, -30.06640625, -28.00146484375, -25.9365234375, -23.87158203125, -21.806640625, -19.74169921875, -17.6767578125, -15.61181640625, -13.546875, -11.48193359375, -9.4169921875, -7.35205078125, -5.287109375, -3.22216796875, -1.1572265625, 0.90771484375, 2.97265625, 5.03759765625, 7.1025390625, 9.16748046875, 11.232421875, 13.29736328125, 15.3623046875, 17.42724609375, 19.4921875, 21.55712890625, 23.6220703125, 25.68701171875, 27.751953125, 29.81689453125, 31.8818359375, 33.94677734375, 36.01171875, 38.07666015625, 40.1416015625, 42.20654296875, 44.271484375, 46.33642578125, 48.4013671875, 50.46630859375, 52.53125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 11.0, 12.0, 21.0, 30.0, 31.0, 42.0, 32.0, 68.0, 88.0, 117.0, 162.0, 229.0, 346.0, 495.0, 798.0, 1387.0, 2817.0, 6589.0, 19044.0, 130840.0, 3653767.0, 337737.0, 24388.0, 7717.0, 3165.0, 1659.0, 876.0, 519.0, 367.0, 248.0, 165.0, 126.0, 104.0, 69.0, 59.0, 39.0, 27.0, 26.0, 21.0, 15.0, 9.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-339.0, -328.6015625, -318.203125, -307.8046875, -297.40625, -287.0078125, -276.609375, -266.2109375, -255.8125, -245.4140625, -235.015625, -224.6171875, -214.21875, -203.8203125, -193.421875, -183.0234375, -172.625, -162.2265625, -151.828125, -141.4296875, -131.03125, -120.6328125, -110.234375, -99.8359375, -89.4375, -79.0390625, -68.640625, -58.2421875, -47.84375, -37.4453125, -27.046875, -16.6484375, -6.25, 4.1484375, 14.546875, 24.9453125, 35.34375, 45.7421875, 56.140625, 66.5390625, 76.9375, 87.3359375, 97.734375, 108.1328125, 118.53125, 128.9296875, 139.328125, 149.7265625, 160.125, 170.5234375, 180.921875, 191.3203125, 201.71875, 212.1171875, 222.515625, 232.9140625, 243.3125, 253.7109375, 264.109375, 274.5078125, 284.90625, 295.3046875, 305.703125, 316.1015625, 326.5]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 11.0, 7.0, 12.0, 18.0, 14.0, 30.0, 38.0, 68.0, 88.0, 148.0, 280.0, 550.0, 947.0, 815.0, 414.0, 203.0, 122.0, 91.0, 60.0, 37.0, 22.0, 25.0, 14.0, 18.0, 12.0, 7.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.625, -155.046875, -149.46875, -143.890625, -138.3125, -132.734375, -127.15625, -121.578125, -116.0, -110.421875, -104.84375, -99.265625, -93.6875, -88.109375, -82.53125, -76.953125, -71.375, -65.796875, -60.21875, -54.640625, -49.0625, -43.484375, -37.90625, -32.328125, -26.75, -21.171875, -15.59375, -10.015625, -4.4375, 1.140625, 6.71875, 12.296875, 17.875, 23.453125, 29.03125, 34.609375, 40.1875, 45.765625, 51.34375, 56.921875, 62.5, 68.078125, 73.65625, 79.234375, 84.8125, 90.390625, 95.96875, 101.546875, 107.125, 112.703125, 118.28125, 123.859375, 129.4375, 135.015625, 140.59375, 146.171875, 151.75, 157.328125, 162.90625, 168.484375, 174.0625, 179.640625, 185.21875, 190.796875, 196.375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 9.0, 14.0, 10.0, 22.0, 27.0, 35.0, 45.0, 71.0, 119.0, 158.0, 244.0, 364.0, 572.0, 933.0, 1483.0, 2729.0, 4819.0, 8828.0, 17596.0, 37747.0, 94896.0, 351424.0, 2618321.0, 803208.0, 147825.0, 53350.0, 23246.0, 11553.0, 6049.0, 3479.0, 1867.0, 1182.0, 739.0, 404.0, 264.0, 211.0, 132.0, 84.0, 61.0, 46.0, 33.0, 19.0, 17.0, 8.0, 13.0, 7.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0], "bins": [-109.8125, -106.5537109375, -103.294921875, -100.0361328125, -96.77734375, -93.5185546875, -90.259765625, -87.0009765625, -83.7421875, -80.4833984375, -77.224609375, -73.9658203125, -70.70703125, -67.4482421875, -64.189453125, -60.9306640625, -57.671875, -54.4130859375, -51.154296875, -47.8955078125, -44.63671875, -41.3779296875, -38.119140625, -34.8603515625, -31.6015625, -28.3427734375, -25.083984375, -21.8251953125, -18.56640625, -15.3076171875, -12.048828125, -8.7900390625, -5.53125, -2.2724609375, 0.986328125, 4.2451171875, 7.50390625, 10.7626953125, 14.021484375, 17.2802734375, 20.5390625, 23.7978515625, 27.056640625, 30.3154296875, 33.57421875, 36.8330078125, 40.091796875, 43.3505859375, 46.609375, 49.8681640625, 53.126953125, 56.3857421875, 59.64453125, 62.9033203125, 66.162109375, 69.4208984375, 72.6796875, 75.9384765625, 79.197265625, 82.4560546875, 85.71484375, 88.9736328125, 92.232421875, 95.4912109375, 98.75]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 10.0, 5.0, 14.0, 13.0, 15.0, 20.0, 12.0, 21.0, 28.0, 46.0, 62.0, 61.0, 72.0, 65.0, 68.0, 71.0, 66.0, 66.0, 43.0, 43.0, 39.0, 33.0, 23.0, 11.0, 18.0, 17.0, 15.0, 6.0, 8.0, 6.0, 4.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-506.3139343261719, -486.72625732421875, -467.13861083984375, -447.55096435546875, -427.9632873535156, -408.3756103515625, -388.7879638671875, -369.2003173828125, -349.6126403808594, -330.02496337890625, -310.43731689453125, -290.84967041015625, -271.2619934082031, -251.67433166503906, -232.086669921875, -212.49900817871094, -192.91134643554688, -173.3236846923828, -153.73602294921875, -134.1483612060547, -114.56069946289062, -94.97303771972656, -75.3853759765625, -55.79771423339844, -36.210052490234375, -16.622390747070312, 2.96527099609375, 22.552932739257812, 42.140594482421875, 61.72825622558594, 81.31591796875, 100.90357971191406, 120.49127197265625, 140.0789337158203, 159.66659545898438, 179.25425720214844, 198.8419189453125, 218.42958068847656, 238.01724243164062, 257.60491943359375, 277.19256591796875, 296.78021240234375, 316.3678894042969, 335.95556640625, 355.543212890625, 375.130859375, 394.7185363769531, 414.30621337890625, 433.89385986328125, 453.48150634765625, 473.0691833496094, 492.6568603515625, 512.2445068359375, 531.8321533203125, 551.4197998046875, 571.0075073242188, 590.5951538085938, 610.1828002929688, 629.7705078125, 649.358154296875, 668.94580078125, 688.533447265625, 708.12109375, 727.7088012695312, 747.2964477539062]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 9.0, 10.0, 5.0, 11.0, 14.0, 18.0, 19.0, 25.0, 27.0, 22.0, 21.0, 31.0, 25.0, 35.0, 28.0, 32.0, 38.0, 38.0, 45.0, 30.0, 45.0, 39.0, 36.0, 35.0, 39.0, 37.0, 19.0, 29.0, 31.0, 30.0, 25.0, 33.0, 13.0, 18.0, 11.0, 13.0, 8.0, 14.0, 14.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-495.6292724609375, -480.5400695800781, -465.45086669921875, -450.36163330078125, -435.2724304199219, -420.1832275390625, -405.0940246582031, -390.00482177734375, -374.91558837890625, -359.8263854980469, -344.7371826171875, -329.64794921875, -314.5587463378906, -299.46954345703125, -284.3803405761719, -269.2911376953125, -254.20193481445312, -239.11273193359375, -224.0235137939453, -208.93431091308594, -193.8450927734375, -178.75588989257812, -163.66668701171875, -148.57748413085938, -133.48826599121094, -118.39905548095703, -103.30984497070312, -88.22064208984375, -73.13143157958984, -58.04222106933594, -42.95301818847656, -27.863807678222656, -12.774566650390625, 2.3146419525146484, 17.403850555419922, 32.49305725097656, 47.58226776123047, 62.671478271484375, 77.76068115234375, 92.84989166259766, 107.93910217285156, 123.02831268310547, 138.11752319335938, 153.20672607421875, 168.29592895507812, 183.38514709472656, 198.47434997558594, 213.56356811523438, 228.65277099609375, 243.74197387695312, 258.8311767578125, 273.92041015625, 289.0096130371094, 304.09881591796875, 319.1880187988281, 334.2772216796875, 349.366455078125, 364.4556579589844, 379.54486083984375, 394.63409423828125, 409.7232971191406, 424.8125, 439.9017028808594, 454.99090576171875, 470.0801086425781]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 10.0, 13.0, 10.0, 18.0, 16.0, 14.0, 24.0, 16.0, 22.0, 22.0, 22.0, 24.0, 27.0, 22.0, 47.0, 32.0, 34.0, 36.0, 50.0, 31.0, 47.0, 37.0, 37.0, 31.0, 40.0, 22.0, 33.0, 23.0, 28.0, 18.0, 25.0, 32.0, 17.0, 13.0, 13.0, 16.0, 9.0, 8.0, 13.0, 5.0, 8.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-827.0, -799.7890625, -772.578125, -745.3671875, -718.15625, -690.9453125, -663.734375, -636.5234375, -609.3125, -582.1015625, -554.890625, -527.6796875, -500.46875, -473.2578125, -446.046875, -418.8359375, -391.625, -364.4140625, -337.203125, -309.9921875, -282.78125, -255.5703125, -228.359375, -201.1484375, -173.9375, -146.7265625, -119.515625, -92.3046875, -65.09375, -37.8828125, -10.671875, 16.5390625, 43.75, 70.9609375, 98.171875, 125.3828125, 152.59375, 179.8046875, 207.015625, 234.2265625, 261.4375, 288.6484375, 315.859375, 343.0703125, 370.28125, 397.4921875, 424.703125, 451.9140625, 479.125, 506.3359375, 533.546875, 560.7578125, 587.96875, 615.1796875, 642.390625, 669.6015625, 696.8125, 724.0234375, 751.234375, 778.4453125, 805.65625, 832.8671875, 860.078125, 887.2890625, 914.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 17.0, 18.0, 41.0, 51.0, 75.0, 102.0, 163.0, 244.0, 344.0, 546.0, 770.0, 1170.0, 1887.0, 2698.0, 4181.0, 6230.0, 9762.0, 15209.0, 23765.0, 38479.0, 65254.0, 125474.0, 291456.0, 217977.0, 98117.0, 54195.0, 32724.0, 20376.0, 12871.0, 8351.0, 5418.0, 3523.0, 2382.0, 1561.0, 992.0, 710.0, 456.0, 312.0, 196.0, 147.0, 99.0, 71.0, 51.0, 32.0, 22.0, 8.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-65.6875, -63.556640625, -61.42578125, -59.294921875, -57.1640625, -55.033203125, -52.90234375, -50.771484375, -48.640625, -46.509765625, -44.37890625, -42.248046875, -40.1171875, -37.986328125, -35.85546875, -33.724609375, -31.59375, -29.462890625, -27.33203125, -25.201171875, -23.0703125, -20.939453125, -18.80859375, -16.677734375, -14.546875, -12.416015625, -10.28515625, -8.154296875, -6.0234375, -3.892578125, -1.76171875, 0.369140625, 2.5, 4.630859375, 6.76171875, 8.892578125, 11.0234375, 13.154296875, 15.28515625, 17.416015625, 19.546875, 21.677734375, 23.80859375, 25.939453125, 28.0703125, 30.201171875, 32.33203125, 34.462890625, 36.59375, 38.724609375, 40.85546875, 42.986328125, 45.1171875, 47.248046875, 49.37890625, 51.509765625, 53.640625, 55.771484375, 57.90234375, 60.033203125, 62.1640625, 64.294921875, 66.42578125, 68.556640625, 70.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 10.0, 15.0, 14.0, 16.0, 11.0, 20.0, 17.0, 22.0, 28.0, 22.0, 31.0, 27.0, 37.0, 28.0, 31.0, 28.0, 35.0, 34.0, 46.0, 1061.0, 40.0, 33.0, 27.0, 35.0, 28.0, 30.0, 40.0, 35.0, 33.0, 22.0, 23.0, 22.0, 17.0, 15.0, 15.0, 10.0, 9.0, 9.0, 9.0, 7.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-545.5, -529.08203125, -512.6640625, -496.24609375, -479.828125, -463.41015625, -446.9921875, -430.57421875, -414.15625, -397.73828125, -381.3203125, -364.90234375, -348.484375, -332.06640625, -315.6484375, -299.23046875, -282.8125, -266.39453125, -249.9765625, -233.55859375, -217.140625, -200.72265625, -184.3046875, -167.88671875, -151.46875, -135.05078125, -118.6328125, -102.21484375, -85.796875, -69.37890625, -52.9609375, -36.54296875, -20.125, -3.70703125, 12.7109375, 29.12890625, 45.546875, 61.96484375, 78.3828125, 94.80078125, 111.21875, 127.63671875, 144.0546875, 160.47265625, 176.890625, 193.30859375, 209.7265625, 226.14453125, 242.5625, 258.98046875, 275.3984375, 291.81640625, 308.234375, 324.65234375, 341.0703125, 357.48828125, 373.90625, 390.32421875, 406.7421875, 423.16015625, 439.578125, 455.99609375, 472.4140625, 488.83203125, 505.25]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 13.0, 26.0, 25.0, 33.0, 60.0, 70.0, 117.0, 171.0, 234.0, 375.0, 513.0, 761.0, 1135.0, 1703.0, 2407.0, 3597.0, 5495.0, 8161.0, 12575.0, 19469.0, 30887.0, 50084.0, 84273.0, 167503.0, 1350585.0, 149558.0, 78165.0, 46749.0, 28718.0, 18246.0, 11985.0, 7712.0, 5021.0, 3510.0, 2327.0, 1546.0, 997.0, 697.0, 483.0, 379.0, 236.0, 160.0, 112.0, 76.0, 52.0, 34.0, 31.0, 16.0, 10.0, 11.0, 6.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.5625, -39.27197265625, -37.9814453125, -36.69091796875, -35.400390625, -34.10986328125, -32.8193359375, -31.52880859375, -30.23828125, -28.94775390625, -27.6572265625, -26.36669921875, -25.076171875, -23.78564453125, -22.4951171875, -21.20458984375, -19.9140625, -18.62353515625, -17.3330078125, -16.04248046875, -14.751953125, -13.46142578125, -12.1708984375, -10.88037109375, -9.58984375, -8.29931640625, -7.0087890625, -5.71826171875, -4.427734375, -3.13720703125, -1.8466796875, -0.55615234375, 0.734375, 2.02490234375, 3.3154296875, 4.60595703125, 5.896484375, 7.18701171875, 8.4775390625, 9.76806640625, 11.05859375, 12.34912109375, 13.6396484375, 14.93017578125, 16.220703125, 17.51123046875, 18.8017578125, 20.09228515625, 21.3828125, 22.67333984375, 23.9638671875, 25.25439453125, 26.544921875, 27.83544921875, 29.1259765625, 30.41650390625, 31.70703125, 32.99755859375, 34.2880859375, 35.57861328125, 36.869140625, 38.15966796875, 39.4501953125, 40.74072265625, 42.03125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 9.0, 10.0, 12.0, 11.0, 26.0, 29.0, 36.0, 47.0, 91.0, 101.0, 121.0, 111.0, 99.0, 74.0, 48.0, 43.0, 16.0, 19.0, 13.0, 10.0, 9.0, 5.0, 9.0, 6.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.5087890625, -0.4945869445800781, -0.48038482666015625, -0.4661827087402344, -0.4519805908203125, -0.4377784729003906, -0.42357635498046875, -0.4093742370605469, -0.395172119140625, -0.3809700012207031, -0.36676788330078125, -0.3525657653808594, -0.3383636474609375, -0.3241615295410156, -0.30995941162109375, -0.2957572937011719, -0.28155517578125, -0.2673530578613281, -0.25315093994140625, -0.23894882202148438, -0.2247467041015625, -0.21054458618164062, -0.19634246826171875, -0.18214035034179688, -0.167938232421875, -0.15373611450195312, -0.13953399658203125, -0.12533187866210938, -0.1111297607421875, -0.09692764282226562, -0.08272552490234375, -0.06852340698242188, -0.0543212890625, -0.040119171142578125, -0.02591705322265625, -0.011714935302734375, 0.0024871826171875, 0.016689300537109375, 0.03089141845703125, 0.045093536376953125, 0.059295654296875, 0.07349777221679688, 0.08769989013671875, 0.10190200805664062, 0.1161041259765625, 0.13030624389648438, 0.14450836181640625, 0.15871047973632812, 0.17291259765625, 0.18711471557617188, 0.20131683349609375, 0.21551895141601562, 0.2297210693359375, 0.24392318725585938, 0.25812530517578125, 0.2723274230957031, 0.286529541015625, 0.3007316589355469, 0.31493377685546875, 0.3291358947753906, 0.3433380126953125, 0.3575401306152344, 0.37174224853515625, 0.3859443664550781, 0.400146484375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 12.0, 6.0, 8.0, 9.0, 9.0, 11.0, 16.0, 28.0, 26.0, 44.0, 47.0, 73.0, 102.0, 182.0, 540.0, 1796.0, 13625.0, 950091.0, 76527.0, 3769.0, 847.0, 296.0, 112.0, 78.0, 60.0, 51.0, 38.0, 24.0, 23.0, 14.0, 6.0, 11.0, 6.0, 10.0, 8.0, 3.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.68359375, -6.47930908203125, -6.2750244140625, -6.07073974609375, -5.866455078125, -5.66217041015625, -5.4578857421875, -5.25360107421875, -5.04931640625, -4.84503173828125, -4.6407470703125, -4.43646240234375, -4.232177734375, -4.02789306640625, -3.8236083984375, -3.61932373046875, -3.4150390625, -3.21075439453125, -3.0064697265625, -2.80218505859375, -2.597900390625, -2.39361572265625, -2.1893310546875, -1.98504638671875, -1.78076171875, -1.57647705078125, -1.3721923828125, -1.16790771484375, -0.963623046875, -0.75933837890625, -0.5550537109375, -0.35076904296875, -0.146484375, 0.05780029296875, 0.2620849609375, 0.46636962890625, 0.670654296875, 0.87493896484375, 1.0792236328125, 1.28350830078125, 1.48779296875, 1.69207763671875, 1.8963623046875, 2.10064697265625, 2.304931640625, 2.50921630859375, 2.7135009765625, 2.91778564453125, 3.1220703125, 3.32635498046875, 3.5306396484375, 3.73492431640625, 3.939208984375, 4.14349365234375, 4.3477783203125, 4.55206298828125, 4.75634765625, 4.96063232421875, 5.1649169921875, 5.36920166015625, 5.573486328125, 5.77777099609375, 5.9820556640625, 6.18634033203125, 6.390625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 13.0, 73.0, 379.0, 403.0, 94.0, 22.0, 14.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.5265917778015137, -3.458897352218628, -3.391202926635742, -3.3235082626342773, -3.2558138370513916, -3.188119411468506, -3.120424747467041, -3.0527303218841553, -2.9850358963012695, -2.917341470718384, -2.849647045135498, -2.781952381134033, -2.7142579555511475, -2.6465635299682617, -2.578868865966797, -2.511174440383911, -2.4434800148010254, -2.3757855892181396, -2.308091163635254, -2.240396499633789, -2.1727020740509033, -2.1050076484680176, -2.0373129844665527, -1.969618558883667, -1.9019241333007812, -1.8342297077178955, -1.7665351629257202, -1.698840618133545, -1.6311461925506592, -1.5634517669677734, -1.4957572221755981, -1.4280626773834229, -1.360368013381958, -1.2926735877990723, -1.224979043006897, -1.1572844982147217, -1.089590072631836, -1.0218956470489502, -0.9542011022567749, -0.8865066170692444, -0.8188121318817139, -0.7511176466941833, -0.6834231615066528, -0.6157286763191223, -0.5480341911315918, -0.4803397059440613, -0.41264522075653076, -0.34495073556900024, -0.2772562503814697, -0.2095617651939392, -0.1418672800064087, -0.07417279481887817, -0.006478309631347656, 0.06121617555618286, 0.12891066074371338, 0.1966051459312439, 0.2642996311187744, 0.33199411630630493, 0.39968860149383545, 0.46738308668136597, 0.5350775718688965, 0.602772057056427, 0.6704665422439575, 0.738161027431488, 0.8058555126190186]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 1.0, 5.0, 9.0, 10.0, 7.0, 18.0, 7.0, 13.0, 18.0, 7.0, 20.0, 17.0, 19.0, 25.0, 28.0, 33.0, 30.0, 20.0, 48.0, 44.0, 22.0, 35.0, 41.0, 37.0, 29.0, 35.0, 39.0, 40.0, 27.0, 34.0, 31.0, 28.0, 21.0, 25.0, 23.0, 21.0, 15.0, 11.0, 20.0, 15.0, 15.0, 8.0, 10.0, 5.0, 6.0, 5.0, 4.0, 1.0, 4.0, 4.0, 5.0, 1.0, 3.0], "bins": [-0.38483625650405884, -0.3735042214393616, -0.3621721565723419, -0.35084012150764465, -0.3395080864429474, -0.32817602157592773, -0.31684398651123047, -0.3055119514465332, -0.29417988657951355, -0.2828478515148163, -0.27151578664779663, -0.26018375158309937, -0.2488517016172409, -0.23751965165138245, -0.22618761658668518, -0.21485556662082672, -0.20352353155612946, -0.192191481590271, -0.18085944652557373, -0.16952739655971527, -0.1581953465938568, -0.14686331152915955, -0.1355312615633011, -0.12419921159744263, -0.11286716908216476, -0.1015351265668869, -0.09020307660102844, -0.07887103408575058, -0.06753899157047272, -0.05620694160461426, -0.044874899089336395, -0.033542849123477936, -0.022210806608200073, -0.010878761298954487, 0.00045328401029109955, 0.011785328388214111, 0.023117374628782272, 0.03444942086935043, 0.045781463384628296, 0.057113513350486755, 0.06844555586576462, 0.07977759838104248, 0.09110964834690094, 0.1024416908621788, 0.11377373337745667, 0.12510578334331512, 0.13643783330917358, 0.14776986837387085, 0.1591019183397293, 0.17043396830558777, 0.18176600337028503, 0.1930980533361435, 0.20443010330200195, 0.21576213836669922, 0.22709418833255768, 0.23842623829841614, 0.2497582733631134, 0.26109030842781067, 0.2724223732948303, 0.2837544083595276, 0.29508644342422485, 0.3064185082912445, 0.3177505433559418, 0.3290826082229614, 0.3404146432876587]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 10.0, 13.0, 10.0, 19.0, 14.0, 15.0, 24.0, 17.0, 20.0, 23.0, 22.0, 26.0, 25.0, 21.0, 45.0, 34.0, 35.0, 36.0, 49.0, 32.0, 48.0, 36.0, 37.0, 31.0, 40.0, 22.0, 33.0, 24.0, 27.0, 18.0, 25.0, 29.0, 20.0, 12.0, 14.0, 16.0, 9.0, 9.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-827.0, -799.796875, -772.59375, -745.390625, -718.1875, -690.984375, -663.78125, -636.578125, -609.375, -582.171875, -554.96875, -527.765625, -500.5625, -473.359375, -446.15625, -418.953125, -391.75, -364.546875, -337.34375, -310.140625, -282.9375, -255.734375, -228.53125, -201.328125, -174.125, -146.921875, -119.71875, -92.515625, -65.3125, -38.109375, -10.90625, 16.296875, 43.5, 70.703125, 97.90625, 125.109375, 152.3125, 179.515625, 206.71875, 233.921875, 261.125, 288.328125, 315.53125, 342.734375, 369.9375, 397.140625, 424.34375, 451.546875, 478.75, 505.953125, 533.15625, 560.359375, 587.5625, 614.765625, 641.96875, 669.171875, 696.375, 723.578125, 750.78125, 777.984375, 805.1875, 832.390625, 859.59375, 886.796875, 914.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 8.0, 10.0, 14.0, 17.0, 23.0, 28.0, 37.0, 48.0, 61.0, 80.0, 90.0, 130.0, 195.0, 289.0, 444.0, 869.0, 1633.0, 3270.0, 7182.0, 15779.0, 37871.0, 106993.0, 359695.0, 345849.0, 101978.0, 36570.0, 15307.0, 6900.0, 3321.0, 1596.0, 817.0, 448.0, 259.0, 195.0, 120.0, 93.0, 65.0, 55.0, 49.0, 33.0, 27.0, 24.0, 15.0, 15.0, 15.0, 8.0, 7.0, 5.0, 4.0, 1.0, 4.0, 0.0, 3.0, 2.0], "bins": [-125.125, -121.3310546875, -117.537109375, -113.7431640625, -109.94921875, -106.1552734375, -102.361328125, -98.5673828125, -94.7734375, -90.9794921875, -87.185546875, -83.3916015625, -79.59765625, -75.8037109375, -72.009765625, -68.2158203125, -64.421875, -60.6279296875, -56.833984375, -53.0400390625, -49.24609375, -45.4521484375, -41.658203125, -37.8642578125, -34.0703125, -30.2763671875, -26.482421875, -22.6884765625, -18.89453125, -15.1005859375, -11.306640625, -7.5126953125, -3.71875, 0.0751953125, 3.869140625, 7.6630859375, 11.45703125, 15.2509765625, 19.044921875, 22.8388671875, 26.6328125, 30.4267578125, 34.220703125, 38.0146484375, 41.80859375, 45.6025390625, 49.396484375, 53.1904296875, 56.984375, 60.7783203125, 64.572265625, 68.3662109375, 72.16015625, 75.9541015625, 79.748046875, 83.5419921875, 87.3359375, 91.1298828125, 94.923828125, 98.7177734375, 102.51171875, 106.3056640625, 110.099609375, 113.8935546875, 117.6875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 5.0, 11.0, 12.0, 19.0, 30.0, 46.0, 51.0, 64.0, 71.0, 77.0, 108.0, 2125.0, 81.0, 62.0, 72.0, 48.0, 46.0, 31.0, 28.0, 15.0, 12.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2578.0, -2500.40625, -2422.8125, -2345.21875, -2267.625, -2190.03125, -2112.4375, -2034.84375, -1957.25, -1879.65625, -1802.0625, -1724.46875, -1646.875, -1569.28125, -1491.6875, -1414.09375, -1336.5, -1258.90625, -1181.3125, -1103.71875, -1026.125, -948.53125, -870.9375, -793.34375, -715.75, -638.15625, -560.5625, -482.96875, -405.375, -327.78125, -250.1875, -172.59375, -95.0, -17.40625, 60.1875, 137.78125, 215.375, 292.96875, 370.5625, 448.15625, 525.75, 603.34375, 680.9375, 758.53125, 836.125, 913.71875, 991.3125, 1068.90625, 1146.5, 1224.09375, 1301.6875, 1379.28125, 1456.875, 1534.46875, 1612.0625, 1689.65625, 1767.25, 1844.84375, 1922.4375, 2000.03125, 2077.625, 2155.21875, 2232.8125, 2310.40625, 2388.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 7.0, 6.0, 8.0, 12.0, 20.0, 15.0, 37.0, 51.0, 85.0, 145.0, 270.0, 479.0, 1134.0, 3847.0, 30664.0, 2923263.0, 172644.0, 9391.0, 1962.0, 767.0, 367.0, 187.0, 122.0, 69.0, 38.0, 23.0, 21.0, 16.0, 11.0, 11.0, 10.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-393.25, -380.46484375, -367.6796875, -354.89453125, -342.109375, -329.32421875, -316.5390625, -303.75390625, -290.96875, -278.18359375, -265.3984375, -252.61328125, -239.828125, -227.04296875, -214.2578125, -201.47265625, -188.6875, -175.90234375, -163.1171875, -150.33203125, -137.546875, -124.76171875, -111.9765625, -99.19140625, -86.40625, -73.62109375, -60.8359375, -48.05078125, -35.265625, -22.48046875, -9.6953125, 3.08984375, 15.875, 28.66015625, 41.4453125, 54.23046875, 67.015625, 79.80078125, 92.5859375, 105.37109375, 118.15625, 130.94140625, 143.7265625, 156.51171875, 169.296875, 182.08203125, 194.8671875, 207.65234375, 220.4375, 233.22265625, 246.0078125, 258.79296875, 271.578125, 284.36328125, 297.1484375, 309.93359375, 322.71875, 335.50390625, 348.2890625, 361.07421875, 373.859375, 386.64453125, 399.4296875, 412.21484375, 425.0]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 5.0, 3.0, 8.0, 16.0, 24.0, 36.0, 76.0, 156.0, 232.0, 195.0, 96.0, 63.0, 21.0, 21.0, 11.0, 10.0, 5.0, 6.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1138.414306640625, -1048.4727783203125, -958.5311279296875, -868.589599609375, -778.6480102539062, -688.7064208984375, -598.764892578125, -508.82330322265625, -418.8817138671875, -328.94012451171875, -238.99856567382812, -149.0570068359375, -59.11541748046875, 30.826171875, 120.7677001953125, 210.70928955078125, 300.65087890625, 390.59246826171875, 480.5340270996094, 570.4755859375, 660.4171752929688, 750.3587646484375, 840.30029296875, 930.2418823242188, 1020.1834716796875, 1110.125, 1200.066650390625, 1290.0081787109375, 1379.94970703125, 1469.891357421875, 1559.8328857421875, 1649.7744140625, 1739.7158203125, 1829.6573486328125, 1919.5989990234375, 2009.54052734375, 2099.482177734375, 2189.423828125, 2279.365234375, 2369.306884765625, 2459.24853515625, 2549.190185546875, 2639.131591796875, 2729.0732421875, 2819.014892578125, 2908.95654296875, 2998.89794921875, 3088.839599609375, 3178.781005859375, 3268.72265625, 3358.6640625, 3448.605712890625, 3538.54736328125, 3628.48876953125, 3718.430419921875, 3808.3720703125, 3898.3134765625, 3988.255126953125, 4078.196533203125, 4168.13818359375, 4258.07958984375, 4348.021484375, 4437.962890625, 4527.904296875, 4617.84619140625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 7.0, 8.0, 16.0, 14.0, 11.0, 20.0, 14.0, 23.0, 33.0, 32.0, 29.0, 43.0, 36.0, 38.0, 40.0, 48.0, 55.0, 39.0, 47.0, 42.0, 35.0, 41.0, 34.0, 34.0, 26.0, 32.0, 21.0, 24.0, 25.0, 24.0, 13.0, 12.0, 15.0, 10.0, 10.0, 10.0, 5.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2362.6376953125, -2295.719482421875, -2228.801025390625, -2161.8828125, -2094.96435546875, -2028.046142578125, -1961.1278076171875, -1894.20947265625, -1827.291259765625, -1760.3729248046875, -1693.45458984375, -1626.536376953125, -1559.6180419921875, -1492.69970703125, -1425.7813720703125, -1358.863037109375, -1291.9447021484375, -1225.0263671875, -1158.1080322265625, -1091.189697265625, -1024.271484375, -957.3531494140625, -890.434814453125, -823.5164794921875, -756.5982055664062, -689.6798706054688, -622.7615966796875, -555.84326171875, -488.9249572753906, -422.00665283203125, -355.08831787109375, -288.1700134277344, -221.2518310546875, -154.33352661132812, -87.41520690917969, -20.49688720703125, 46.421417236328125, 113.3397216796875, 180.258056640625, 247.17636108398438, 314.09466552734375, 381.0129699707031, 447.9312744140625, 514.849609375, 581.7679443359375, 648.6862182617188, 715.6045532226562, 782.5228271484375, 849.441162109375, 916.3594970703125, 983.2777709960938, 1050.196044921875, 1117.1143798828125, 1184.03271484375, 1250.9510498046875, 1317.869384765625, 1384.78759765625, 1451.7059326171875, 1518.624267578125, 1585.54248046875, 1652.4608154296875, 1719.379150390625, 1786.2974853515625, 1853.2158203125, 1920.1341552734375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 3.0, 6.0, 10.0, 4.0, 11.0, 12.0, 20.0, 20.0, 27.0, 37.0, 43.0, 57.0, 74.0, 105.0, 118.0, 173.0, 208.0, 241.0, 307.0, 388.0, 445.0, 706.0, 1042384.0, 852.0, 414.0, 361.0, 328.0, 249.0, 181.0, 168.0, 108.0, 121.0, 81.0, 60.0, 53.0, 43.0, 32.0, 21.0, 19.0, 21.0, 10.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-644.144287109375, -624.9339599609375, -605.7236328125, -586.5133056640625, -567.302978515625, -548.0926513671875, -528.88232421875, -509.6719970703125, -490.461669921875, -471.2513427734375, -452.041015625, -432.8306884765625, -413.620361328125, -394.4100341796875, -375.19970703125, -355.9893798828125, -336.779052734375, -317.5687255859375, -298.3583984375, -279.1480712890625, -259.937744140625, -240.7274169921875, -221.51708984375, -202.3067626953125, -183.096435546875, -163.8861083984375, -144.67578125, -125.4654541015625, -106.255126953125, -87.0447998046875, -67.83447265625, -48.6241455078125, -29.41387939453125, -10.20355224609375, 9.00677490234375, 28.21710205078125, 47.42742919921875, 66.63775634765625, 85.84808349609375, 105.05841064453125, 124.26873779296875, 143.47906494140625, 162.68939208984375, 181.89971923828125, 201.11004638671875, 220.32037353515625, 239.53070068359375, 258.74102783203125, 277.95135498046875, 297.16168212890625, 316.37200927734375, 335.58233642578125, 354.79266357421875, 374.00299072265625, 393.21331787109375, 412.42364501953125, 431.63397216796875, 450.84429931640625, 470.05462646484375, 489.26495361328125, 508.47528076171875, 527.6856079101562, 546.8959350585938, 566.1062622070312, 585.3165893554688]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 1.0, 3.0, 7.0, 7.0, 8.0, 21.0, 35.0, 139.0, 732.0, 51458740.0, 3073.0, 267.0, 45.0, 16.0, 11.0, 7.0, 8.0, 5.0, 7.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6364.0, -6180.9150390625, -5997.82958984375, -5814.74462890625, -5631.6591796875, -5448.57421875, -5265.4892578125, -5082.404296875, -4899.31884765625, -4716.23388671875, -4533.1484375, -4350.0634765625, -4166.978515625, -3983.89306640625, -3800.80810546875, -3617.722900390625, -3434.6376953125, -3251.552490234375, -3068.46728515625, -2885.38232421875, -2702.297119140625, -2519.2119140625, -2336.126953125, -2153.041748046875, -1969.95654296875, -1786.871337890625, -1603.7862548828125, -1420.701171875, -1237.615966796875, -1054.53076171875, -871.4456787109375, -688.360595703125, -505.27490234375, -322.18975830078125, -139.1046142578125, 43.98052978515625, 227.065673828125, 410.15081787109375, 593.2359619140625, 776.321044921875, 959.40625, 1142.491455078125, 1325.5765380859375, 1508.66162109375, 1691.746826171875, 1874.83203125, 2057.9169921875, 2241.002197265625, 2424.08740234375, 2607.172607421875, 2790.2578125, 2973.3427734375, 3156.427978515625, 3339.51318359375, 3522.59814453125, 3705.683349609375, 3888.7685546875, 4071.853759765625, 4254.93896484375, 4438.02392578125, 4621.109375, 4804.1943359375, 4987.279296875, 5170.3642578125, 5353.44970703125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 14.0, 14.0, 23.0, 34.0, 76.0, 104.0, 144.0, 219.0, 313.0, 431.0, 673.0, 976.0, 1594.0, 2312.0, 3457.0, 4866.0, 7065.0, 10137.0, 14722.0, 21380.0, 31257.0, 47808.0, 71968.0, 109112.0, 164913.0, 258077.0, 434661.0, 3249519.0, 871175.0, 346338.0, 216355.0, 140969.0, 92797.0, 61147.0, 40785.0, 27524.0, 18464.0, 12398.0, 8620.0, 5959.0, 4147.0, 2892.0, 2040.0, 1316.0, 890.0, 587.0, 442.0, 245.0, 167.0, 100.0, 66.0, 59.0, 47.0, 15.0, 16.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-11.6640625, -11.285400390625, -10.90673828125, -10.528076171875, -10.1494140625, -9.770751953125, -9.39208984375, -9.013427734375, -8.634765625, -8.256103515625, -7.87744140625, -7.498779296875, -7.1201171875, -6.741455078125, -6.36279296875, -5.984130859375, -5.60546875, -5.226806640625, -4.84814453125, -4.469482421875, -4.0908203125, -3.712158203125, -3.33349609375, -2.954833984375, -2.576171875, -2.197509765625, -1.81884765625, -1.440185546875, -1.0615234375, -0.682861328125, -0.30419921875, 0.074462890625, 0.453125, 0.831787109375, 1.21044921875, 1.589111328125, 1.9677734375, 2.346435546875, 2.72509765625, 3.103759765625, 3.482421875, 3.861083984375, 4.23974609375, 4.618408203125, 4.9970703125, 5.375732421875, 5.75439453125, 6.133056640625, 6.51171875, 6.890380859375, 7.26904296875, 7.647705078125, 8.0263671875, 8.405029296875, 8.78369140625, 9.162353515625, 9.541015625, 9.919677734375, 10.29833984375, 10.677001953125, 11.0556640625, 11.434326171875, 11.81298828125, 12.191650390625, 12.5703125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 6.0, 8.0, 3.0, 7.0, 8.0, 13.0, 13.0, 19.0, 16.0, 17.0, 24.0, 34.0, 29.0, 30.0, 29.0, 38.0, 35.0, 18.0, 39.0, 35.0, 69.0, 1003.0, 78.0, 46.0, 33.0, 36.0, 32.0, 31.0, 30.0, 46.0, 25.0, 17.0, 32.0, 21.0, 18.0, 10.0, 10.0, 12.0, 9.0, 6.0, 5.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-249.75, -242.29296875, -234.8359375, -227.37890625, -219.921875, -212.46484375, -205.0078125, -197.55078125, -190.09375, -182.63671875, -175.1796875, -167.72265625, -160.265625, -152.80859375, -145.3515625, -137.89453125, -130.4375, -122.98046875, -115.5234375, -108.06640625, -100.609375, -93.15234375, -85.6953125, -78.23828125, -70.78125, -63.32421875, -55.8671875, -48.41015625, -40.953125, -33.49609375, -26.0390625, -18.58203125, -11.125, -3.66796875, 3.7890625, 11.24609375, 18.703125, 26.16015625, 33.6171875, 41.07421875, 48.53125, 55.98828125, 63.4453125, 70.90234375, 78.359375, 85.81640625, 93.2734375, 100.73046875, 108.1875, 115.64453125, 123.1015625, 130.55859375, 138.015625, 145.47265625, 152.9296875, 160.38671875, 167.84375, 175.30078125, 182.7578125, 190.21484375, 197.671875, 205.12890625, 212.5859375, 220.04296875, 227.5]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 3.0, 12.0, 19.0, 29.0, 45.0, 57.0, 81.0, 128.0, 156.0, 253.0, 375.0, 548.0, 852.0, 1306.0, 2009.0, 3047.0, 4554.0, 6982.0, 11212.0, 17797.0, 28485.0, 45943.0, 75840.0, 127430.0, 218662.0, 384392.0, 986497.0, 3284066.0, 457390.0, 255694.0, 147315.0, 88187.0, 53487.0, 32636.0, 20339.0, 12713.0, 8007.0, 5199.0, 3333.0, 2109.0, 1367.0, 957.0, 625.0, 425.0, 299.0, 187.0, 116.0, 88.0, 48.0, 40.0, 33.0, 18.0, 14.0, 12.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.0078125, -12.5762939453125, -12.144775390625, -11.7132568359375, -11.28173828125, -10.8502197265625, -10.418701171875, -9.9871826171875, -9.5556640625, -9.1241455078125, -8.692626953125, -8.2611083984375, -7.82958984375, -7.3980712890625, -6.966552734375, -6.5350341796875, -6.103515625, -5.6719970703125, -5.240478515625, -4.8089599609375, -4.37744140625, -3.9459228515625, -3.514404296875, -3.0828857421875, -2.6513671875, -2.2198486328125, -1.788330078125, -1.3568115234375, -0.92529296875, -0.4937744140625, -0.062255859375, 0.3692626953125, 0.80078125, 1.2322998046875, 1.663818359375, 2.0953369140625, 2.52685546875, 2.9583740234375, 3.389892578125, 3.8214111328125, 4.2529296875, 4.6844482421875, 5.115966796875, 5.5474853515625, 5.97900390625, 6.4105224609375, 6.842041015625, 7.2735595703125, 7.705078125, 8.1365966796875, 8.568115234375, 8.9996337890625, 9.43115234375, 9.8626708984375, 10.294189453125, 10.7257080078125, 11.1572265625, 11.5887451171875, 12.020263671875, 12.4517822265625, 12.88330078125, 13.3148193359375, 13.746337890625, 14.1778564453125, 14.609375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 10.0, 7.0, 9.0, 9.0, 17.0, 13.0, 11.0, 22.0, 36.0, 28.0, 21.0, 32.0, 35.0, 39.0, 45.0, 29.0, 46.0, 50.0, 649.0, 454.0, 57.0, 44.0, 47.0, 36.0, 32.0, 38.0, 34.0, 27.0, 22.0, 27.0, 17.0, 15.0, 15.0, 13.0, 9.0, 7.0, 3.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-236.5, -229.091796875, -221.68359375, -214.275390625, -206.8671875, -199.458984375, -192.05078125, -184.642578125, -177.234375, -169.826171875, -162.41796875, -155.009765625, -147.6015625, -140.193359375, -132.78515625, -125.376953125, -117.96875, -110.560546875, -103.15234375, -95.744140625, -88.3359375, -80.927734375, -73.51953125, -66.111328125, -58.703125, -51.294921875, -43.88671875, -36.478515625, -29.0703125, -21.662109375, -14.25390625, -6.845703125, 0.5625, 7.970703125, 15.37890625, 22.787109375, 30.1953125, 37.603515625, 45.01171875, 52.419921875, 59.828125, 67.236328125, 74.64453125, 82.052734375, 89.4609375, 96.869140625, 104.27734375, 111.685546875, 119.09375, 126.501953125, 133.91015625, 141.318359375, 148.7265625, 156.134765625, 163.54296875, 170.951171875, 178.359375, 185.767578125, 193.17578125, 200.583984375, 207.9921875, 215.400390625, 222.80859375, 230.216796875, 237.625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 12.0, 23.0, 21.0, 34.0, 35.0, 46.0, 63.0, 59.0, 67.0, 86.0, 161.0, 242.0, 331.0, 399.0, 609.0, 926.0, 1517.0, 2419.0, 4644.0, 9858.0, 26555.0, 82796.0, 5779369.0, 284438.0, 58881.0, 20009.0, 7806.0, 3799.0, 2000.0, 1256.0, 850.0, 563.0, 409.0, 314.0, 241.0, 136.0, 107.0, 74.0, 47.0, 61.0, 37.0, 36.0, 21.0, 25.0, 18.0, 9.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-84.875, -82.2109375, -79.546875, -76.8828125, -74.21875, -71.5546875, -68.890625, -66.2265625, -63.5625, -60.8984375, -58.234375, -55.5703125, -52.90625, -50.2421875, -47.578125, -44.9140625, -42.25, -39.5859375, -36.921875, -34.2578125, -31.59375, -28.9296875, -26.265625, -23.6015625, -20.9375, -18.2734375, -15.609375, -12.9453125, -10.28125, -7.6171875, -4.953125, -2.2890625, 0.375, 3.0390625, 5.703125, 8.3671875, 11.03125, 13.6953125, 16.359375, 19.0234375, 21.6875, 24.3515625, 27.015625, 29.6796875, 32.34375, 35.0078125, 37.671875, 40.3359375, 43.0, 45.6640625, 48.328125, 50.9921875, 53.65625, 56.3203125, 58.984375, 61.6484375, 64.3125, 66.9765625, 69.640625, 72.3046875, 74.96875, 77.6328125, 80.296875, 82.9609375, 85.625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 5.0, 7.0, 8.0, 10.0, 13.0, 15.0, 16.0, 18.0, 18.0, 26.0, 24.0, 27.0, 31.0, 24.0, 27.0, 36.0, 39.0, 37.0, 31.0, 89.0, 984.0, 61.0, 33.0, 49.0, 39.0, 25.0, 44.0, 32.0, 27.0, 24.0, 27.0, 24.0, 22.0, 17.0, 15.0, 14.0, 15.0, 9.0, 9.0, 7.0, 6.0, 1.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.5, -155.013671875, -149.52734375, -144.041015625, -138.5546875, -133.068359375, -127.58203125, -122.095703125, -116.609375, -111.123046875, -105.63671875, -100.150390625, -94.6640625, -89.177734375, -83.69140625, -78.205078125, -72.71875, -67.232421875, -61.74609375, -56.259765625, -50.7734375, -45.287109375, -39.80078125, -34.314453125, -28.828125, -23.341796875, -17.85546875, -12.369140625, -6.8828125, -1.396484375, 4.08984375, 9.576171875, 15.0625, 20.548828125, 26.03515625, 31.521484375, 37.0078125, 42.494140625, 47.98046875, 53.466796875, 58.953125, 64.439453125, 69.92578125, 75.412109375, 80.8984375, 86.384765625, 91.87109375, 97.357421875, 102.84375, 108.330078125, 113.81640625, 119.302734375, 124.7890625, 130.275390625, 135.76171875, 141.248046875, 146.734375, 152.220703125, 157.70703125, 163.193359375, 168.6796875, 174.166015625, 179.65234375, 185.138671875, 190.625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 4.0, 18.0, 79.0, 654.0, 209.0, 22.0, 8.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-761.0686645507812, -705.44970703125, -649.8306884765625, -594.2117309570312, -538.5927734375, -482.97381591796875, -427.3548278808594, -371.73583984375, -316.11688232421875, -260.4979248046875, -204.87893676757812, -149.2599639892578, -93.6409912109375, -38.02203369140625, 17.596954345703125, 73.2159423828125, 128.83489990234375, 184.45387268066406, 240.07284545898438, 295.69183349609375, 351.310791015625, 406.92974853515625, 462.5487365722656, 518.167724609375, 573.7866821289062, 629.4056396484375, 685.024658203125, 740.6436157226562, 796.2625732421875, 851.8815307617188, 907.50048828125, 963.1195068359375, 1018.738525390625, 1074.3575439453125, 1129.9764404296875, 1185.595458984375, 1241.21435546875, 1296.8333740234375, 1352.452392578125, 1408.0712890625, 1463.6903076171875, 1519.309326171875, 1574.92822265625, 1630.5472412109375, 1686.166259765625, 1741.78515625, 1797.4041748046875, 1853.023193359375, 1908.64208984375, 1964.2611083984375, 2019.8800048828125, 2075.4990234375, 2131.117919921875, 2186.73681640625, 2242.35595703125, 2297.974853515625, 2353.59375, 2409.212646484375, 2464.831787109375, 2520.45068359375, 2576.069580078125, 2631.6884765625, 2687.3076171875, 2742.926513671875, 2798.545654296875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 5.0, 10.0, 12.0, 15.0, 11.0, 18.0, 21.0, 31.0, 29.0, 32.0, 28.0, 38.0, 34.0, 51.0, 45.0, 34.0, 55.0, 46.0, 56.0, 44.0, 36.0, 40.0, 36.0, 43.0, 38.0, 26.0, 28.0, 22.0, 20.0, 23.0, 11.0, 10.0, 8.0, 4.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-505.085205078125, -490.9626770019531, -476.84014892578125, -462.7176208496094, -448.5950927734375, -434.4725646972656, -420.35003662109375, -406.2275390625, -392.10498046875, -377.9824523925781, -363.85992431640625, -349.7373962402344, -335.6148681640625, -321.4923400878906, -307.36981201171875, -293.247314453125, -279.1247863769531, -265.00225830078125, -250.87973022460938, -236.7572021484375, -222.63467407226562, -208.51214599609375, -194.38963317871094, -180.26710510253906, -166.1445770263672, -152.0220489501953, -137.89952087402344, -123.7770004272461, -109.65447235107422, -95.53194427490234, -81.409423828125, -67.28689575195312, -53.16436767578125, -39.041839599609375, -24.919315338134766, -10.796791076660156, 3.3257369995117188, 17.448265075683594, 31.570785522460938, 45.69331359863281, 59.81584167480469, 73.93836975097656, 88.06089782714844, 102.18341827392578, 116.30594635009766, 130.428466796875, 144.55099487304688, 158.67352294921875, 172.79605102539062, 186.9185791015625, 201.04110717773438, 215.16363525390625, 229.28616333007812, 243.40869140625, 257.53118896484375, 271.65374755859375, 285.7762451171875, 299.8987731933594, 314.02130126953125, 328.1438293457031, 342.266357421875, 356.3888854980469, 370.51141357421875, 384.6339111328125, 398.7564697265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 20.0, 13.0, 16.0, 33.0, 31.0, 50.0, 66.0, 81.0, 140.0, 195.0, 287.0, 457.0, 729.0, 1161.0, 2353.0, 6876.0, 26396.0, 211629.0, 3868292.0, 57389.0, 10193.0, 3538.0, 1689.0, 840.0, 564.0, 353.0, 215.0, 187.0, 127.0, 79.0, 59.0, 51.0, 38.0, 26.0, 26.0, 17.0, 9.0, 3.0, 9.0, 5.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-1.4326171875, -1.39306640625, -1.353515625, -1.31396484375, -1.2744140625, -1.23486328125, -1.1953125, -1.15576171875, -1.1162109375, -1.07666015625, -1.037109375, -0.99755859375, -0.9580078125, -0.91845703125, -0.87890625, -0.83935546875, -0.7998046875, -0.76025390625, -0.720703125, -0.68115234375, -0.6416015625, -0.60205078125, -0.5625, -0.52294921875, -0.4833984375, -0.44384765625, -0.404296875, -0.36474609375, -0.3251953125, -0.28564453125, -0.24609375, -0.20654296875, -0.1669921875, -0.12744140625, -0.087890625, -0.04833984375, -0.0087890625, 0.03076171875, 0.0703125, 0.10986328125, 0.1494140625, 0.18896484375, 0.228515625, 0.26806640625, 0.3076171875, 0.34716796875, 0.38671875, 0.42626953125, 0.4658203125, 0.50537109375, 0.544921875, 0.58447265625, 0.6240234375, 0.66357421875, 0.703125, 0.74267578125, 0.7822265625, 0.82177734375, 0.861328125, 0.90087890625, 0.9404296875, 0.97998046875, 1.01953125, 1.05908203125, 1.0986328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 3.0, 10.0, 7.0, 18.0, 16.0, 15.0, 14.0, 46.0, 753.0, 16.0, 12.0, 11.0, 15.0, 6.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7255859375, -1.6790618896484375, -1.632537841796875, -1.5860137939453125, -1.53948974609375, -1.4929656982421875, -1.446441650390625, -1.3999176025390625, -1.3533935546875, -1.3068695068359375, -1.260345458984375, -1.2138214111328125, -1.16729736328125, -1.1207733154296875, -1.074249267578125, -1.0277252197265625, -0.981201171875, -0.9346771240234375, -0.888153076171875, -0.8416290283203125, -0.79510498046875, -0.7485809326171875, -0.702056884765625, -0.6555328369140625, -0.6090087890625, -0.5624847412109375, -0.515960693359375, -0.4694366455078125, -0.42291259765625, -0.3763885498046875, -0.329864501953125, -0.2833404541015625, -0.23681640625, -0.1902923583984375, -0.143768310546875, -0.0972442626953125, -0.05072021484375, -0.0041961669921875, 0.042327880859375, 0.0888519287109375, 0.1353759765625, 0.1819000244140625, 0.228424072265625, 0.2749481201171875, 0.32147216796875, 0.3679962158203125, 0.414520263671875, 0.4610443115234375, 0.507568359375, 0.5540924072265625, 0.600616455078125, 0.6471405029296875, 0.69366455078125, 0.7401885986328125, 0.786712646484375, 0.8332366943359375, 0.8797607421875, 0.9262847900390625, 0.972808837890625, 1.0193328857421875, 1.06585693359375, 1.1123809814453125, 1.158905029296875, 1.2054290771484375, 1.251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 4.0, 9.0, 4.0, 16.0, 23.0, 49.0, 75.0, 138.0, 268.0, 404.0, 783.0, 1890.0, 6363.0, 40366.0, 3853301.0, 267262.0, 16978.0, 3675.0, 1274.0, 582.0, 319.0, 182.0, 106.0, 71.0, 30.0, 27.0, 24.0, 16.0, 7.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.970703125, -2.88525390625, -2.7998046875, -2.71435546875, -2.62890625, -2.54345703125, -2.4580078125, -2.37255859375, -2.287109375, -2.20166015625, -2.1162109375, -2.03076171875, -1.9453125, -1.85986328125, -1.7744140625, -1.68896484375, -1.603515625, -1.51806640625, -1.4326171875, -1.34716796875, -1.26171875, -1.17626953125, -1.0908203125, -1.00537109375, -0.919921875, -0.83447265625, -0.7490234375, -0.66357421875, -0.578125, -0.49267578125, -0.4072265625, -0.32177734375, -0.236328125, -0.15087890625, -0.0654296875, 0.02001953125, 0.10546875, 0.19091796875, 0.2763671875, 0.36181640625, 0.447265625, 0.53271484375, 0.6181640625, 0.70361328125, 0.7890625, 0.87451171875, 0.9599609375, 1.04541015625, 1.130859375, 1.21630859375, 1.3017578125, 1.38720703125, 1.47265625, 1.55810546875, 1.6435546875, 1.72900390625, 1.814453125, 1.89990234375, 1.9853515625, 2.07080078125, 2.15625, 2.24169921875, 2.3271484375, 2.41259765625, 2.498046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 13.0, 11.0, 27.0, 27.0, 57.0, 171.0, 999.0, 2127.0, 358.0, 111.0, 59.0, 35.0, 33.0, 19.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.375, -1.3224945068359375, -1.269989013671875, -1.2174835205078125, -1.16497802734375, -1.1124725341796875, -1.059967041015625, -1.0074615478515625, -0.9549560546875, -0.9024505615234375, -0.849945068359375, -0.7974395751953125, -0.74493408203125, -0.6924285888671875, -0.639923095703125, -0.5874176025390625, -0.534912109375, -0.4824066162109375, -0.429901123046875, -0.3773956298828125, -0.32489013671875, -0.2723846435546875, -0.219879150390625, -0.1673736572265625, -0.1148681640625, -0.0623626708984375, -0.009857177734375, 0.0426483154296875, 0.09515380859375, 0.1476593017578125, 0.200164794921875, 0.2526702880859375, 0.30517578125, 0.3576812744140625, 0.410186767578125, 0.4626922607421875, 0.51519775390625, 0.5677032470703125, 0.620208740234375, 0.6727142333984375, 0.7252197265625, 0.7777252197265625, 0.830230712890625, 0.8827362060546875, 0.93524169921875, 0.9877471923828125, 1.040252685546875, 1.0927581787109375, 1.145263671875, 1.1977691650390625, 1.250274658203125, 1.3027801513671875, 1.35528564453125, 1.4077911376953125, 1.460296630859375, 1.5128021240234375, 1.5653076171875, 1.6178131103515625, 1.670318603515625, 1.7228240966796875, 1.77532958984375, 1.8278350830078125, 1.880340576171875, 1.9328460693359375, 1.9853515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 19.0, 99.0, 568.0, 225.0, 41.0, 18.0, 13.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.887177467346191, -5.6007080078125, -5.314238548278809, -5.027769565582275, -4.741300106048584, -4.454830646514893, -4.168361663818359, -3.881892204284668, -3.5954227447509766, -3.308953285217285, -3.022484064102173, -2.7360148429870605, -2.449545383453369, -2.1630759239196777, -1.8766067028045654, -1.5901374816894531, -1.3036680221557617, -1.0171986818313599, -0.730729341506958, -0.44426000118255615, -0.1577906608581543, 0.12867867946624756, 0.4151480197906494, 0.7016172409057617, 0.9880867004394531, 1.274556040763855, 1.5610253810882568, 1.8474947214126587, 2.1339640617370605, 2.420433521270752, 2.7069027423858643, 2.9933719635009766, 3.2798423767089844, 3.566311836242676, 3.852781057357788, 4.1392502784729, 4.425719738006592, 4.712189197540283, 4.998658180236816, 5.285127639770508, 5.571597099304199, 5.858066558837891, 6.144536018371582, 6.431005001068115, 6.717474460601807, 7.003943920135498, 7.290412902832031, 7.576882362365723, 7.863351821899414, 8.149821281433105, 8.436290740966797, 8.722760200500488, 9.00922966003418, 9.295698165893555, 9.582167625427246, 9.868637084960938, 10.155106544494629, 10.44157600402832, 10.728045463562012, 11.014514923095703, 11.300983428955078, 11.58745288848877, 11.873922348022461, 12.160391807556152, 12.446861267089844]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 5.0, 6.0, 10.0, 11.0, 16.0, 19.0, 28.0, 29.0, 29.0, 38.0, 40.0, 47.0, 60.0, 68.0, 74.0, 64.0, 65.0, 62.0, 48.0, 49.0, 45.0, 30.0, 32.0, 23.0, 26.0, 15.0, 10.0, 9.0, 5.0, 8.0, 10.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8867177963256836, -3.758209466934204, -3.6297011375427246, -3.501192569732666, -3.3726842403411865, -3.244175910949707, -3.1156673431396484, -2.987159013748169, -2.8586506843566895, -2.73014235496521, -2.6016340255737305, -2.473125457763672, -2.3446171283721924, -2.216108798980713, -2.0876002311706543, -1.9590919017791748, -1.8305835723876953, -1.7020752429962158, -1.5735667943954468, -1.4450583457946777, -1.3165500164031982, -1.1880416870117188, -1.0595332384109497, -0.9310248494148254, -0.8025164604187012, -0.6740080714225769, -0.5454996824264526, -0.41699129343032837, -0.2884829044342041, -0.15997451543807983, -0.031466126441955566, 0.0970422625541687, 0.22555017471313477, 0.35405856370925903, 0.4825669527053833, 0.6110753417015076, 0.7395837306976318, 0.8680921196937561, 0.9966005086898804, 1.1251089572906494, 1.253617286682129, 1.3821256160736084, 1.5106340646743774, 1.6391425132751465, 1.767650842666626, 1.8961591720581055, 2.024667739868164, 2.1531760692596436, 2.281684398651123, 2.4101927280426025, 2.538701057434082, 2.6672096252441406, 2.79571795463562, 2.9242262840270996, 3.052734851837158, 3.1812431812286377, 3.309751510620117, 3.4382598400115967, 3.566768169403076, 3.6952767372131348, 3.8237850666046143, 3.9522933959960938, 4.080801963806152, 4.209310054779053, 4.337818622589111]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 10.0, 19.0, 22.0, 29.0, 37.0, 51.0, 73.0, 114.0, 151.0, 257.0, 331.0, 531.0, 945.0, 1522.0, 2851.0, 5412.0, 11555.0, 30966.0, 899650.0, 58858.0, 18227.0, 7822.0, 3773.0, 2066.0, 1180.0, 721.0, 459.0, 308.0, 194.0, 130.0, 97.0, 66.0, 36.0, 25.0, 17.0, 12.0, 11.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.99609375, -6.76092529296875, -6.5257568359375, -6.29058837890625, -6.055419921875, -5.82025146484375, -5.5850830078125, -5.34991455078125, -5.11474609375, -4.87957763671875, -4.6444091796875, -4.40924072265625, -4.174072265625, -3.93890380859375, -3.7037353515625, -3.46856689453125, -3.2333984375, -2.99822998046875, -2.7630615234375, -2.52789306640625, -2.292724609375, -2.05755615234375, -1.8223876953125, -1.58721923828125, -1.35205078125, -1.11688232421875, -0.8817138671875, -0.64654541015625, -0.411376953125, -0.17620849609375, 0.0589599609375, 0.29412841796875, 0.529296875, 0.76446533203125, 0.9996337890625, 1.23480224609375, 1.469970703125, 1.70513916015625, 1.9403076171875, 2.17547607421875, 2.41064453125, 2.64581298828125, 2.8809814453125, 3.11614990234375, 3.351318359375, 3.58648681640625, 3.8216552734375, 4.05682373046875, 4.2919921875, 4.52716064453125, 4.7623291015625, 4.99749755859375, 5.232666015625, 5.46783447265625, 5.7030029296875, 5.93817138671875, 6.17333984375, 6.40850830078125, 6.6436767578125, 6.87884521484375, 7.114013671875, 7.34918212890625, 7.5843505859375, 7.81951904296875, 8.0546875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 6.0, 6.0, 8.0, 8.0, 12.0, 19.0, 18.0, 11.0, 100.0, 697.0, 19.0, 12.0, 13.0, 12.0, 7.0, 11.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.701171875, -1.6553802490234375, -1.609588623046875, -1.5637969970703125, -1.51800537109375, -1.4722137451171875, -1.426422119140625, -1.3806304931640625, -1.3348388671875, -1.2890472412109375, -1.243255615234375, -1.1974639892578125, -1.15167236328125, -1.1058807373046875, -1.060089111328125, -1.0142974853515625, -0.968505859375, -0.9227142333984375, -0.876922607421875, -0.8311309814453125, -0.78533935546875, -0.7395477294921875, -0.693756103515625, -0.6479644775390625, -0.6021728515625, -0.5563812255859375, -0.510589599609375, -0.4647979736328125, -0.41900634765625, -0.3732147216796875, -0.327423095703125, -0.2816314697265625, -0.23583984375, -0.1900482177734375, -0.144256591796875, -0.0984649658203125, -0.05267333984375, -0.0068817138671875, 0.038909912109375, 0.0847015380859375, 0.1304931640625, 0.1762847900390625, 0.222076416015625, 0.2678680419921875, 0.31365966796875, 0.3594512939453125, 0.405242919921875, 0.4510345458984375, 0.496826171875, 0.5426177978515625, 0.588409423828125, 0.6342010498046875, 0.67999267578125, 0.7257843017578125, 0.771575927734375, 0.8173675537109375, 0.8631591796875, 0.9089508056640625, 0.954742431640625, 1.0005340576171875, 1.04632568359375, 1.0921173095703125, 1.137908935546875, 1.1837005615234375, 1.2294921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 8.0, 7.0, 10.0, 18.0, 23.0, 29.0, 30.0, 49.0, 67.0, 83.0, 117.0, 165.0, 219.0, 342.0, 560.0, 1119.0, 2521.0, 6407.0, 19815.0, 70906.0, 411260.0, 429807.0, 72548.0, 20486.0, 6534.0, 2475.0, 1051.0, 612.0, 388.0, 237.0, 181.0, 143.0, 92.0, 68.0, 52.0, 32.0, 29.0, 21.0, 14.0, 11.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.86328125, -3.742584228515625, -3.62188720703125, -3.501190185546875, -3.3804931640625, -3.259796142578125, -3.13909912109375, -3.018402099609375, -2.897705078125, -2.777008056640625, -2.65631103515625, -2.535614013671875, -2.4149169921875, -2.294219970703125, -2.17352294921875, -2.052825927734375, -1.93212890625, -1.811431884765625, -1.69073486328125, -1.570037841796875, -1.4493408203125, -1.328643798828125, -1.20794677734375, -1.087249755859375, -0.966552734375, -0.845855712890625, -0.72515869140625, -0.604461669921875, -0.4837646484375, -0.363067626953125, -0.24237060546875, -0.121673583984375, -0.0009765625, 0.119720458984375, 0.24041748046875, 0.361114501953125, 0.4818115234375, 0.602508544921875, 0.72320556640625, 0.843902587890625, 0.964599609375, 1.085296630859375, 1.20599365234375, 1.326690673828125, 1.4473876953125, 1.568084716796875, 1.68878173828125, 1.809478759765625, 1.93017578125, 2.050872802734375, 2.17156982421875, 2.292266845703125, 2.4129638671875, 2.533660888671875, 2.65435791015625, 2.775054931640625, 2.895751953125, 3.016448974609375, 3.13714599609375, 3.257843017578125, 3.3785400390625, 3.499237060546875, 3.61993408203125, 3.740631103515625, 3.861328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 6.0, 8.0, 9.0, 12.0, 9.0, 15.0, 25.0, 32.0, 23.0, 31.0, 30.0, 27.0, 32.0, 42.0, 49.0, 33.0, 35.0, 57.0, 48.0, 43.0, 42.0, 36.0, 49.0, 29.0, 24.0, 33.0, 32.0, 27.0, 25.0, 27.0, 24.0, 17.0, 12.0, 9.0, 6.0, 8.0, 6.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.05078125, -4.909576416015625, -4.76837158203125, -4.627166748046875, -4.4859619140625, -4.344757080078125, -4.20355224609375, -4.062347412109375, -3.921142578125, -3.779937744140625, -3.63873291015625, -3.497528076171875, -3.3563232421875, -3.215118408203125, -3.07391357421875, -2.932708740234375, -2.79150390625, -2.650299072265625, -2.50909423828125, -2.367889404296875, -2.2266845703125, -2.085479736328125, -1.94427490234375, -1.803070068359375, -1.661865234375, -1.520660400390625, -1.37945556640625, -1.238250732421875, -1.0970458984375, -0.955841064453125, -0.81463623046875, -0.673431396484375, -0.5322265625, -0.391021728515625, -0.24981689453125, -0.108612060546875, 0.0325927734375, 0.173797607421875, 0.31500244140625, 0.456207275390625, 0.597412109375, 0.738616943359375, 0.87982177734375, 1.021026611328125, 1.1622314453125, 1.303436279296875, 1.44464111328125, 1.585845947265625, 1.72705078125, 1.868255615234375, 2.00946044921875, 2.150665283203125, 2.2918701171875, 2.433074951171875, 2.57427978515625, 2.715484619140625, 2.856689453125, 2.997894287109375, 3.13909912109375, 3.280303955078125, 3.4215087890625, 3.562713623046875, 3.70391845703125, 3.845123291015625, 3.986328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 6.0, 16.0, 24.0, 32.0, 60.0, 109.0, 226.0, 588.0, 3062.0, 131591.0, 907127.0, 4392.0, 795.0, 230.0, 120.0, 67.0, 38.0, 16.0, 19.0, 10.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.10565185546875, -5.9027099609375, -5.69976806640625, -5.496826171875, -5.29388427734375, -5.0909423828125, -4.88800048828125, -4.68505859375, -4.48211669921875, -4.2791748046875, -4.07623291015625, -3.873291015625, -3.67034912109375, -3.4674072265625, -3.26446533203125, -3.0615234375, -2.85858154296875, -2.6556396484375, -2.45269775390625, -2.249755859375, -2.04681396484375, -1.8438720703125, -1.64093017578125, -1.43798828125, -1.23504638671875, -1.0321044921875, -0.82916259765625, -0.626220703125, -0.42327880859375, -0.2203369140625, -0.01739501953125, 0.185546875, 0.38848876953125, 0.5914306640625, 0.79437255859375, 0.997314453125, 1.20025634765625, 1.4031982421875, 1.60614013671875, 1.80908203125, 2.01202392578125, 2.2149658203125, 2.41790771484375, 2.620849609375, 2.82379150390625, 3.0267333984375, 3.22967529296875, 3.4326171875, 3.63555908203125, 3.8385009765625, 4.04144287109375, 4.244384765625, 4.44732666015625, 4.6502685546875, 4.85321044921875, 5.05615234375, 5.25909423828125, 5.4620361328125, 5.66497802734375, 5.867919921875, 6.07086181640625, 6.2738037109375, 6.47674560546875, 6.6796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 7.0, 2.0, 4.0, 7.0, 5.0, 7.0, 17.0, 25.0, 32.0, 78.0, 134.0, 228.0, 211.0, 111.0, 57.0, 32.0, 17.0, 8.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019419193267822266, -0.00018637441098690033, -0.000178556889295578, -0.00017073936760425568, -0.00016292184591293335, -0.00015510432422161102, -0.0001472868025302887, -0.00013946928083896637, -0.00013165175914764404, -0.00012383423745632172, -0.00011601671576499939, -0.00010819919407367706, -0.00010038167238235474, -9.256415069103241e-05, -8.474662899971008e-05, -7.692910730838776e-05, -6.911158561706543e-05, -6.12940639257431e-05, -5.3476542234420776e-05, -4.565902054309845e-05, -3.784149885177612e-05, -3.0023977160453796e-05, -2.220645546913147e-05, -1.4388933777809143e-05, -6.571412086486816e-06, 1.2461096048355103e-06, 9.063631296157837e-06, 1.6881152987480164e-05, 2.469867467880249e-05, 3.251619637012482e-05, 4.0333718061447144e-05, 4.815123975276947e-05, 5.59687614440918e-05, 6.378628313541412e-05, 7.160380482673645e-05, 7.942132651805878e-05, 8.72388482093811e-05, 9.505636990070343e-05, 0.00010287389159202576, 0.00011069141328334808, 0.00011850893497467041, 0.00012632645666599274, 0.00013414397835731506, 0.0001419615000486374, 0.00014977902173995972, 0.00015759654343128204, 0.00016541406512260437, 0.0001732315868139267, 0.00018104910850524902, 0.00018886663019657135, 0.00019668415188789368, 0.000204501673579216, 0.00021231919527053833, 0.00022013671696186066, 0.00022795423865318298, 0.0002357717603445053, 0.00024358928203582764, 0.00025140680372714996, 0.0002592243254184723, 0.0002670418471097946, 0.00027485936880111694, 0.00028267689049243927, 0.0002904944121837616, 0.0002983119338750839, 0.00030612945556640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 23.0, 49.0, 62.0, 140.0, 275.0, 618.0, 1748.0, 8358.0, 126964.0, 878715.0, 26208.0, 3461.0, 1064.0, 420.0, 191.0, 90.0, 47.0, 40.0, 17.0, 11.0, 7.0, 6.0, 10.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.900390625, -2.807586669921875, -2.71478271484375, -2.621978759765625, -2.5291748046875, -2.436370849609375, -2.34356689453125, -2.250762939453125, -2.157958984375, -2.065155029296875, -1.97235107421875, -1.879547119140625, -1.7867431640625, -1.693939208984375, -1.60113525390625, -1.508331298828125, -1.41552734375, -1.322723388671875, -1.22991943359375, -1.137115478515625, -1.0443115234375, -0.951507568359375, -0.85870361328125, -0.765899658203125, -0.673095703125, -0.580291748046875, -0.48748779296875, -0.394683837890625, -0.3018798828125, -0.209075927734375, -0.11627197265625, -0.023468017578125, 0.0693359375, 0.162139892578125, 0.25494384765625, 0.347747802734375, 0.4405517578125, 0.533355712890625, 0.62615966796875, 0.718963623046875, 0.811767578125, 0.904571533203125, 0.99737548828125, 1.090179443359375, 1.1829833984375, 1.275787353515625, 1.36859130859375, 1.461395263671875, 1.55419921875, 1.647003173828125, 1.73980712890625, 1.832611083984375, 1.9254150390625, 2.018218994140625, 2.11102294921875, 2.203826904296875, 2.296630859375, 2.389434814453125, 2.48223876953125, 2.575042724609375, 2.6678466796875, 2.760650634765625, 2.85345458984375, 2.946258544921875, 3.0390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 17.0, 23.0, 20.0, 35.0, 41.0, 76.0, 121.0, 159.0, 124.0, 124.0, 71.0, 50.0, 36.0, 33.0, 18.0, 17.0, 5.0, 10.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7314453125, -1.6410980224609375, -1.550750732421875, -1.4604034423828125, -1.37005615234375, -1.2797088623046875, -1.189361572265625, -1.0990142822265625, -1.0086669921875, -0.9183197021484375, -0.827972412109375, -0.7376251220703125, -0.64727783203125, -0.5569305419921875, -0.466583251953125, -0.3762359619140625, -0.285888671875, -0.1955413818359375, -0.105194091796875, -0.0148468017578125, 0.07550048828125, 0.1658477783203125, 0.256195068359375, 0.3465423583984375, 0.4368896484375, 0.5272369384765625, 0.617584228515625, 0.7079315185546875, 0.79827880859375, 0.8886260986328125, 0.978973388671875, 1.0693206787109375, 1.15966796875, 1.2500152587890625, 1.340362548828125, 1.4307098388671875, 1.52105712890625, 1.6114044189453125, 1.701751708984375, 1.7920989990234375, 1.8824462890625, 1.9727935791015625, 2.063140869140625, 2.1534881591796875, 2.24383544921875, 2.3341827392578125, 2.424530029296875, 2.5148773193359375, 2.605224609375, 2.6955718994140625, 2.785919189453125, 2.8762664794921875, 2.96661376953125, 3.0569610595703125, 3.147308349609375, 3.2376556396484375, 3.3280029296875, 3.4183502197265625, 3.508697509765625, 3.5990447998046875, 3.68939208984375, 3.7797393798828125, 3.870086669921875, 3.9604339599609375, 4.05078125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 9.0, 19.0, 66.0, 228.0, 403.0, 146.0, 49.0, 32.0, 17.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.96891784667969, -49.4395751953125, -47.91023254394531, -46.38089370727539, -44.8515510559082, -43.322208404541016, -41.79286575317383, -40.263526916503906, -38.73418426513672, -37.20484161376953, -35.675498962402344, -34.14616012573242, -32.616817474365234, -31.087474822998047, -29.55813217163086, -28.028791427612305, -26.499448776245117, -24.97010612487793, -23.440765380859375, -21.911422729492188, -20.382081985473633, -18.852739334106445, -17.32339859008789, -15.794055938720703, -14.264714241027832, -12.735372543334961, -11.20603084564209, -9.676689147949219, -8.147346496582031, -6.618005275726318, -5.088663101196289, -3.559321403503418, -2.029979705810547, -0.5006378889083862, 1.0287039279937744, 2.5580458641052246, 4.087387561798096, 5.616729259490967, 7.146071434020996, 8.675413131713867, 10.204754829406738, 11.73409652709961, 13.26343822479248, 14.792779922485352, 16.32212257385254, 17.851463317871094, 19.38080596923828, 20.91014862060547, 22.439489364624023, 23.96883201599121, 25.498172760009766, 27.027515411376953, 28.556856155395508, 30.086198806762695, 31.61553955078125, 33.14488220214844, 34.674224853515625, 36.20356750488281, 37.73291015625, 39.26224899291992, 40.79159164428711, 42.3209342956543, 43.850276947021484, 45.379615783691406, 46.908958435058594]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 3.0, 2.0, 6.0, 7.0, 6.0, 9.0, 18.0, 22.0, 47.0, 92.0, 152.0, 201.0, 165.0, 89.0, 72.0, 40.0, 17.0, 14.0, 5.0, 1.0, 4.0, 10.0, 4.0, 5.0, 2.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.03308868408203, -82.68578338623047, -79.3384780883789, -75.99117279052734, -72.64386749267578, -69.29656219482422, -65.94924926757812, -62.60194778442383, -59.254642486572266, -55.9073371887207, -52.56003189086914, -49.21272277832031, -45.86541748046875, -42.51811218261719, -39.170806884765625, -35.82350158691406, -32.4761962890625, -29.128890991210938, -25.781585693359375, -22.43427848815918, -19.086973190307617, -15.739667892456055, -12.39236068725586, -9.045055389404297, -5.697750091552734, -2.3504443168640137, 0.996861457824707, 4.344167709350586, 7.691473007202148, 11.038778305053711, 14.386085510253906, 17.73339080810547, 21.080703735351562, 24.428009033203125, 27.775314331054688, 31.122621536254883, 34.46992492675781, 37.817230224609375, 41.1645393371582, 44.511844635009766, 47.85914993286133, 51.20645523071289, 54.55376052856445, 57.90106964111328, 61.248374938964844, 64.5956802368164, 67.94298553466797, 71.29029083251953, 74.6375961303711, 77.98490142822266, 81.33220672607422, 84.67951202392578, 88.02681732177734, 91.3741226196289, 94.721435546875, 98.06874084472656, 101.41604614257812, 104.76335144042969, 108.11065673828125, 111.45796203613281, 114.80526733398438, 118.15257263183594, 121.4998779296875, 124.84718322753906, 128.19448852539062]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 8.0, 12.0, 24.0, 18.0, 42.0, 44.0, 73.0, 123.0, 212.0, 458.0, 1096.0, 3227.0, 13571.0, 220700.0, 3923682.0, 23733.0, 4650.0, 1421.0, 577.0, 252.0, 127.0, 76.0, 53.0, 21.0, 14.0, 10.0, 13.0, 6.0, 6.0, 12.0, 3.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.359375, -16.850830078125, -16.34228515625, -15.833740234375, -15.3251953125, -14.816650390625, -14.30810546875, -13.799560546875, -13.291015625, -12.782470703125, -12.27392578125, -11.765380859375, -11.2568359375, -10.748291015625, -10.23974609375, -9.731201171875, -9.22265625, -8.714111328125, -8.20556640625, -7.697021484375, -7.1884765625, -6.679931640625, -6.17138671875, -5.662841796875, -5.154296875, -4.645751953125, -4.13720703125, -3.628662109375, -3.1201171875, -2.611572265625, -2.10302734375, -1.594482421875, -1.0859375, -0.577392578125, -0.06884765625, 0.439697265625, 0.9482421875, 1.456787109375, 1.96533203125, 2.473876953125, 2.982421875, 3.490966796875, 3.99951171875, 4.508056640625, 5.0166015625, 5.525146484375, 6.03369140625, 6.542236328125, 7.05078125, 7.559326171875, 8.06787109375, 8.576416015625, 9.0849609375, 9.593505859375, 10.10205078125, 10.610595703125, 11.119140625, 11.627685546875, 12.13623046875, 12.644775390625, 13.1533203125, 13.661865234375, 14.17041015625, 14.678955078125, 15.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 3.0, 1.0, 7.0, 5.0, 5.0, 8.0, 3.0, 6.0, 8.0, 15.0, 9.0, 20.0, 44.0, 299.0, 409.0, 57.0, 17.0, 12.0, 13.0, 9.0, 5.0, 11.0, 6.0, 8.0, 4.0, 3.0, 7.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1572265625, -1.1251678466796875, -1.093109130859375, -1.0610504150390625, -1.02899169921875, -0.9969329833984375, -0.964874267578125, -0.9328155517578125, -0.9007568359375, -0.8686981201171875, -0.836639404296875, -0.8045806884765625, -0.77252197265625, -0.7404632568359375, -0.708404541015625, -0.6763458251953125, -0.644287109375, -0.6122283935546875, -0.580169677734375, -0.5481109619140625, -0.51605224609375, -0.4839935302734375, -0.451934814453125, -0.4198760986328125, -0.3878173828125, -0.3557586669921875, -0.323699951171875, -0.2916412353515625, -0.25958251953125, -0.2275238037109375, -0.195465087890625, -0.1634063720703125, -0.13134765625, -0.0992889404296875, -0.067230224609375, -0.0351715087890625, -0.00311279296875, 0.0289459228515625, 0.061004638671875, 0.0930633544921875, 0.1251220703125, 0.1571807861328125, 0.189239501953125, 0.2212982177734375, 0.25335693359375, 0.2854156494140625, 0.317474365234375, 0.3495330810546875, 0.381591796875, 0.4136505126953125, 0.445709228515625, 0.4777679443359375, 0.50982666015625, 0.5418853759765625, 0.573944091796875, 0.6060028076171875, 0.6380615234375, 0.6701202392578125, 0.702178955078125, 0.7342376708984375, 0.76629638671875, 0.7983551025390625, 0.830413818359375, 0.8624725341796875, 0.89453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 6.0, 2.0, 9.0, 11.0, 25.0, 22.0, 41.0, 52.0, 106.0, 138.0, 220.0, 348.0, 595.0, 1100.0, 2318.0, 6097.0, 22553.0, 164164.0, 3797586.0, 163408.0, 23757.0, 6480.0, 2514.0, 1091.0, 604.0, 367.0, 224.0, 117.0, 78.0, 67.0, 52.0, 35.0, 21.0, 21.0, 18.0, 9.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.32537841796875, -5.1663818359375, -5.00738525390625, -4.848388671875, -4.68939208984375, -4.5303955078125, -4.37139892578125, -4.21240234375, -4.05340576171875, -3.8944091796875, -3.73541259765625, -3.576416015625, -3.41741943359375, -3.2584228515625, -3.09942626953125, -2.9404296875, -2.78143310546875, -2.6224365234375, -2.46343994140625, -2.304443359375, -2.14544677734375, -1.9864501953125, -1.82745361328125, -1.66845703125, -1.50946044921875, -1.3504638671875, -1.19146728515625, -1.032470703125, -0.87347412109375, -0.7144775390625, -0.55548095703125, -0.396484375, -0.23748779296875, -0.0784912109375, 0.08050537109375, 0.239501953125, 0.39849853515625, 0.5574951171875, 0.71649169921875, 0.87548828125, 1.03448486328125, 1.1934814453125, 1.35247802734375, 1.511474609375, 1.67047119140625, 1.8294677734375, 1.98846435546875, 2.1474609375, 2.30645751953125, 2.4654541015625, 2.62445068359375, 2.783447265625, 2.94244384765625, 3.1014404296875, 3.26043701171875, 3.41943359375, 3.57843017578125, 3.7374267578125, 3.89642333984375, 4.055419921875, 4.21441650390625, 4.3734130859375, 4.53240966796875, 4.69140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 8.0, 5.0, 5.0, 14.0, 11.0, 20.0, 15.0, 37.0, 43.0, 71.0, 126.0, 292.0, 847.0, 1640.0, 365.0, 176.0, 113.0, 64.0, 49.0, 33.0, 27.0, 22.0, 28.0, 15.0, 13.0, 7.0, 5.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.0957489013671875, -1.060638427734375, -1.0255279541015625, -0.99041748046875, -0.9553070068359375, -0.920196533203125, -0.8850860595703125, -0.8499755859375, -0.8148651123046875, -0.779754638671875, -0.7446441650390625, -0.70953369140625, -0.6744232177734375, -0.639312744140625, -0.6042022705078125, -0.569091796875, -0.5339813232421875, -0.498870849609375, -0.4637603759765625, -0.42864990234375, -0.3935394287109375, -0.358428955078125, -0.3233184814453125, -0.2882080078125, -0.2530975341796875, -0.217987060546875, -0.1828765869140625, -0.14776611328125, -0.1126556396484375, -0.077545166015625, -0.0424346923828125, -0.00732421875, 0.0277862548828125, 0.062896728515625, 0.0980072021484375, 0.13311767578125, 0.1682281494140625, 0.203338623046875, 0.2384490966796875, 0.2735595703125, 0.3086700439453125, 0.343780517578125, 0.3788909912109375, 0.41400146484375, 0.4491119384765625, 0.484222412109375, 0.5193328857421875, 0.554443359375, 0.5895538330078125, 0.624664306640625, 0.6597747802734375, 0.69488525390625, 0.7299957275390625, 0.765106201171875, 0.8002166748046875, 0.8353271484375, 0.8704376220703125, 0.905548095703125, 0.9406585693359375, 0.97576904296875, 1.0108795166015625, 1.045989990234375, 1.0811004638671875, 1.1162109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 12.0, 357.0, 594.0, 35.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.282752990722656, -40.3668212890625, -39.450889587402344, -38.53495788574219, -37.61902618408203, -36.703094482421875, -35.78716278076172, -34.8712272644043, -33.95529556274414, -33.039363861083984, -32.12343215942383, -31.207500457763672, -30.291566848754883, -29.375635147094727, -28.45970344543457, -27.543771743774414, -26.627840042114258, -25.7119083404541, -24.795976638793945, -23.880043029785156, -22.964111328125, -22.048179626464844, -21.132247924804688, -20.21631622314453, -19.300384521484375, -18.38445281982422, -17.468521118164062, -16.552589416503906, -15.636655807495117, -14.720724105834961, -13.804792404174805, -12.888860702514648, -11.97292709350586, -11.056995391845703, -10.14106273651123, -9.225131034851074, -8.309198379516602, -7.393266677856445, -6.477334976196289, -5.561402797698975, -4.64547061920166, -3.7295384407043457, -2.8136065006256104, -1.897674560546875, -0.9817423820495605, -0.0658102035522461, 0.8501214981079102, 1.7660536766052246, 2.681985855102539, 3.5979180335998535, 4.513850212097168, 5.429781913757324, 6.345714092254639, 7.261646270751953, 8.17757797241211, 9.093509674072266, 10.009442329406738, 10.925374031066895, 11.841306686401367, 12.757238388061523, 13.67317008972168, 14.589102745056152, 15.505034446716309, 16.42096710205078, 17.336898803710938]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 12.0, 6.0, 15.0, 22.0, 23.0, 47.0, 42.0, 56.0, 73.0, 86.0, 95.0, 79.0, 90.0, 77.0, 76.0, 47.0, 30.0, 34.0, 17.0, 11.0, 12.0, 11.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.129861831665039, -6.933475971221924, -6.737090587615967, -6.540704727172852, -6.3443193435668945, -6.147933483123779, -5.951547622680664, -5.755162239074707, -5.558776378631592, -5.362390518188477, -5.1660051345825195, -4.969619274139404, -4.773233413696289, -4.576848030090332, -4.380462169647217, -4.184076309204102, -3.9876909255981445, -3.7913053035736084, -3.5949196815490723, -3.398533821105957, -3.202148199081421, -3.0057625770568848, -2.8093767166137695, -2.6129910945892334, -2.4166054725646973, -2.220219850540161, -2.023834228515625, -1.8274483680725098, -1.6310627460479736, -1.4346771240234375, -1.2382913827896118, -1.0419056415557861, -0.84552001953125, -0.6491343379020691, -0.4527486562728882, -0.2563629746437073, -0.05997729301452637, 0.13640838861465454, 0.33279407024383545, 0.5291798114776611, 0.7255654335021973, 0.9219511151313782, 1.118336796760559, 1.3147225379943848, 1.511108160018921, 1.707493782043457, 1.9038795232772827, 2.1002652645111084, 2.2966508865356445, 2.4930365085601807, 2.689422130584717, 2.885807991027832, 3.082193613052368, 3.2785792350769043, 3.4749650955200195, 3.6713507175445557, 3.867736339569092, 4.064122200012207, 4.260507583618164, 4.456893444061279, 4.6532793045043945, 4.849664688110352, 5.046050548553467, 5.242436408996582, 5.438821792602539]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 0.0, 6.0, 6.0, 5.0, 14.0, 12.0, 33.0, 44.0, 63.0, 96.0, 164.0, 227.0, 400.0, 715.0, 1438.0, 3060.0, 6935.0, 19345.0, 146845.0, 823575.0, 28486.0, 9283.0, 3827.0, 1799.0, 912.0, 494.0, 245.0, 179.0, 104.0, 84.0, 38.0, 34.0, 31.0, 19.0, 10.0, 9.0, 4.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.2105712890625, -7.928955078125, -7.6473388671875, -7.36572265625, -7.0841064453125, -6.802490234375, -6.5208740234375, -6.2392578125, -5.9576416015625, -5.676025390625, -5.3944091796875, -5.11279296875, -4.8311767578125, -4.549560546875, -4.2679443359375, -3.986328125, -3.7047119140625, -3.423095703125, -3.1414794921875, -2.85986328125, -2.5782470703125, -2.296630859375, -2.0150146484375, -1.7333984375, -1.4517822265625, -1.170166015625, -0.8885498046875, -0.60693359375, -0.3253173828125, -0.043701171875, 0.2379150390625, 0.51953125, 0.8011474609375, 1.082763671875, 1.3643798828125, 1.64599609375, 1.9276123046875, 2.209228515625, 2.4908447265625, 2.7724609375, 3.0540771484375, 3.335693359375, 3.6173095703125, 3.89892578125, 4.1805419921875, 4.462158203125, 4.7437744140625, 5.025390625, 5.3070068359375, 5.588623046875, 5.8702392578125, 6.15185546875, 6.4334716796875, 6.715087890625, 6.9967041015625, 7.2783203125, 7.5599365234375, 7.841552734375, 8.1231689453125, 8.40478515625, 8.6864013671875, 8.968017578125, 9.2496337890625, 9.53125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 3.0, 5.0, 11.0, 14.0, 12.0, 15.0, 46.0, 211.0, 394.0, 146.0, 39.0, 15.0, 12.0, 13.0, 11.0, 9.0, 5.0, 4.0, 3.0, 3.0, 6.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.306640625, -1.2734909057617188, -1.2403411865234375, -1.2071914672851562, -1.174041748046875, -1.1408920288085938, -1.1077423095703125, -1.0745925903320312, -1.04144287109375, -1.0082931518554688, -0.9751434326171875, -0.9419937133789062, -0.908843994140625, -0.8756942749023438, -0.8425445556640625, -0.8093948364257812, -0.7762451171875, -0.7430953979492188, -0.7099456787109375, -0.6767959594726562, -0.643646240234375, -0.6104965209960938, -0.5773468017578125, -0.5441970825195312, -0.51104736328125, -0.47789764404296875, -0.4447479248046875, -0.41159820556640625, -0.378448486328125, -0.34529876708984375, -0.3121490478515625, -0.27899932861328125, -0.245849609375, -0.21269989013671875, -0.1795501708984375, -0.14640045166015625, -0.113250732421875, -0.08010101318359375, -0.0469512939453125, -0.01380157470703125, 0.01934814453125, 0.05249786376953125, 0.0856475830078125, 0.11879730224609375, 0.151947021484375, 0.18509674072265625, 0.2182464599609375, 0.25139617919921875, 0.2845458984375, 0.31769561767578125, 0.3508453369140625, 0.38399505615234375, 0.417144775390625, 0.45029449462890625, 0.4834442138671875, 0.5165939331054688, 0.54974365234375, 0.5828933715820312, 0.6160430908203125, 0.6491928100585938, 0.682342529296875, 0.7154922485351562, 0.7486419677734375, 0.7817916870117188, 0.81494140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 2.0, 6.0, 9.0, 16.0, 9.0, 10.0, 23.0, 31.0, 47.0, 48.0, 84.0, 114.0, 139.0, 247.0, 471.0, 924.0, 2076.0, 5933.0, 21718.0, 109853.0, 673711.0, 185699.0, 32791.0, 8998.0, 2931.0, 1162.0, 525.0, 305.0, 185.0, 141.0, 78.0, 71.0, 32.0, 37.0, 25.0, 31.0, 14.0, 13.0, 10.0, 8.0, 7.0, 3.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.6796875, -4.54052734375, -4.4013671875, -4.26220703125, -4.123046875, -3.98388671875, -3.8447265625, -3.70556640625, -3.56640625, -3.42724609375, -3.2880859375, -3.14892578125, -3.009765625, -2.87060546875, -2.7314453125, -2.59228515625, -2.453125, -2.31396484375, -2.1748046875, -2.03564453125, -1.896484375, -1.75732421875, -1.6181640625, -1.47900390625, -1.33984375, -1.20068359375, -1.0615234375, -0.92236328125, -0.783203125, -0.64404296875, -0.5048828125, -0.36572265625, -0.2265625, -0.08740234375, 0.0517578125, 0.19091796875, 0.330078125, 0.46923828125, 0.6083984375, 0.74755859375, 0.88671875, 1.02587890625, 1.1650390625, 1.30419921875, 1.443359375, 1.58251953125, 1.7216796875, 1.86083984375, 2.0, 2.13916015625, 2.2783203125, 2.41748046875, 2.556640625, 2.69580078125, 2.8349609375, 2.97412109375, 3.11328125, 3.25244140625, 3.3916015625, 3.53076171875, 3.669921875, 3.80908203125, 3.9482421875, 4.08740234375, 4.2265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 9.0, 8.0, 6.0, 7.0, 17.0, 21.0, 16.0, 20.0, 33.0, 30.0, 39.0, 31.0, 37.0, 35.0, 42.0, 40.0, 40.0, 41.0, 59.0, 46.0, 29.0, 44.0, 46.0, 33.0, 30.0, 35.0, 35.0, 21.0, 20.0, 14.0, 16.0, 16.0, 16.0, 11.0, 7.0, 11.0, 11.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.759765625, -2.678253173828125, -2.59674072265625, -2.515228271484375, -2.4337158203125, -2.352203369140625, -2.27069091796875, -2.189178466796875, -2.107666015625, -2.026153564453125, -1.94464111328125, -1.863128662109375, -1.7816162109375, -1.700103759765625, -1.61859130859375, -1.537078857421875, -1.45556640625, -1.374053955078125, -1.29254150390625, -1.211029052734375, -1.1295166015625, -1.048004150390625, -0.96649169921875, -0.884979248046875, -0.803466796875, -0.721954345703125, -0.64044189453125, -0.558929443359375, -0.4774169921875, -0.395904541015625, -0.31439208984375, -0.232879638671875, -0.1513671875, -0.069854736328125, 0.01165771484375, 0.093170166015625, 0.1746826171875, 0.256195068359375, 0.33770751953125, 0.419219970703125, 0.500732421875, 0.582244873046875, 0.66375732421875, 0.745269775390625, 0.8267822265625, 0.908294677734375, 0.98980712890625, 1.071319580078125, 1.15283203125, 1.234344482421875, 1.31585693359375, 1.397369384765625, 1.4788818359375, 1.560394287109375, 1.64190673828125, 1.723419189453125, 1.804931640625, 1.886444091796875, 1.96795654296875, 2.049468994140625, 2.1309814453125, 2.212493896484375, 2.29400634765625, 2.375518798828125, 2.45703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 9.0, 10.0, 12.0, 13.0, 31.0, 78.0, 153.0, 398.0, 1670.0, 58078.0, 984153.0, 2934.0, 605.0, 207.0, 95.0, 49.0, 26.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-18.359375, -17.9527587890625, -17.546142578125, -17.1395263671875, -16.73291015625, -16.3262939453125, -15.919677734375, -15.5130615234375, -15.1064453125, -14.6998291015625, -14.293212890625, -13.8865966796875, -13.47998046875, -13.0733642578125, -12.666748046875, -12.2601318359375, -11.853515625, -11.4468994140625, -11.040283203125, -10.6336669921875, -10.22705078125, -9.8204345703125, -9.413818359375, -9.0072021484375, -8.6005859375, -8.1939697265625, -7.787353515625, -7.3807373046875, -6.97412109375, -6.5675048828125, -6.160888671875, -5.7542724609375, -5.34765625, -4.9410400390625, -4.534423828125, -4.1278076171875, -3.72119140625, -3.3145751953125, -2.907958984375, -2.5013427734375, -2.0947265625, -1.6881103515625, -1.281494140625, -0.8748779296875, -0.46826171875, -0.0616455078125, 0.344970703125, 0.7515869140625, 1.158203125, 1.5648193359375, 1.971435546875, 2.3780517578125, 2.78466796875, 3.1912841796875, 3.597900390625, 4.0045166015625, 4.4111328125, 4.8177490234375, 5.224365234375, 5.6309814453125, 6.03759765625, 6.4442138671875, 6.850830078125, 7.2574462890625, 7.6640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 17.0, 28.0, 54.0, 114.0, 326.0, 263.0, 104.0, 42.0, 18.0, 12.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030040740966796875, -0.00028727203607559204, -0.00027413666248321533, -0.0002610012888908386, -0.0002478659152984619, -0.0002347305417060852, -0.0002215951681137085, -0.0002084597945213318, -0.00019532442092895508, -0.00018218904733657837, -0.00016905367374420166, -0.00015591830015182495, -0.00014278292655944824, -0.00012964755296707153, -0.00011651217937469482, -0.00010337680578231812, -9.02414321899414e-05, -7.71060585975647e-05, -6.397068500518799e-05, -5.083531141281128e-05, -3.769993782043457e-05, -2.456456422805786e-05, -1.1429190635681152e-05, 1.7061829566955566e-06, 1.4841556549072266e-05, 2.7976930141448975e-05, 4.1112303733825684e-05, 5.424767732620239e-05, 6.73830509185791e-05, 8.051842451095581e-05, 9.365379810333252e-05, 0.00010678917169570923, 0.00011992454528808594, 0.00013305991888046265, 0.00014619529247283936, 0.00015933066606521606, 0.00017246603965759277, 0.00018560141324996948, 0.0001987367868423462, 0.0002118721604347229, 0.0002250075340270996, 0.00023814290761947632, 0.00025127828121185303, 0.00026441365480422974, 0.00027754902839660645, 0.00029068440198898315, 0.00030381977558135986, 0.00031695514917373657, 0.0003300905227661133, 0.00034322589635849, 0.0003563612699508667, 0.0003694966435432434, 0.0003826320171356201, 0.0003957673907279968, 0.00040890276432037354, 0.00042203813791275024, 0.00043517351150512695, 0.00044830888509750366, 0.00046144425868988037, 0.0004745796322822571, 0.0004877150058746338, 0.0005008503794670105, 0.0005139857530593872, 0.0005271211266517639, 0.0005402565002441406]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 11.0, 22.0, 42.0, 79.0, 211.0, 520.0, 1615.0, 12039.0, 922308.0, 105681.0, 4464.0, 908.0, 290.0, 132.0, 92.0, 59.0, 24.0, 13.0, 9.0, 8.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.466796875, -4.26171875, -4.056640625, -3.8515625, -3.646484375, -3.44140625, -3.236328125, -3.03125, -2.826171875, -2.62109375, -2.416015625, -2.2109375, -2.005859375, -1.80078125, -1.595703125, -1.390625, -1.185546875, -0.98046875, -0.775390625, -0.5703125, -0.365234375, -0.16015625, 0.044921875, 0.25, 0.455078125, 0.66015625, 0.865234375, 1.0703125, 1.275390625, 1.48046875, 1.685546875, 1.890625, 2.095703125, 2.30078125, 2.505859375, 2.7109375, 2.916015625, 3.12109375, 3.326171875, 3.53125, 3.736328125, 3.94140625, 4.146484375, 4.3515625, 4.556640625, 4.76171875, 4.966796875, 5.171875, 5.376953125, 5.58203125, 5.787109375, 5.9921875, 6.197265625, 6.40234375, 6.607421875, 6.8125, 7.017578125, 7.22265625, 7.427734375, 7.6328125, 7.837890625, 8.04296875, 8.248046875, 8.453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 7.0, 6.0, 12.0, 15.0, 30.0, 52.0, 85.0, 129.0, 214.0, 165.0, 119.0, 69.0, 31.0, 27.0, 15.0, 12.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.488983154296875, -2.37445068359375, -2.259918212890625, -2.1453857421875, -2.030853271484375, -1.91632080078125, -1.801788330078125, -1.687255859375, -1.572723388671875, -1.45819091796875, -1.343658447265625, -1.2291259765625, -1.114593505859375, -1.00006103515625, -0.885528564453125, -0.77099609375, -0.656463623046875, -0.54193115234375, -0.427398681640625, -0.3128662109375, -0.198333740234375, -0.08380126953125, 0.030731201171875, 0.145263671875, 0.259796142578125, 0.37432861328125, 0.488861083984375, 0.6033935546875, 0.717926025390625, 0.83245849609375, 0.946990966796875, 1.0615234375, 1.176055908203125, 1.29058837890625, 1.405120849609375, 1.5196533203125, 1.634185791015625, 1.74871826171875, 1.863250732421875, 1.977783203125, 2.092315673828125, 2.20684814453125, 2.321380615234375, 2.4359130859375, 2.550445556640625, 2.66497802734375, 2.779510498046875, 2.89404296875, 3.008575439453125, 3.12310791015625, 3.237640380859375, 3.3521728515625, 3.466705322265625, 3.58123779296875, 3.695770263671875, 3.810302734375, 3.924835205078125, 4.03936767578125, 4.153900146484375, 4.2684326171875, 4.382965087890625, 4.49749755859375, 4.612030029296875, 4.7265625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 11.0, 17.0, 61.0, 173.0, 412.0, 213.0, 47.0, 30.0, 15.0, 10.0, 7.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.90705871582031, -37.78193283081055, -36.65680694580078, -35.531681060791016, -34.40655517578125, -33.28142547607422, -32.15629959106445, -31.031173706054688, -29.906047821044922, -28.780921936035156, -27.65579605102539, -26.530668258666992, -25.405542373657227, -24.28041648864746, -23.155288696289062, -22.030162811279297, -20.90503692626953, -19.779911041259766, -18.65478515625, -17.5296573638916, -16.404531478881836, -15.27940559387207, -14.154278755187988, -13.029151916503906, -11.90402603149414, -10.778900146484375, -9.653773307800293, -8.528646469116211, -7.403520584106445, -6.2783942222595215, -5.153267860412598, -4.028141498565674, -2.9030113220214844, -1.7778849601745605, -0.6527585983276367, 0.4723677635192871, 1.597494125366211, 2.7226204872131348, 3.8477468490600586, 4.972873210906982, 6.097999572753906, 7.22312593460083, 8.348252296447754, 9.473379135131836, 10.598505020141602, 11.723630905151367, 12.84875774383545, 13.973884582519531, 15.099010467529297, 16.224136352539062, 17.349262237548828, 18.474390029907227, 19.599515914916992, 20.724641799926758, 21.849769592285156, 22.974895477294922, 24.100021362304688, 25.225147247314453, 26.35027313232422, 27.475400924682617, 28.600526809692383, 29.72565269470215, 30.850780487060547, 31.975906372070312, 33.10103225708008]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 6.0, 1.0, 4.0, 5.0, 3.0, 21.0, 28.0, 28.0, 35.0, 56.0, 69.0, 68.0, 93.0, 104.0, 97.0, 94.0, 52.0, 58.0, 45.0, 33.0, 20.0, 17.0, 14.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-39.178199768066406, -38.16204833984375, -37.145896911621094, -36.12974548339844, -35.11359405517578, -34.09743881225586, -33.0812873840332, -32.06513595581055, -31.04898452758789, -30.032833099365234, -29.016681671142578, -28.00052833557129, -26.984376907348633, -25.968225479125977, -24.952072143554688, -23.93592071533203, -22.919769287109375, -21.90361785888672, -20.887466430664062, -19.871313095092773, -18.855161666870117, -17.83901023864746, -16.822856903076172, -15.806705474853516, -14.79055404663086, -13.774402618408203, -12.75825023651123, -11.742097854614258, -10.725946426391602, -9.709794998168945, -8.693642616271973, -7.677490711212158, -6.661338806152344, -5.645186901092529, -4.629034996032715, -3.6128830909729004, -2.596731185913086, -1.5805792808532715, -0.564427375793457, 0.4517245292663574, 1.4678764343261719, 2.4840283393859863, 3.500180244445801, 4.516332149505615, 5.53248405456543, 6.548635959625244, 7.564787864685059, 8.580940246582031, 9.597091674804688, 10.613243103027344, 11.629395484924316, 12.645547866821289, 13.661699295043945, 14.677850723266602, 15.694003105163574, 16.710155487060547, 17.726306915283203, 18.74245834350586, 19.758609771728516, 20.774763107299805, 21.79091453552246, 22.807065963745117, 23.823219299316406, 24.839370727539062, 25.85552215576172]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 3.0, 7.0, 5.0, 8.0, 22.0, 25.0, 26.0, 25.0, 43.0, 46.0, 90.0, 121.0, 207.0, 356.0, 701.0, 1394.0, 3434.0, 21099.0, 4143697.0, 16756.0, 3477.0, 1379.0, 625.0, 329.0, 149.0, 111.0, 47.0, 41.0, 22.0, 9.0, 7.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.125, -36.159423828125, -35.19384765625, -34.228271484375, -33.2626953125, -32.297119140625, -31.33154296875, -30.365966796875, -29.400390625, -28.434814453125, -27.46923828125, -26.503662109375, -25.5380859375, -24.572509765625, -23.60693359375, -22.641357421875, -21.67578125, -20.710205078125, -19.74462890625, -18.779052734375, -17.8134765625, -16.847900390625, -15.88232421875, -14.916748046875, -13.951171875, -12.985595703125, -12.02001953125, -11.054443359375, -10.0888671875, -9.123291015625, -8.15771484375, -7.192138671875, -6.2265625, -5.260986328125, -4.29541015625, -3.329833984375, -2.3642578125, -1.398681640625, -0.43310546875, 0.532470703125, 1.498046875, 2.463623046875, 3.42919921875, 4.394775390625, 5.3603515625, 6.325927734375, 7.29150390625, 8.257080078125, 9.22265625, 10.188232421875, 11.15380859375, 12.119384765625, 13.0849609375, 14.050537109375, 15.01611328125, 15.981689453125, 16.947265625, 17.912841796875, 18.87841796875, 19.843994140625, 20.8095703125, 21.775146484375, 22.74072265625, 23.706298828125, 24.671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 4.0, 9.0, 7.0, 7.0, 10.0, 10.0, 22.0, 70.0, 213.0, 279.0, 194.0, 72.0, 25.0, 16.0, 13.0, 13.0, 10.0, 4.0, 9.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.291015625, -1.2574920654296875, -1.223968505859375, -1.1904449462890625, -1.15692138671875, -1.1233978271484375, -1.089874267578125, -1.0563507080078125, -1.0228271484375, -0.9893035888671875, -0.955780029296875, -0.9222564697265625, -0.88873291015625, -0.8552093505859375, -0.821685791015625, -0.7881622314453125, -0.754638671875, -0.7211151123046875, -0.687591552734375, -0.6540679931640625, -0.62054443359375, -0.5870208740234375, -0.553497314453125, -0.5199737548828125, -0.4864501953125, -0.4529266357421875, -0.419403076171875, -0.3858795166015625, -0.35235595703125, -0.3188323974609375, -0.285308837890625, -0.2517852783203125, -0.21826171875, -0.1847381591796875, -0.151214599609375, -0.1176910400390625, -0.08416748046875, -0.0506439208984375, -0.017120361328125, 0.0164031982421875, 0.0499267578125, 0.0834503173828125, 0.116973876953125, 0.1504974365234375, 0.18402099609375, 0.2175445556640625, 0.251068115234375, 0.2845916748046875, 0.318115234375, 0.3516387939453125, 0.385162353515625, 0.4186859130859375, 0.45220947265625, 0.4857330322265625, 0.519256591796875, 0.5527801513671875, 0.5863037109375, 0.6198272705078125, 0.653350830078125, 0.6868743896484375, 0.72039794921875, 0.7539215087890625, 0.787445068359375, 0.8209686279296875, 0.8544921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 5.0, 1.0, 5.0, 7.0, 11.0, 33.0, 16.0, 42.0, 92.0, 322.0, 2304.0, 68467.0, 4114475.0, 7421.0, 712.0, 178.0, 55.0, 39.0, 24.0, 13.0, 11.0, 14.0, 1.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -19.964599609375, -19.25732421875, -18.550048828125, -17.8427734375, -17.135498046875, -16.42822265625, -15.720947265625, -15.013671875, -14.306396484375, -13.59912109375, -12.891845703125, -12.1845703125, -11.477294921875, -10.77001953125, -10.062744140625, -9.35546875, -8.648193359375, -7.94091796875, -7.233642578125, -6.5263671875, -5.819091796875, -5.11181640625, -4.404541015625, -3.697265625, -2.989990234375, -2.28271484375, -1.575439453125, -0.8681640625, -0.160888671875, 0.54638671875, 1.253662109375, 1.9609375, 2.668212890625, 3.37548828125, 4.082763671875, 4.7900390625, 5.497314453125, 6.20458984375, 6.911865234375, 7.619140625, 8.326416015625, 9.03369140625, 9.740966796875, 10.4482421875, 11.155517578125, 11.86279296875, 12.570068359375, 13.27734375, 13.984619140625, 14.69189453125, 15.399169921875, 16.1064453125, 16.813720703125, 17.52099609375, 18.228271484375, 18.935546875, 19.642822265625, 20.35009765625, 21.057373046875, 21.7646484375, 22.471923828125, 23.17919921875, 23.886474609375, 24.59375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 9.0, 7.0, 3.0, 9.0, 13.0, 13.0, 14.0, 20.0, 33.0, 44.0, 107.0, 244.0, 2068.0, 1025.0, 203.0, 86.0, 40.0, 33.0, 20.0, 22.0, 17.0, 7.0, 4.0, 4.0, 2.0, 7.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3125, -1.2737579345703125, -1.235015869140625, -1.1962738037109375, -1.15753173828125, -1.1187896728515625, -1.080047607421875, -1.0413055419921875, -1.0025634765625, -0.9638214111328125, -0.925079345703125, -0.8863372802734375, -0.84759521484375, -0.8088531494140625, -0.770111083984375, -0.7313690185546875, -0.692626953125, -0.6538848876953125, -0.615142822265625, -0.5764007568359375, -0.53765869140625, -0.4989166259765625, -0.460174560546875, -0.4214324951171875, -0.3826904296875, -0.3439483642578125, -0.305206298828125, -0.2664642333984375, -0.22772216796875, -0.1889801025390625, -0.150238037109375, -0.1114959716796875, -0.07275390625, -0.0340118408203125, 0.004730224609375, 0.0434722900390625, 0.08221435546875, 0.1209564208984375, 0.159698486328125, 0.1984405517578125, 0.2371826171875, 0.2759246826171875, 0.314666748046875, 0.3534088134765625, 0.39215087890625, 0.4308929443359375, 0.469635009765625, 0.5083770751953125, 0.547119140625, 0.5858612060546875, 0.624603271484375, 0.6633453369140625, 0.70208740234375, 0.7408294677734375, 0.779571533203125, 0.8183135986328125, 0.8570556640625, 0.8957977294921875, 0.934539794921875, 0.9732818603515625, 1.01202392578125, 1.0507659912109375, 1.089508056640625, 1.1282501220703125, 1.1669921875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 9.0, 51.0, 538.0, 361.0, 37.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.613154172897339, -3.001356601715088, -2.389558792114258, -1.7777612209320068, -1.1659636497497559, -0.5541660785675049, 0.057631731033325195, 0.6694290637969971, 1.2812268733978271, 1.8930244445800781, 2.504822254180908, 3.116619825363159, 3.72841739654541, 4.340214729309082, 4.95201301574707, 5.563810348510742, 6.175607681274414, 6.787405490875244, 7.399202823638916, 8.011000633239746, 8.622797966003418, 9.234596252441406, 9.846393585205078, 10.45819091796875, 11.069989204406738, 11.68178653717041, 12.293584823608398, 12.90538215637207, 13.517179489135742, 14.128976821899414, 14.740775108337402, 15.352572441101074, 15.96436882019043, 16.5761661529541, 17.187963485717773, 17.799762725830078, 18.41156005859375, 19.023357391357422, 19.635154724121094, 20.246952056884766, 20.858749389648438, 21.47054672241211, 22.08234405517578, 22.694141387939453, 23.305940628051758, 23.91773796081543, 24.5295352935791, 25.141332626342773, 25.753131866455078, 26.36492919921875, 26.976726531982422, 27.588523864746094, 28.2003231048584, 28.81212043762207, 29.423917770385742, 30.035715103149414, 30.647512435913086, 31.259309768676758, 31.87110710144043, 32.482906341552734, 33.094703674316406, 33.70650100708008, 34.31829833984375, 34.93009567260742, 35.541893005371094]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 6.0, 10.0, 12.0, 13.0, 24.0, 25.0, 32.0, 34.0, 41.0, 68.0, 58.0, 59.0, 64.0, 69.0, 72.0, 74.0, 46.0, 44.0, 46.0, 31.0, 29.0, 19.0, 28.0, 16.0, 12.0, 12.0, 4.0, 8.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.197154998779297, -4.068259239196777, -3.9393632411956787, -3.81046724319458, -3.6815712451934814, -3.552675247192383, -3.4237794876098633, -3.2948834896087646, -3.165987491607666, -3.0370914936065674, -2.908195734024048, -2.779299736022949, -2.6504037380218506, -2.521507740020752, -2.3926119804382324, -2.263715982437134, -2.1348202228546143, -2.0059242248535156, -1.8770283460617065, -1.7481324672698975, -1.6192364692687988, -1.4903405904769897, -1.3614447116851807, -1.232548713684082, -1.103652834892273, -0.9747568964958191, -0.8458609580993652, -0.7169650793075562, -0.5880691409111023, -0.45917320251464844, -0.33027732372283936, -0.2013813853263855, -0.07248544692993164, 0.05641047656536102, 0.1853064000606537, 0.31420230865478516, 0.443098247051239, 0.5719941854476929, 0.700890064239502, 0.8297860026359558, 0.9586819410324097, 1.0875778198242188, 1.2164738178253174, 1.3453696966171265, 1.4742655754089355, 1.6031615734100342, 1.7320574522018433, 1.8609533309936523, 1.989849328994751, 2.1187453269958496, 2.247641086578369, 2.3765370845794678, 2.5054330825805664, 2.634328842163086, 2.7632248401641846, 2.892120838165283, 3.0210165977478027, 3.1499125957489014, 3.278808355331421, 3.4077043533325195, 3.536600351333618, 3.665496349334717, 3.7943921089172363, 3.923288106918335, 4.052184104919434]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 8.0, 3.0, 11.0, 13.0, 15.0, 33.0, 35.0, 68.0, 89.0, 163.0, 286.0, 541.0, 1185.0, 3178.0, 12237.0, 286225.0, 721703.0, 16159.0, 3765.0, 1398.0, 601.0, 339.0, 185.0, 113.0, 67.0, 42.0, 33.0, 14.0, 14.0, 7.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.159912109375, -10.81201171875, -10.464111328125, -10.1162109375, -9.768310546875, -9.42041015625, -9.072509765625, -8.724609375, -8.376708984375, -8.02880859375, -7.680908203125, -7.3330078125, -6.985107421875, -6.63720703125, -6.289306640625, -5.94140625, -5.593505859375, -5.24560546875, -4.897705078125, -4.5498046875, -4.201904296875, -3.85400390625, -3.506103515625, -3.158203125, -2.810302734375, -2.46240234375, -2.114501953125, -1.7666015625, -1.418701171875, -1.07080078125, -0.722900390625, -0.375, -0.027099609375, 0.32080078125, 0.668701171875, 1.0166015625, 1.364501953125, 1.71240234375, 2.060302734375, 2.408203125, 2.756103515625, 3.10400390625, 3.451904296875, 3.7998046875, 4.147705078125, 4.49560546875, 4.843505859375, 5.19140625, 5.539306640625, 5.88720703125, 6.235107421875, 6.5830078125, 6.930908203125, 7.27880859375, 7.626708984375, 7.974609375, 8.322509765625, 8.67041015625, 9.018310546875, 9.3662109375, 9.714111328125, 10.06201171875, 10.409912109375, 10.7578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 10.0, 9.0, 5.0, 5.0, 30.0, 83.0, 171.0, 294.0, 207.0, 95.0, 30.0, 16.0, 14.0, 8.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.2699127197265625, -1.236114501953125, -1.2023162841796875, -1.16851806640625, -1.1347198486328125, -1.100921630859375, -1.0671234130859375, -1.0333251953125, -0.9995269775390625, -0.965728759765625, -0.9319305419921875, -0.89813232421875, -0.8643341064453125, -0.830535888671875, -0.7967376708984375, -0.762939453125, -0.7291412353515625, -0.695343017578125, -0.6615447998046875, -0.62774658203125, -0.5939483642578125, -0.560150146484375, -0.5263519287109375, -0.4925537109375, -0.4587554931640625, -0.424957275390625, -0.3911590576171875, -0.35736083984375, -0.3235626220703125, -0.289764404296875, -0.2559661865234375, -0.22216796875, -0.1883697509765625, -0.154571533203125, -0.1207733154296875, -0.08697509765625, -0.0531768798828125, -0.019378662109375, 0.0144195556640625, 0.0482177734375, 0.0820159912109375, 0.115814208984375, 0.1496124267578125, 0.18341064453125, 0.2172088623046875, 0.251007080078125, 0.2848052978515625, 0.318603515625, 0.3524017333984375, 0.386199951171875, 0.4199981689453125, 0.45379638671875, 0.4875946044921875, 0.521392822265625, 0.5551910400390625, 0.5889892578125, 0.6227874755859375, 0.656585693359375, 0.6903839111328125, 0.72418212890625, 0.7579803466796875, 0.791778564453125, 0.8255767822265625, 0.859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 10.0, 11.0, 15.0, 30.0, 22.0, 36.0, 53.0, 82.0, 119.0, 154.0, 222.0, 364.0, 527.0, 966.0, 2078.0, 5582.0, 20175.0, 104869.0, 637844.0, 226023.0, 34504.0, 8536.0, 3053.0, 1307.0, 711.0, 410.0, 254.0, 161.0, 112.0, 86.0, 57.0, 32.0, 31.0, 35.0, 16.0, 13.0, 11.0, 12.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0], "bins": [-4.94921875, -4.810516357421875, -4.67181396484375, -4.533111572265625, -4.3944091796875, -4.255706787109375, -4.11700439453125, -3.978302001953125, -3.839599609375, -3.700897216796875, -3.56219482421875, -3.423492431640625, -3.2847900390625, -3.146087646484375, -3.00738525390625, -2.868682861328125, -2.72998046875, -2.591278076171875, -2.45257568359375, -2.313873291015625, -2.1751708984375, -2.036468505859375, -1.89776611328125, -1.759063720703125, -1.620361328125, -1.481658935546875, -1.34295654296875, -1.204254150390625, -1.0655517578125, -0.926849365234375, -0.78814697265625, -0.649444580078125, -0.5107421875, -0.372039794921875, -0.23333740234375, -0.094635009765625, 0.0440673828125, 0.182769775390625, 0.32147216796875, 0.460174560546875, 0.598876953125, 0.737579345703125, 0.87628173828125, 1.014984130859375, 1.1536865234375, 1.292388916015625, 1.43109130859375, 1.569793701171875, 1.70849609375, 1.847198486328125, 1.98590087890625, 2.124603271484375, 2.2633056640625, 2.402008056640625, 2.54071044921875, 2.679412841796875, 2.818115234375, 2.956817626953125, 3.09552001953125, 3.234222412109375, 3.3729248046875, 3.511627197265625, 3.65032958984375, 3.789031982421875, 3.927734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 6.0, 14.0, 13.0, 25.0, 19.0, 20.0, 27.0, 27.0, 26.0, 35.0, 28.0, 46.0, 46.0, 49.0, 51.0, 51.0, 56.0, 51.0, 42.0, 60.0, 50.0, 31.0, 35.0, 47.0, 22.0, 20.0, 15.0, 7.0, 18.0, 6.0, 9.0, 7.0, 3.0, 4.0, 2.0, 7.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.884765625, -2.7984619140625, -2.712158203125, -2.6258544921875, -2.53955078125, -2.4532470703125, -2.366943359375, -2.2806396484375, -2.1943359375, -2.1080322265625, -2.021728515625, -1.9354248046875, -1.84912109375, -1.7628173828125, -1.676513671875, -1.5902099609375, -1.50390625, -1.4176025390625, -1.331298828125, -1.2449951171875, -1.15869140625, -1.0723876953125, -0.986083984375, -0.8997802734375, -0.8134765625, -0.7271728515625, -0.640869140625, -0.5545654296875, -0.46826171875, -0.3819580078125, -0.295654296875, -0.2093505859375, -0.123046875, -0.0367431640625, 0.049560546875, 0.1358642578125, 0.22216796875, 0.3084716796875, 0.394775390625, 0.4810791015625, 0.5673828125, 0.6536865234375, 0.739990234375, 0.8262939453125, 0.91259765625, 0.9989013671875, 1.085205078125, 1.1715087890625, 1.2578125, 1.3441162109375, 1.430419921875, 1.5167236328125, 1.60302734375, 1.6893310546875, 1.775634765625, 1.8619384765625, 1.9482421875, 2.0345458984375, 2.120849609375, 2.2071533203125, 2.29345703125, 2.3797607421875, 2.466064453125, 2.5523681640625, 2.638671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 5.0, 8.0, 10.0, 13.0, 22.0, 26.0, 48.0, 87.0, 124.0, 273.0, 653.0, 2242.0, 17740.0, 798127.0, 219262.0, 7368.0, 1461.0, 521.0, 248.0, 109.0, 69.0, 35.0, 33.0, 20.0, 20.0, 8.0, 4.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.22265625, -4.10479736328125, -3.9869384765625, -3.86907958984375, -3.751220703125, -3.63336181640625, -3.5155029296875, -3.39764404296875, -3.27978515625, -3.16192626953125, -3.0440673828125, -2.92620849609375, -2.808349609375, -2.69049072265625, -2.5726318359375, -2.45477294921875, -2.3369140625, -2.21905517578125, -2.1011962890625, -1.98333740234375, -1.865478515625, -1.74761962890625, -1.6297607421875, -1.51190185546875, -1.39404296875, -1.27618408203125, -1.1583251953125, -1.04046630859375, -0.922607421875, -0.80474853515625, -0.6868896484375, -0.56903076171875, -0.451171875, -0.33331298828125, -0.2154541015625, -0.09759521484375, 0.020263671875, 0.13812255859375, 0.2559814453125, 0.37384033203125, 0.49169921875, 0.60955810546875, 0.7274169921875, 0.84527587890625, 0.963134765625, 1.08099365234375, 1.1988525390625, 1.31671142578125, 1.4345703125, 1.55242919921875, 1.6702880859375, 1.78814697265625, 1.906005859375, 2.02386474609375, 2.1417236328125, 2.25958251953125, 2.37744140625, 2.49530029296875, 2.6131591796875, 2.73101806640625, 2.848876953125, 2.96673583984375, 3.0845947265625, 3.20245361328125, 3.3203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 9.0, 10.0, 10.0, 19.0, 28.0, 36.0, 40.0, 69.0, 106.0, 147.0, 117.0, 128.0, 73.0, 62.0, 47.0, 24.0, 15.0, 18.0, 8.0, 6.0, 9.0, 5.0, 2.0, 2.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002161264419555664, -0.00020964257419109344, -0.00020315870642662048, -0.00019667483866214752, -0.00019019097089767456, -0.0001837071031332016, -0.00017722323536872864, -0.00017073936760425568, -0.00016425549983978271, -0.00015777163207530975, -0.0001512877643108368, -0.00014480389654636383, -0.00013832002878189087, -0.0001318361610174179, -0.00012535229325294495, -0.00011886842548847198, -0.00011238455772399902, -0.00010590068995952606, -9.94168221950531e-05, -9.293295443058014e-05, -8.644908666610718e-05, -7.996521890163422e-05, -7.348135113716125e-05, -6.69974833726883e-05, -6.051361560821533e-05, -5.402974784374237e-05, -4.754588007926941e-05, -4.106201231479645e-05, -3.4578144550323486e-05, -2.8094276785850525e-05, -2.1610409021377563e-05, -1.5126541256904602e-05, -8.64267349243164e-06, -2.158805727958679e-06, 4.325062036514282e-06, 1.0808929800987244e-05, 1.7292797565460205e-05, 2.3776665329933167e-05, 3.0260533094406128e-05, 3.674440085887909e-05, 4.322826862335205e-05, 4.971213638782501e-05, 5.6196004152297974e-05, 6.267987191677094e-05, 6.91637396812439e-05, 7.564760744571686e-05, 8.213147521018982e-05, 8.861534297466278e-05, 9.509921073913574e-05, 0.0001015830785036087, 0.00010806694626808167, 0.00011455081403255463, 0.00012103468179702759, 0.00012751854956150055, 0.0001340024173259735, 0.00014048628509044647, 0.00014697015285491943, 0.0001534540206193924, 0.00015993788838386536, 0.00016642175614833832, 0.00017290562391281128, 0.00017938949167728424, 0.0001858733594417572, 0.00019235722720623016, 0.00019884109497070312]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 9.0, 11.0, 9.0, 25.0, 21.0, 36.0, 75.0, 123.0, 219.0, 406.0, 828.0, 2083.0, 7853.0, 64374.0, 821535.0, 134288.0, 11833.0, 2749.0, 976.0, 458.0, 257.0, 142.0, 71.0, 62.0, 24.0, 27.0, 12.0, 7.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0625, -2.97406005859375, -2.8856201171875, -2.79718017578125, -2.708740234375, -2.62030029296875, -2.5318603515625, -2.44342041015625, -2.35498046875, -2.26654052734375, -2.1781005859375, -2.08966064453125, -2.001220703125, -1.91278076171875, -1.8243408203125, -1.73590087890625, -1.6474609375, -1.55902099609375, -1.4705810546875, -1.38214111328125, -1.293701171875, -1.20526123046875, -1.1168212890625, -1.02838134765625, -0.93994140625, -0.85150146484375, -0.7630615234375, -0.67462158203125, -0.586181640625, -0.49774169921875, -0.4093017578125, -0.32086181640625, -0.232421875, -0.14398193359375, -0.0555419921875, 0.03289794921875, 0.121337890625, 0.20977783203125, 0.2982177734375, 0.38665771484375, 0.47509765625, 0.56353759765625, 0.6519775390625, 0.74041748046875, 0.828857421875, 0.91729736328125, 1.0057373046875, 1.09417724609375, 1.1826171875, 1.27105712890625, 1.3594970703125, 1.44793701171875, 1.536376953125, 1.62481689453125, 1.7132568359375, 1.80169677734375, 1.89013671875, 1.97857666015625, 2.0670166015625, 2.15545654296875, 2.243896484375, 2.33233642578125, 2.4207763671875, 2.50921630859375, 2.59765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 14.0, 16.0, 20.0, 30.0, 46.0, 41.0, 76.0, 92.0, 126.0, 131.0, 128.0, 68.0, 67.0, 43.0, 25.0, 20.0, 16.0, 8.0, 7.0, 3.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6690521240234375, -1.620330810546875, -1.5716094970703125, -1.52288818359375, -1.4741668701171875, -1.425445556640625, -1.3767242431640625, -1.3280029296875, -1.2792816162109375, -1.230560302734375, -1.1818389892578125, -1.13311767578125, -1.0843963623046875, -1.035675048828125, -0.9869537353515625, -0.938232421875, -0.8895111083984375, -0.840789794921875, -0.7920684814453125, -0.74334716796875, -0.6946258544921875, -0.645904541015625, -0.5971832275390625, -0.5484619140625, -0.4997406005859375, -0.451019287109375, -0.4022979736328125, -0.35357666015625, -0.3048553466796875, -0.256134033203125, -0.2074127197265625, -0.15869140625, -0.1099700927734375, -0.061248779296875, -0.0125274658203125, 0.03619384765625, 0.0849151611328125, 0.133636474609375, 0.1823577880859375, 0.2310791015625, 0.2798004150390625, 0.328521728515625, 0.3772430419921875, 0.42596435546875, 0.4746856689453125, 0.523406982421875, 0.5721282958984375, 0.620849609375, 0.6695709228515625, 0.718292236328125, 0.7670135498046875, 0.81573486328125, 0.8644561767578125, 0.913177490234375, 0.9618988037109375, 1.0106201171875, 1.0593414306640625, 1.108062744140625, 1.1567840576171875, 1.20550537109375, 1.2542266845703125, 1.302947998046875, 1.3516693115234375, 1.400390625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 17.0, 80.0, 454.0, 372.0, 61.0, 18.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.54603576660156, -78.10302734375, -75.66001892089844, -73.2170181274414, -70.77400970458984, -68.33100128173828, -65.88800048828125, -63.44499206542969, -61.001983642578125, -58.55897521972656, -56.115970611572266, -53.67296600341797, -51.229957580566406, -48.786949157714844, -46.34394454956055, -43.90093994140625, -41.45793151855469, -39.014923095703125, -36.57191848754883, -34.12891387939453, -31.68590545654297, -29.24289894104004, -26.79989242553711, -24.35688591003418, -21.91387939453125, -19.47087287902832, -17.02786636352539, -14.584859848022461, -12.141853332519531, -9.698846817016602, -7.255840301513672, -4.812833786010742, -2.3698272705078125, 0.07317924499511719, 2.516185760498047, 4.959192276000977, 7.402198791503906, 9.845205307006836, 12.288211822509766, 14.731218338012695, 17.174224853515625, 19.617231369018555, 22.060237884521484, 24.503244400024414, 26.946250915527344, 29.389257431030273, 31.832263946533203, 34.2752685546875, 36.71827697753906, 39.161285400390625, 41.60429000854492, 44.04729461669922, 46.49030303955078, 48.933311462402344, 51.37631607055664, 53.81932067871094, 56.2623291015625, 58.70533752441406, 61.14834213256836, 63.591346740722656, 66.03435516357422, 68.47736358642578, 70.92036437988281, 73.36337280273438, 75.80638122558594]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 12.0, 9.0, 12.0, 12.0, 16.0, 32.0, 40.0, 30.0, 63.0, 54.0, 55.0, 61.0, 71.0, 55.0, 76.0, 62.0, 47.0, 63.0, 52.0, 39.0, 36.0, 20.0, 26.0, 14.0, 17.0, 4.0, 7.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.777952194213867, -28.92869758605957, -28.07944107055664, -27.230186462402344, -26.380931854248047, -25.53167724609375, -24.68242073059082, -23.833166122436523, -22.983909606933594, -22.134654998779297, -21.285398483276367, -20.43614387512207, -19.586889266967773, -18.737632751464844, -17.888378143310547, -17.03912353515625, -16.189868927001953, -15.34061336517334, -14.491358757019043, -13.64210319519043, -12.792848587036133, -11.94359302520752, -11.094337463378906, -10.24508285522461, -9.395827293395996, -8.546571731567383, -7.697317123413086, -6.848061561584473, -5.998806476593018, -5.1495513916015625, -4.300295829772949, -3.451040744781494, -2.601787567138672, -1.7525323629379272, -0.9032771587371826, -0.05402183532714844, 0.7952332496643066, 1.6444883346557617, 2.493743896484375, 3.34299898147583, 4.192254066467285, 5.04150915145874, 5.890764236450195, 6.740019798278809, 7.589274883270264, 8.438529968261719, 9.287785530090332, 10.137041091918945, 10.986295700073242, 11.835551261901855, 12.684805870056152, 13.534061431884766, 14.383316040039062, 15.232571601867676, 16.08182716369629, 16.931081771850586, 17.780338287353516, 18.629592895507812, 19.478849411010742, 20.32810401916504, 21.177358627319336, 22.026615142822266, 22.875869750976562, 23.72512435913086, 24.574378967285156]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 10.0, 19.0, 35.0, 46.0, 115.0, 296.0, 854.0, 8163.0, 4178177.0, 5850.0, 491.0, 110.0, 39.0, 29.0, 6.0, 9.0, 9.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-72.625, -71.02734375, -69.4296875, -67.83203125, -66.234375, -64.63671875, -63.0390625, -61.44140625, -59.84375, -58.24609375, -56.6484375, -55.05078125, -53.453125, -51.85546875, -50.2578125, -48.66015625, -47.0625, -45.46484375, -43.8671875, -42.26953125, -40.671875, -39.07421875, -37.4765625, -35.87890625, -34.28125, -32.68359375, -31.0859375, -29.48828125, -27.890625, -26.29296875, -24.6953125, -23.09765625, -21.5, -19.90234375, -18.3046875, -16.70703125, -15.109375, -13.51171875, -11.9140625, -10.31640625, -8.71875, -7.12109375, -5.5234375, -3.92578125, -2.328125, -0.73046875, 0.8671875, 2.46484375, 4.0625, 5.66015625, 7.2578125, 8.85546875, 10.453125, 12.05078125, 13.6484375, 15.24609375, 16.84375, 18.44140625, 20.0390625, 21.63671875, 23.234375, 24.83203125, 26.4296875, 28.02734375, 29.625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 10.0, 12.0, 30.0, 54.0, 110.0, 157.0, 204.0, 162.0, 101.0, 57.0, 33.0, 23.0, 8.0, 7.0, 6.0, 12.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.708984375, -1.6714248657226562, -1.6338653564453125, -1.5963058471679688, -1.558746337890625, -1.5211868286132812, -1.4836273193359375, -1.4460678100585938, -1.40850830078125, -1.3709487915039062, -1.3333892822265625, -1.2958297729492188, -1.258270263671875, -1.2207107543945312, -1.1831512451171875, -1.1455917358398438, -1.1080322265625, -1.0704727172851562, -1.0329132080078125, -0.9953536987304688, -0.957794189453125, -0.9202346801757812, -0.8826751708984375, -0.8451156616210938, -0.80755615234375, -0.7699966430664062, -0.7324371337890625, -0.6948776245117188, -0.657318115234375, -0.6197586059570312, -0.5821990966796875, -0.5446395874023438, -0.507080078125, -0.46952056884765625, -0.4319610595703125, -0.39440155029296875, -0.356842041015625, -0.31928253173828125, -0.2817230224609375, -0.24416351318359375, -0.20660400390625, -0.16904449462890625, -0.1314849853515625, -0.09392547607421875, -0.056365966796875, -0.01880645751953125, 0.0187530517578125, 0.05631256103515625, 0.0938720703125, 0.13143157958984375, 0.1689910888671875, 0.20655059814453125, 0.244110107421875, 0.28166961669921875, 0.3192291259765625, 0.35678863525390625, 0.39434814453125, 0.43190765380859375, 0.4694671630859375, 0.5070266723632812, 0.544586181640625, 0.5821456909179688, 0.6197052001953125, 0.6572647094726562, 0.69482421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 10.0, 26.0, 56.0, 168.0, 450.0, 2030.0, 78451.0, 4104745.0, 7101.0, 782.0, 279.0, 108.0, 45.0, 26.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.1015625, -14.4517822265625, -13.802001953125, -13.1522216796875, -12.50244140625, -11.8526611328125, -11.202880859375, -10.5531005859375, -9.9033203125, -9.2535400390625, -8.603759765625, -7.9539794921875, -7.30419921875, -6.6544189453125, -6.004638671875, -5.3548583984375, -4.705078125, -4.0552978515625, -3.405517578125, -2.7557373046875, -2.10595703125, -1.4561767578125, -0.806396484375, -0.1566162109375, 0.4931640625, 1.1429443359375, 1.792724609375, 2.4425048828125, 3.09228515625, 3.7420654296875, 4.391845703125, 5.0416259765625, 5.69140625, 6.3411865234375, 6.990966796875, 7.6407470703125, 8.29052734375, 8.9403076171875, 9.590087890625, 10.2398681640625, 10.8896484375, 11.5394287109375, 12.189208984375, 12.8389892578125, 13.48876953125, 14.1385498046875, 14.788330078125, 15.4381103515625, 16.087890625, 16.7376708984375, 17.387451171875, 18.0372314453125, 18.68701171875, 19.3367919921875, 19.986572265625, 20.6363525390625, 21.2861328125, 21.9359130859375, 22.585693359375, 23.2354736328125, 23.88525390625, 24.5350341796875, 25.184814453125, 25.8345947265625, 26.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 14.0, 16.0, 33.0, 50.0, 87.0, 312.0, 2527.0, 746.0, 151.0, 46.0, 29.0, 17.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.716796875, -2.642791748046875, -2.56878662109375, -2.494781494140625, -2.4207763671875, -2.346771240234375, -2.27276611328125, -2.198760986328125, -2.124755859375, -2.050750732421875, -1.97674560546875, -1.902740478515625, -1.8287353515625, -1.754730224609375, -1.68072509765625, -1.606719970703125, -1.53271484375, -1.458709716796875, -1.38470458984375, -1.310699462890625, -1.2366943359375, -1.162689208984375, -1.08868408203125, -1.014678955078125, -0.940673828125, -0.866668701171875, -0.79266357421875, -0.718658447265625, -0.6446533203125, -0.570648193359375, -0.49664306640625, -0.422637939453125, -0.3486328125, -0.274627685546875, -0.20062255859375, -0.126617431640625, -0.0526123046875, 0.021392822265625, 0.09539794921875, 0.169403076171875, 0.243408203125, 0.317413330078125, 0.39141845703125, 0.465423583984375, 0.5394287109375, 0.613433837890625, 0.68743896484375, 0.761444091796875, 0.83544921875, 0.909454345703125, 0.98345947265625, 1.057464599609375, 1.1314697265625, 1.205474853515625, 1.27947998046875, 1.353485107421875, 1.427490234375, 1.501495361328125, 1.57550048828125, 1.649505615234375, 1.7235107421875, 1.797515869140625, 1.87152099609375, 1.945526123046875, 2.01953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 12.0, 55.0, 475.0, 405.0, 43.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.124195098876953, -18.251140594482422, -17.37808609008789, -16.50503158569336, -15.631977081298828, -14.758922576904297, -13.88586711883545, -13.012812614440918, -12.139758110046387, -11.266703605651855, -10.393649101257324, -9.520593643188477, -8.647539138793945, -7.774485111236572, -6.901430130004883, -6.028375625610352, -5.15532112121582, -4.282266616821289, -3.4092118740081787, -2.5361571311950684, -1.663102626800537, -0.7900481224060059, 0.0830068588256836, 0.9560613632202148, 1.829115867614746, 2.7021703720092773, 3.5752251148223877, 4.448279857635498, 5.321334362030029, 6.1943888664245605, 7.06744384765625, 7.940498352050781, 8.813552856445312, 9.686607360839844, 10.559661865234375, 11.432716369628906, 12.305770874023438, 13.178825378417969, 14.051880836486816, 14.924935340881348, 15.797989845275879, 16.671045303344727, 17.544099807739258, 18.41715431213379, 19.29020881652832, 20.16326332092285, 21.036317825317383, 21.909372329711914, 22.782426834106445, 23.655481338500977, 24.528535842895508, 25.40159034729004, 26.27464485168457, 27.1476993560791, 28.020755767822266, 28.893810272216797, 29.766864776611328, 30.63991928100586, 31.51297378540039, 32.38602828979492, 33.25908279418945, 34.132137298583984, 35.005191802978516, 35.87824630737305, 36.75130081176758]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 11.0, 17.0, 31.0, 40.0, 68.0, 74.0, 92.0, 111.0, 100.0, 104.0, 99.0, 62.0, 58.0, 46.0, 31.0, 14.0, 19.0, 2.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.380634307861328, -10.069737434387207, -9.758840560913086, -9.447943687438965, -9.137046813964844, -8.826149940490723, -8.515253067016602, -8.204355239868164, -7.893458843231201, -7.58256196975708, -7.271665096282959, -6.960768222808838, -6.649870872497559, -6.3389739990234375, -6.028077125549316, -5.717180252075195, -5.406283378601074, -5.095386505126953, -4.784489631652832, -4.473592758178711, -4.16269588470459, -3.8517987728118896, -3.5409016609191895, -3.2300047874450684, -2.9191079139709473, -2.608211040496826, -2.297314167022705, -1.9864170551300049, -1.6755201816558838, -1.3646233081817627, -1.053726315498352, -0.7428293228149414, -0.4319314956665039, -0.12103456258773804, 0.18986237049102783, 0.5007593035697937, 0.8116562366485596, 1.1225531101226807, 1.4334501028060913, 1.744347095489502, 2.055243968963623, 2.366140842437744, 2.6770377159118652, 2.9879348278045654, 3.2988317012786865, 3.6097285747528076, 3.920625686645508, 4.231522560119629, 4.54241943359375, 4.853316307067871, 5.164213180541992, 5.475110054016113, 5.786006927490234, 6.0969038009643555, 6.407801151275635, 6.718698024749756, 7.029594898223877, 7.340491771697998, 7.651388645172119, 7.96228551864624, 8.27318286895752, 8.58407974243164, 8.894976615905762, 9.205873489379883, 9.516770362854004]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 21.0, 21.0, 40.0, 63.0, 114.0, 236.0, 414.0, 997.0, 2940.0, 13360.0, 486745.0, 524927.0, 13832.0, 2835.0, 993.0, 450.0, 195.0, 127.0, 90.0, 37.0, 31.0, 23.0, 8.0, 12.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.916748046875, -8.63818359375, -8.359619140625, -8.0810546875, -7.802490234375, -7.52392578125, -7.245361328125, -6.966796875, -6.688232421875, -6.40966796875, -6.131103515625, -5.8525390625, -5.573974609375, -5.29541015625, -5.016845703125, -4.73828125, -4.459716796875, -4.18115234375, -3.902587890625, -3.6240234375, -3.345458984375, -3.06689453125, -2.788330078125, -2.509765625, -2.231201171875, -1.95263671875, -1.674072265625, -1.3955078125, -1.116943359375, -0.83837890625, -0.559814453125, -0.28125, -0.002685546875, 0.27587890625, 0.554443359375, 0.8330078125, 1.111572265625, 1.39013671875, 1.668701171875, 1.947265625, 2.225830078125, 2.50439453125, 2.782958984375, 3.0615234375, 3.340087890625, 3.61865234375, 3.897216796875, 4.17578125, 4.454345703125, 4.73291015625, 5.011474609375, 5.2900390625, 5.568603515625, 5.84716796875, 6.125732421875, 6.404296875, 6.682861328125, 6.96142578125, 7.239990234375, 7.5185546875, 7.797119140625, 8.07568359375, 8.354248046875, 8.6328125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 6.0, 12.0, 33.0, 57.0, 107.0, 126.0, 167.0, 162.0, 125.0, 75.0, 50.0, 22.0, 16.0, 11.0, 5.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.58203125, -1.5474395751953125, -1.512847900390625, -1.4782562255859375, -1.44366455078125, -1.4090728759765625, -1.374481201171875, -1.3398895263671875, -1.3052978515625, -1.2707061767578125, -1.236114501953125, -1.2015228271484375, -1.16693115234375, -1.1323394775390625, -1.097747802734375, -1.0631561279296875, -1.028564453125, -0.9939727783203125, -0.959381103515625, -0.9247894287109375, -0.89019775390625, -0.8556060791015625, -0.821014404296875, -0.7864227294921875, -0.7518310546875, -0.7172393798828125, -0.682647705078125, -0.6480560302734375, -0.61346435546875, -0.5788726806640625, -0.544281005859375, -0.5096893310546875, -0.47509765625, -0.4405059814453125, -0.405914306640625, -0.3713226318359375, -0.33673095703125, -0.3021392822265625, -0.267547607421875, -0.2329559326171875, -0.1983642578125, -0.1637725830078125, -0.129180908203125, -0.0945892333984375, -0.05999755859375, -0.0254058837890625, 0.009185791015625, 0.0437774658203125, 0.078369140625, 0.1129608154296875, 0.147552490234375, 0.1821441650390625, 0.21673583984375, 0.2513275146484375, 0.285919189453125, 0.3205108642578125, 0.3551025390625, 0.3896942138671875, 0.424285888671875, 0.4588775634765625, 0.49346923828125, 0.5280609130859375, 0.562652587890625, 0.5972442626953125, 0.6318359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 6.0, 7.0, 6.0, 5.0, 12.0, 28.0, 36.0, 39.0, 65.0, 87.0, 141.0, 208.0, 314.0, 514.0, 1008.0, 2063.0, 5866.0, 24984.0, 197931.0, 674946.0, 115416.0, 16607.0, 4433.0, 1671.0, 844.0, 457.0, 276.0, 197.0, 106.0, 94.0, 60.0, 31.0, 30.0, 21.0, 14.0, 13.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.2393798828125, -4.099853515625, -3.9603271484375, -3.82080078125, -3.6812744140625, -3.541748046875, -3.4022216796875, -3.2626953125, -3.1231689453125, -2.983642578125, -2.8441162109375, -2.70458984375, -2.5650634765625, -2.425537109375, -2.2860107421875, -2.146484375, -2.0069580078125, -1.867431640625, -1.7279052734375, -1.58837890625, -1.4488525390625, -1.309326171875, -1.1697998046875, -1.0302734375, -0.8907470703125, -0.751220703125, -0.6116943359375, -0.47216796875, -0.3326416015625, -0.193115234375, -0.0535888671875, 0.0859375, 0.2254638671875, 0.364990234375, 0.5045166015625, 0.64404296875, 0.7835693359375, 0.923095703125, 1.0626220703125, 1.2021484375, 1.3416748046875, 1.481201171875, 1.6207275390625, 1.76025390625, 1.8997802734375, 2.039306640625, 2.1788330078125, 2.318359375, 2.4578857421875, 2.597412109375, 2.7369384765625, 2.87646484375, 3.0159912109375, 3.155517578125, 3.2950439453125, 3.4345703125, 3.5740966796875, 3.713623046875, 3.8531494140625, 3.99267578125, 4.1322021484375, 4.271728515625, 4.4112548828125, 4.55078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 5.0, 4.0, 17.0, 14.0, 11.0, 20.0, 33.0, 33.0, 42.0, 47.0, 41.0, 54.0, 46.0, 46.0, 52.0, 58.0, 61.0, 56.0, 59.0, 57.0, 49.0, 34.0, 30.0, 30.0, 24.0, 13.0, 9.0, 13.0, 6.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.91876220703125, -2.8140869140625, -2.70941162109375, -2.604736328125, -2.50006103515625, -2.3953857421875, -2.29071044921875, -2.18603515625, -2.08135986328125, -1.9766845703125, -1.87200927734375, -1.767333984375, -1.66265869140625, -1.5579833984375, -1.45330810546875, -1.3486328125, -1.24395751953125, -1.1392822265625, -1.03460693359375, -0.929931640625, -0.82525634765625, -0.7205810546875, -0.61590576171875, -0.51123046875, -0.40655517578125, -0.3018798828125, -0.19720458984375, -0.092529296875, 0.01214599609375, 0.1168212890625, 0.22149658203125, 0.326171875, 0.43084716796875, 0.5355224609375, 0.64019775390625, 0.744873046875, 0.84954833984375, 0.9542236328125, 1.05889892578125, 1.16357421875, 1.26824951171875, 1.3729248046875, 1.47760009765625, 1.582275390625, 1.68695068359375, 1.7916259765625, 1.89630126953125, 2.0009765625, 2.10565185546875, 2.2103271484375, 2.31500244140625, 2.419677734375, 2.52435302734375, 2.6290283203125, 2.73370361328125, 2.83837890625, 2.94305419921875, 3.0477294921875, 3.15240478515625, 3.257080078125, 3.36175537109375, 3.4664306640625, 3.57110595703125, 3.67578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 17.0, 33.0, 54.0, 167.0, 519.0, 9876.0, 1034075.0, 3188.0, 369.0, 131.0, 66.0, 14.0, 15.0, 12.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.671875, -18.2093505859375, -17.746826171875, -17.2843017578125, -16.82177734375, -16.3592529296875, -15.896728515625, -15.4342041015625, -14.9716796875, -14.5091552734375, -14.046630859375, -13.5841064453125, -13.12158203125, -12.6590576171875, -12.196533203125, -11.7340087890625, -11.271484375, -10.8089599609375, -10.346435546875, -9.8839111328125, -9.42138671875, -8.9588623046875, -8.496337890625, -8.0338134765625, -7.5712890625, -7.1087646484375, -6.646240234375, -6.1837158203125, -5.72119140625, -5.2586669921875, -4.796142578125, -4.3336181640625, -3.87109375, -3.4085693359375, -2.946044921875, -2.4835205078125, -2.02099609375, -1.5584716796875, -1.095947265625, -0.6334228515625, -0.1708984375, 0.2916259765625, 0.754150390625, 1.2166748046875, 1.67919921875, 2.1417236328125, 2.604248046875, 3.0667724609375, 3.529296875, 3.9918212890625, 4.454345703125, 4.9168701171875, 5.37939453125, 5.8419189453125, 6.304443359375, 6.7669677734375, 7.2294921875, 7.6920166015625, 8.154541015625, 8.6170654296875, 9.07958984375, 9.5421142578125, 10.004638671875, 10.4671630859375, 10.9296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 2.0, 8.0, 3.0, 16.0, 19.0, 34.0, 52.0, 89.0, 116.0, 181.0, 155.0, 121.0, 73.0, 49.0, 31.0, 17.0, 9.0, 9.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003228187561035156, -0.00031328946352005005, -0.00030376017093658447, -0.0002942308783531189, -0.0002847015857696533, -0.00027517229318618774, -0.00026564300060272217, -0.0002561137080192566, -0.000246584415435791, -0.00023705512285232544, -0.00022752583026885986, -0.0002179965376853943, -0.0002084672451019287, -0.00019893795251846313, -0.00018940865993499756, -0.00017987936735153198, -0.0001703500747680664, -0.00016082078218460083, -0.00015129148960113525, -0.00014176219701766968, -0.0001322329044342041, -0.00012270361185073853, -0.00011317431926727295, -0.00010364502668380737, -9.41157341003418e-05, -8.458644151687622e-05, -7.505714893341064e-05, -6.552785634994507e-05, -5.599856376647949e-05, -4.6469271183013916e-05, -3.693997859954834e-05, -2.7410686016082764e-05, -1.7881393432617188e-05, -8.352100849151611e-06, 1.1771917343139648e-06, 1.0706484317779541e-05, 2.0235776901245117e-05, 2.9765069484710693e-05, 3.929436206817627e-05, 4.8823654651641846e-05, 5.835294723510742e-05, 6.7882239818573e-05, 7.741153240203857e-05, 8.694082498550415e-05, 9.647011756896973e-05, 0.0001059994101524353, 0.00011552870273590088, 0.00012505799531936646, 0.00013458728790283203, 0.0001441165804862976, 0.00015364587306976318, 0.00016317516565322876, 0.00017270445823669434, 0.0001822337508201599, 0.0001917630434036255, 0.00020129233598709106, 0.00021082162857055664, 0.00022035092115402222, 0.0002298802137374878, 0.00023940950632095337, 0.00024893879890441895, 0.0002584680914878845, 0.0002679973840713501, 0.0002775266766548157, 0.00028705596923828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 3.0, 4.0, 6.0, 4.0, 7.0, 8.0, 16.0, 11.0, 16.0, 28.0, 41.0, 57.0, 102.0, 223.0, 563.0, 1673.0, 6384.0, 76081.0, 931761.0, 25508.0, 3983.0, 1170.0, 433.0, 181.0, 90.0, 62.0, 36.0, 38.0, 10.0, 10.0, 12.0, 10.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.4375, -5.28790283203125, -5.1383056640625, -4.98870849609375, -4.839111328125, -4.68951416015625, -4.5399169921875, -4.39031982421875, -4.24072265625, -4.09112548828125, -3.9415283203125, -3.79193115234375, -3.642333984375, -3.49273681640625, -3.3431396484375, -3.19354248046875, -3.0439453125, -2.89434814453125, -2.7447509765625, -2.59515380859375, -2.445556640625, -2.29595947265625, -2.1463623046875, -1.99676513671875, -1.84716796875, -1.69757080078125, -1.5479736328125, -1.39837646484375, -1.248779296875, -1.09918212890625, -0.9495849609375, -0.79998779296875, -0.650390625, -0.50079345703125, -0.3511962890625, -0.20159912109375, -0.052001953125, 0.09759521484375, 0.2471923828125, 0.39678955078125, 0.54638671875, 0.69598388671875, 0.8455810546875, 0.99517822265625, 1.144775390625, 1.29437255859375, 1.4439697265625, 1.59356689453125, 1.7431640625, 1.89276123046875, 2.0423583984375, 2.19195556640625, 2.341552734375, 2.49114990234375, 2.6407470703125, 2.79034423828125, 2.93994140625, 3.08953857421875, 3.2391357421875, 3.38873291015625, 3.538330078125, 3.68792724609375, 3.8375244140625, 3.98712158203125, 4.13671875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 12.0, 29.0, 49.0, 87.0, 145.0, 217.0, 160.0, 123.0, 78.0, 40.0, 13.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.308319091796875, -2.22210693359375, -2.135894775390625, -2.0496826171875, -1.963470458984375, -1.87725830078125, -1.791046142578125, -1.704833984375, -1.618621826171875, -1.53240966796875, -1.446197509765625, -1.3599853515625, -1.273773193359375, -1.18756103515625, -1.101348876953125, -1.01513671875, -0.928924560546875, -0.84271240234375, -0.756500244140625, -0.6702880859375, -0.584075927734375, -0.49786376953125, -0.411651611328125, -0.325439453125, -0.239227294921875, -0.15301513671875, -0.066802978515625, 0.0194091796875, 0.105621337890625, 0.19183349609375, 0.278045654296875, 0.3642578125, 0.450469970703125, 0.53668212890625, 0.622894287109375, 0.7091064453125, 0.795318603515625, 0.88153076171875, 0.967742919921875, 1.053955078125, 1.140167236328125, 1.22637939453125, 1.312591552734375, 1.3988037109375, 1.485015869140625, 1.57122802734375, 1.657440185546875, 1.74365234375, 1.829864501953125, 1.91607666015625, 2.002288818359375, 2.0885009765625, 2.174713134765625, 2.26092529296875, 2.347137451171875, 2.433349609375, 2.519561767578125, 2.60577392578125, 2.691986083984375, 2.7781982421875, 2.864410400390625, 2.95062255859375, 3.036834716796875, 3.123046875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 49.0, 827.0, 128.0, 9.0, 0.0, 0.0, 1.0, 1.0], "bins": [-280.0517578125, -275.194091796875, -270.3364562988281, -265.4787902832031, -260.6211242675781, -255.7634735107422, -250.9058074951172, -246.04815673828125, -241.19049072265625, -236.3328399658203, -231.4751739501953, -226.61752319335938, -221.75985717773438, -216.90220642089844, -212.04454040527344, -207.1868896484375, -202.32923889160156, -197.47158813476562, -192.61392211914062, -187.7562713623047, -182.8986053466797, -178.04095458984375, -173.18328857421875, -168.3256378173828, -163.46798706054688, -158.61033630371094, -153.75267028808594, -148.89501953125, -144.037353515625, -139.17970275878906, -134.32203674316406, -129.46438598632812, -124.60671997070312, -119.74906158447266, -114.89140319824219, -110.03374481201172, -105.17608642578125, -100.31843566894531, -95.46077728271484, -90.60311889648438, -85.7454605102539, -80.88780212402344, -76.03014373779297, -71.1724853515625, -66.31483459472656, -61.45717239379883, -56.599517822265625, -51.741859436035156, -46.88420104980469, -42.02654266357422, -37.16888427734375, -32.31122970581055, -27.453571319580078, -22.59591293334961, -17.738256454467773, -12.880599975585938, -8.022943496704102, -3.165286064147949, 1.6923713684082031, 6.5500288009643555, 11.407686233520508, 16.265344619750977, 21.123001098632812, 25.98065757751465, 30.838315963745117]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 3.0, 11.0, 17.0, 12.0, 14.0, 20.0, 24.0, 25.0, 19.0, 32.0, 40.0, 32.0, 40.0, 42.0, 34.0, 38.0, 50.0, 54.0, 45.0, 46.0, 35.0, 51.0, 45.0, 32.0, 39.0, 32.0, 21.0, 21.0, 13.0, 19.0, 18.0, 13.0, 11.0, 10.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-19.11857795715332, -18.55038070678711, -17.982181549072266, -17.413982391357422, -16.84578514099121, -16.277587890625, -15.709388732910156, -15.141190528869629, -14.572992324829102, -14.004794120788574, -13.436595916748047, -12.86839771270752, -12.300199508666992, -11.732001304626465, -11.163803100585938, -10.59560489654541, -10.027406692504883, -9.459208488464355, -8.891010284423828, -8.3228120803833, -7.754613876342773, -7.186415672302246, -6.618217468261719, -6.050019264221191, -5.481821060180664, -4.913622856140137, -4.345424652099609, -3.777226448059082, -3.2090282440185547, -2.6408300399780273, -2.0726318359375, -1.5044336318969727, -0.9362373352050781, -0.3680391311645508, 0.20015907287597656, 0.7683572769165039, 1.3365554809570312, 1.9047536849975586, 2.472951889038086, 3.0411500930786133, 3.6093482971191406, 4.177546501159668, 4.745744705200195, 5.313942909240723, 5.88214111328125, 6.450339317321777, 7.018537521362305, 7.586735725402832, 8.15493392944336, 8.723132133483887, 9.291330337524414, 9.859528541564941, 10.427726745605469, 10.995924949645996, 11.564123153686523, 12.13232135772705, 12.700519561767578, 13.268717765808105, 13.836915969848633, 14.40511417388916, 14.973312377929688, 15.541510581970215, 16.109708786010742, 16.677906036376953, 17.246105194091797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 11.0, 23.0, 42.0, 51.0, 134.0, 279.0, 793.0, 4442.0, 3191120.0, 992884.0, 3565.0, 566.0, 191.0, 89.0, 30.0, 18.0, 13.0, 12.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-23.25, -22.7091064453125, -22.168212890625, -21.6273193359375, -21.08642578125, -20.5455322265625, -20.004638671875, -19.4637451171875, -18.9228515625, -18.3819580078125, -17.841064453125, -17.3001708984375, -16.75927734375, -16.2183837890625, -15.677490234375, -15.1365966796875, -14.595703125, -14.0548095703125, -13.513916015625, -12.9730224609375, -12.43212890625, -11.8912353515625, -11.350341796875, -10.8094482421875, -10.2685546875, -9.7276611328125, -9.186767578125, -8.6458740234375, -8.10498046875, -7.5640869140625, -7.023193359375, -6.4822998046875, -5.94140625, -5.4005126953125, -4.859619140625, -4.3187255859375, -3.77783203125, -3.2369384765625, -2.696044921875, -2.1551513671875, -1.6142578125, -1.0733642578125, -0.532470703125, 0.0084228515625, 0.54931640625, 1.0902099609375, 1.631103515625, 2.1719970703125, 2.712890625, 3.2537841796875, 3.794677734375, 4.3355712890625, 4.87646484375, 5.4173583984375, 5.958251953125, 6.4991455078125, 7.0400390625, 7.5809326171875, 8.121826171875, 8.6627197265625, 9.20361328125, 9.7445068359375, 10.285400390625, 10.8262939453125, 11.3671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 3.0, 9.0, 18.0, 25.0, 48.0, 79.0, 108.0, 114.0, 137.0, 139.0, 89.0, 83.0, 59.0, 33.0, 20.0, 10.0, 9.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.560546875, -1.5228805541992188, -1.4852142333984375, -1.4475479125976562, -1.409881591796875, -1.3722152709960938, -1.3345489501953125, -1.2968826293945312, -1.25921630859375, -1.2215499877929688, -1.1838836669921875, -1.1462173461914062, -1.108551025390625, -1.0708847045898438, -1.0332183837890625, -0.9955520629882812, -0.9578857421875, -0.9202194213867188, -0.8825531005859375, -0.8448867797851562, -0.807220458984375, -0.7695541381835938, -0.7318878173828125, -0.6942214965820312, -0.65655517578125, -0.6188888549804688, -0.5812225341796875, -0.5435562133789062, -0.505889892578125, -0.46822357177734375, -0.4305572509765625, -0.39289093017578125, -0.355224609375, -0.31755828857421875, -0.2798919677734375, -0.24222564697265625, -0.204559326171875, -0.16689300537109375, -0.1292266845703125, -0.09156036376953125, -0.05389404296875, -0.01622772216796875, 0.0214385986328125, 0.05910491943359375, 0.096771240234375, 0.13443756103515625, 0.1721038818359375, 0.20977020263671875, 0.2474365234375, 0.28510284423828125, 0.3227691650390625, 0.36043548583984375, 0.398101806640625, 0.43576812744140625, 0.4734344482421875, 0.5111007690429688, 0.54876708984375, 0.5864334106445312, 0.6240997314453125, 0.6617660522460938, 0.699432373046875, 0.7370986938476562, 0.7747650146484375, 0.8124313354492188, 0.85009765625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 9.0, 7.0, 28.0, 76.0, 213.0, 786.0, 9841.0, 4137372.0, 43585.0, 1797.0, 349.0, 120.0, 54.0, 25.0, 5.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.150390625, -8.66015625, -8.169921875, -7.6796875, -7.189453125, -6.69921875, -6.208984375, -5.71875, -5.228515625, -4.73828125, -4.248046875, -3.7578125, -3.267578125, -2.77734375, -2.287109375, -1.796875, -1.306640625, -0.81640625, -0.326171875, 0.1640625, 0.654296875, 1.14453125, 1.634765625, 2.125, 2.615234375, 3.10546875, 3.595703125, 4.0859375, 4.576171875, 5.06640625, 5.556640625, 6.046875, 6.537109375, 7.02734375, 7.517578125, 8.0078125, 8.498046875, 8.98828125, 9.478515625, 9.96875, 10.458984375, 10.94921875, 11.439453125, 11.9296875, 12.419921875, 12.91015625, 13.400390625, 13.890625, 14.380859375, 14.87109375, 15.361328125, 15.8515625, 16.341796875, 16.83203125, 17.322265625, 17.8125, 18.302734375, 18.79296875, 19.283203125, 19.7734375, 20.263671875, 20.75390625, 21.244140625, 21.734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 9.0, 9.0, 12.0, 32.0, 52.0, 84.0, 164.0, 543.0, 2192.0, 586.0, 179.0, 85.0, 33.0, 32.0, 14.0, 12.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9501953125, -0.9015350341796875, -0.852874755859375, -0.8042144775390625, -0.75555419921875, -0.7068939208984375, -0.658233642578125, -0.6095733642578125, -0.5609130859375, -0.5122528076171875, -0.463592529296875, -0.4149322509765625, -0.36627197265625, -0.3176116943359375, -0.268951416015625, -0.2202911376953125, -0.171630859375, -0.1229705810546875, -0.074310302734375, -0.0256500244140625, 0.02301025390625, 0.0716705322265625, 0.120330810546875, 0.1689910888671875, 0.2176513671875, 0.2663116455078125, 0.314971923828125, 0.3636322021484375, 0.41229248046875, 0.4609527587890625, 0.509613037109375, 0.5582733154296875, 0.60693359375, 0.6555938720703125, 0.704254150390625, 0.7529144287109375, 0.80157470703125, 0.8502349853515625, 0.898895263671875, 0.9475555419921875, 0.9962158203125, 1.0448760986328125, 1.093536376953125, 1.1421966552734375, 1.19085693359375, 1.2395172119140625, 1.288177490234375, 1.3368377685546875, 1.385498046875, 1.4341583251953125, 1.482818603515625, 1.5314788818359375, 1.58013916015625, 1.6287994384765625, 1.677459716796875, 1.7261199951171875, 1.7747802734375, 1.8234405517578125, 1.872100830078125, 1.9207611083984375, 1.96942138671875, 2.0180816650390625, 2.066741943359375, 2.1154022216796875, 2.1640625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 57.0, 230.0, 411.0, 214.0, 49.0, 17.0, 6.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.721809387207031, -5.294982433319092, -4.868155479431152, -4.441328525543213, -4.014501571655273, -3.587674379348755, -3.1608474254608154, -2.734020471572876, -2.3071935176849365, -1.880366563796997, -1.4535396099090576, -1.0267125368118286, -0.5998855829238892, -0.17305850982666016, 0.2537684440612793, 0.6805953979492188, 1.1074223518371582, 1.5342493057250977, 1.961076259613037, 2.3879032135009766, 2.814730167388916, 3.2415573596954346, 3.668384313583374, 4.095211029052734, 4.522038459777832, 4.9488654136657715, 5.375692367553711, 5.80251932144165, 6.22934627532959, 6.6561737060546875, 7.083000183105469, 7.509827613830566, 7.936654090881348, 8.363481521606445, 8.790307998657227, 9.217135429382324, 9.643961906433105, 10.070789337158203, 10.497615814208984, 10.924443244934082, 11.351269721984863, 11.778097152709961, 12.204923629760742, 12.63175106048584, 13.058577537536621, 13.485404968261719, 13.9122314453125, 14.339058876037598, 14.765886306762695, 15.192713737487793, 15.619540214538574, 16.046367645263672, 16.473194122314453, 16.900020599365234, 17.32684898376465, 17.75367546081543, 18.18050193786621, 18.607328414916992, 19.034156799316406, 19.460983276367188, 19.88780975341797, 20.31463623046875, 20.741464614868164, 21.168291091918945, 21.595117568969727]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 9.0, 26.0, 23.0, 28.0, 58.0, 56.0, 63.0, 76.0, 67.0, 79.0, 87.0, 72.0, 65.0, 68.0, 44.0, 43.0, 40.0, 21.0, 17.0, 16.0, 13.0, 8.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.129608631134033, -6.918914794921875, -6.708220958709717, -6.497527122497559, -6.286832809448242, -6.076138973236084, -5.865445137023926, -5.654751300811768, -5.444057464599609, -5.233363628387451, -5.022669792175293, -4.811975479125977, -4.601281642913818, -4.39058780670166, -4.179893970489502, -3.9692001342773438, -3.7585058212280273, -3.547811985015869, -3.337117910385132, -3.1264240741729736, -2.9157299995422363, -2.705036163330078, -2.49434232711792, -2.2836484909057617, -2.0729544162750244, -1.8622604608535767, -1.651566505432129, -1.4408726692199707, -1.230178713798523, -1.0194847583770752, -0.808790922164917, -0.5980969667434692, -0.3874034881591797, -0.17670956254005432, 0.033984363079071045, 0.24467825889587402, 0.4553722143173218, 0.6660661697387695, 0.8767600059509277, 1.0874539613723755, 1.2981479167938232, 1.508841872215271, 1.7195358276367188, 1.930229663848877, 2.140923500061035, 2.3516175746917725, 2.5623114109039307, 2.773005485534668, 2.983699321746826, 3.1943931579589844, 3.4050872325897217, 3.61578106880188, 3.826475143432617, 4.037168979644775, 4.247862815856934, 4.458556652069092, 4.66925048828125, 4.879944324493408, 5.090638160705566, 5.301332473754883, 5.512026309967041, 5.722720146179199, 5.933413982391357, 6.144107818603516, 6.354802131652832]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 5.0, 2.0, 0.0, 5.0, 3.0, 5.0, 0.0, 10.0, 6.0, 25.0, 18.0, 31.0, 34.0, 35.0, 67.0, 57.0, 132.0, 172.0, 251.0, 358.0, 525.0, 883.0, 1428.0, 2868.0, 7044.0, 23049.0, 101842.0, 458075.0, 351457.0, 71396.0, 16973.0, 5665.0, 2431.0, 1329.0, 771.0, 506.0, 317.0, 191.0, 170.0, 102.0, 90.0, 58.0, 44.0, 29.0, 27.0, 23.0, 10.0, 21.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.95703125, -2.861297607421875, -2.76556396484375, -2.669830322265625, -2.5740966796875, -2.478363037109375, -2.38262939453125, -2.286895751953125, -2.191162109375, -2.095428466796875, -1.99969482421875, -1.903961181640625, -1.8082275390625, -1.712493896484375, -1.61676025390625, -1.521026611328125, -1.42529296875, -1.329559326171875, -1.23382568359375, -1.138092041015625, -1.0423583984375, -0.946624755859375, -0.85089111328125, -0.755157470703125, -0.659423828125, -0.563690185546875, -0.46795654296875, -0.372222900390625, -0.2764892578125, -0.180755615234375, -0.08502197265625, 0.010711669921875, 0.1064453125, 0.202178955078125, 0.29791259765625, 0.393646240234375, 0.4893798828125, 0.585113525390625, 0.68084716796875, 0.776580810546875, 0.872314453125, 0.968048095703125, 1.06378173828125, 1.159515380859375, 1.2552490234375, 1.350982666015625, 1.44671630859375, 1.542449951171875, 1.63818359375, 1.733917236328125, 1.82965087890625, 1.925384521484375, 2.0211181640625, 2.116851806640625, 2.21258544921875, 2.308319091796875, 2.404052734375, 2.499786376953125, 2.59552001953125, 2.691253662109375, 2.7869873046875, 2.882720947265625, 2.97845458984375, 3.074188232421875, 3.169921875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 9.0, 21.0, 42.0, 59.0, 80.0, 106.0, 123.0, 142.0, 126.0, 99.0, 58.0, 49.0, 23.0, 26.0, 10.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.48046875, -1.442596435546875, -1.40472412109375, -1.366851806640625, -1.3289794921875, -1.291107177734375, -1.25323486328125, -1.215362548828125, -1.177490234375, -1.139617919921875, -1.10174560546875, -1.063873291015625, -1.0260009765625, -0.988128662109375, -0.95025634765625, -0.912384033203125, -0.87451171875, -0.836639404296875, -0.79876708984375, -0.760894775390625, -0.7230224609375, -0.685150146484375, -0.64727783203125, -0.609405517578125, -0.571533203125, -0.533660888671875, -0.49578857421875, -0.457916259765625, -0.4200439453125, -0.382171630859375, -0.34429931640625, -0.306427001953125, -0.2685546875, -0.230682373046875, -0.19281005859375, -0.154937744140625, -0.1170654296875, -0.079193115234375, -0.04132080078125, -0.003448486328125, 0.034423828125, 0.072296142578125, 0.11016845703125, 0.148040771484375, 0.1859130859375, 0.223785400390625, 0.26165771484375, 0.299530029296875, 0.33740234375, 0.375274658203125, 0.41314697265625, 0.451019287109375, 0.4888916015625, 0.526763916015625, 0.56463623046875, 0.602508544921875, 0.640380859375, 0.678253173828125, 0.71612548828125, 0.753997802734375, 0.7918701171875, 0.829742431640625, 0.86761474609375, 0.905487060546875, 0.943359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 14.0, 6.0, 16.0, 20.0, 24.0, 28.0, 46.0, 68.0, 93.0, 178.0, 245.0, 382.0, 645.0, 1237.0, 2931.0, 8274.0, 30197.0, 154854.0, 565094.0, 225083.0, 41525.0, 10662.0, 3520.0, 1484.0, 736.0, 413.0, 252.0, 164.0, 113.0, 69.0, 54.0, 38.0, 22.0, 17.0, 18.0, 8.0, 6.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.751953125, -3.646575927734375, -3.54119873046875, -3.435821533203125, -3.3304443359375, -3.225067138671875, -3.11968994140625, -3.014312744140625, -2.908935546875, -2.803558349609375, -2.69818115234375, -2.592803955078125, -2.4874267578125, -2.382049560546875, -2.27667236328125, -2.171295166015625, -2.06591796875, -1.960540771484375, -1.85516357421875, -1.749786376953125, -1.6444091796875, -1.539031982421875, -1.43365478515625, -1.328277587890625, -1.222900390625, -1.117523193359375, -1.01214599609375, -0.906768798828125, -0.8013916015625, -0.696014404296875, -0.59063720703125, -0.485260009765625, -0.3798828125, -0.274505615234375, -0.16912841796875, -0.063751220703125, 0.0416259765625, 0.147003173828125, 0.25238037109375, 0.357757568359375, 0.463134765625, 0.568511962890625, 0.67388916015625, 0.779266357421875, 0.8846435546875, 0.990020751953125, 1.09539794921875, 1.200775146484375, 1.30615234375, 1.411529541015625, 1.51690673828125, 1.622283935546875, 1.7276611328125, 1.833038330078125, 1.93841552734375, 2.043792724609375, 2.149169921875, 2.254547119140625, 2.35992431640625, 2.465301513671875, 2.5706787109375, 2.676055908203125, 2.78143310546875, 2.886810302734375, 2.9921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 4.0, 9.0, 10.0, 9.0, 14.0, 15.0, 25.0, 26.0, 28.0, 35.0, 25.0, 35.0, 28.0, 50.0, 41.0, 49.0, 42.0, 62.0, 43.0, 43.0, 53.0, 45.0, 35.0, 44.0, 40.0, 22.0, 19.0, 24.0, 22.0, 21.0, 17.0, 8.0, 12.0, 6.0, 8.0, 9.0, 1.0, 8.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9140625, -2.82550048828125, -2.7369384765625, -2.64837646484375, -2.559814453125, -2.47125244140625, -2.3826904296875, -2.29412841796875, -2.20556640625, -2.11700439453125, -2.0284423828125, -1.93988037109375, -1.851318359375, -1.76275634765625, -1.6741943359375, -1.58563232421875, -1.4970703125, -1.40850830078125, -1.3199462890625, -1.23138427734375, -1.142822265625, -1.05426025390625, -0.9656982421875, -0.87713623046875, -0.78857421875, -0.70001220703125, -0.6114501953125, -0.52288818359375, -0.434326171875, -0.34576416015625, -0.2572021484375, -0.16864013671875, -0.080078125, 0.00848388671875, 0.0970458984375, 0.18560791015625, 0.274169921875, 0.36273193359375, 0.4512939453125, 0.53985595703125, 0.62841796875, 0.71697998046875, 0.8055419921875, 0.89410400390625, 0.982666015625, 1.07122802734375, 1.1597900390625, 1.24835205078125, 1.3369140625, 1.42547607421875, 1.5140380859375, 1.60260009765625, 1.691162109375, 1.77972412109375, 1.8682861328125, 1.95684814453125, 2.04541015625, 2.13397216796875, 2.2225341796875, 2.31109619140625, 2.399658203125, 2.48822021484375, 2.5767822265625, 2.66534423828125, 2.75390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 2.0, 6.0, 4.0, 9.0, 10.0, 12.0, 22.0, 30.0, 25.0, 46.0, 53.0, 107.0, 147.0, 325.0, 581.0, 1227.0, 3315.0, 10866.0, 57432.0, 463366.0, 441005.0, 53723.0, 10544.0, 3150.0, 1226.0, 564.0, 255.0, 154.0, 93.0, 80.0, 43.0, 28.0, 21.0, 12.0, 9.0, 11.0, 14.0, 11.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.162109375, -1.1268768310546875, -1.091644287109375, -1.0564117431640625, -1.02117919921875, -0.9859466552734375, -0.950714111328125, -0.9154815673828125, -0.8802490234375, -0.8450164794921875, -0.809783935546875, -0.7745513916015625, -0.73931884765625, -0.7040863037109375, -0.668853759765625, -0.6336212158203125, -0.598388671875, -0.5631561279296875, -0.527923583984375, -0.4926910400390625, -0.45745849609375, -0.4222259521484375, -0.386993408203125, -0.3517608642578125, -0.3165283203125, -0.2812957763671875, -0.246063232421875, -0.2108306884765625, -0.17559814453125, -0.1403656005859375, -0.105133056640625, -0.0699005126953125, -0.03466796875, 0.0005645751953125, 0.035797119140625, 0.0710296630859375, 0.10626220703125, 0.1414947509765625, 0.176727294921875, 0.2119598388671875, 0.2471923828125, 0.2824249267578125, 0.317657470703125, 0.3528900146484375, 0.38812255859375, 0.4233551025390625, 0.458587646484375, 0.4938201904296875, 0.529052734375, 0.5642852783203125, 0.599517822265625, 0.6347503662109375, 0.66998291015625, 0.7052154541015625, 0.740447998046875, 0.7756805419921875, 0.8109130859375, 0.8461456298828125, 0.881378173828125, 0.9166107177734375, 0.95184326171875, 0.9870758056640625, 1.022308349609375, 1.0575408935546875, 1.0927734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 11.0, 26.0, 29.0, 41.0, 57.0, 82.0, 119.0, 117.0, 128.0, 100.0, 85.0, 50.0, 48.0, 38.0, 21.0, 15.0, 7.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015497207641601562, -0.00014901533722877502, -0.00014305859804153442, -0.00013710185885429382, -0.00013114511966705322, -0.00012518838047981262, -0.00011923164129257202, -0.00011327490210533142, -0.00010731816291809082, -0.00010136142373085022, -9.540468454360962e-05, -8.944794535636902e-05, -8.349120616912842e-05, -7.753446698188782e-05, -7.157772779464722e-05, -6.562098860740662e-05, -5.9664249420166016e-05, -5.3707510232925415e-05, -4.7750771045684814e-05, -4.1794031858444214e-05, -3.583729267120361e-05, -2.9880553483963013e-05, -2.3923814296722412e-05, -1.796707510948181e-05, -1.2010335922241211e-05, -6.05359673500061e-06, -9.685754776000977e-08, 5.859881639480591e-06, 1.1816620826721191e-05, 1.7773360013961792e-05, 2.3730099201202393e-05, 2.9686838388442993e-05, 3.5643577575683594e-05, 4.1600316762924194e-05, 4.7557055950164795e-05, 5.3513795137405396e-05, 5.9470534324645996e-05, 6.54272735118866e-05, 7.13840126991272e-05, 7.73407518863678e-05, 8.32974910736084e-05, 8.9254230260849e-05, 9.52109694480896e-05, 0.0001011677086353302, 0.0001071244478225708, 0.0001130811870098114, 0.000119037926197052, 0.0001249946653842926, 0.0001309514045715332, 0.0001369081437587738, 0.0001428648829460144, 0.000148821622133255, 0.0001547783613204956, 0.0001607351005077362, 0.0001666918396949768, 0.0001726485788822174, 0.000178605318069458, 0.0001845620572566986, 0.0001905187964439392, 0.0001964755356311798, 0.0002024322748184204, 0.000208389014005661, 0.0002143457531929016, 0.0002203024923801422, 0.0002262592315673828]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 8.0, 13.0, 9.0, 19.0, 27.0, 38.0, 79.0, 108.0, 203.0, 385.0, 755.0, 1784.0, 5576.0, 27873.0, 318046.0, 623948.0, 56176.0, 8884.0, 2552.0, 982.0, 477.0, 225.0, 131.0, 78.0, 57.0, 28.0, 32.0, 10.0, 9.0, 3.0, 8.0, 6.0, 6.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.66015625, -1.612945556640625, -1.56573486328125, -1.518524169921875, -1.4713134765625, -1.424102783203125, -1.37689208984375, -1.329681396484375, -1.282470703125, -1.235260009765625, -1.18804931640625, -1.140838623046875, -1.0936279296875, -1.046417236328125, -0.99920654296875, -0.951995849609375, -0.90478515625, -0.857574462890625, -0.81036376953125, -0.763153076171875, -0.7159423828125, -0.668731689453125, -0.62152099609375, -0.574310302734375, -0.527099609375, -0.479888916015625, -0.43267822265625, -0.385467529296875, -0.3382568359375, -0.291046142578125, -0.24383544921875, -0.196624755859375, -0.1494140625, -0.102203369140625, -0.05499267578125, -0.007781982421875, 0.0394287109375, 0.086639404296875, 0.13385009765625, 0.181060791015625, 0.228271484375, 0.275482177734375, 0.32269287109375, 0.369903564453125, 0.4171142578125, 0.464324951171875, 0.51153564453125, 0.558746337890625, 0.60595703125, 0.653167724609375, 0.70037841796875, 0.747589111328125, 0.7947998046875, 0.842010498046875, 0.88922119140625, 0.936431884765625, 0.983642578125, 1.030853271484375, 1.07806396484375, 1.125274658203125, 1.1724853515625, 1.219696044921875, 1.26690673828125, 1.314117431640625, 1.361328125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 15.0, 12.0, 31.0, 35.0, 61.0, 75.0, 91.0, 112.0, 117.0, 90.0, 89.0, 65.0, 55.0, 44.0, 32.0, 23.0, 10.0, 5.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4404296875, -1.4019317626953125, -1.363433837890625, -1.3249359130859375, -1.28643798828125, -1.2479400634765625, -1.209442138671875, -1.1709442138671875, -1.1324462890625, -1.0939483642578125, -1.055450439453125, -1.0169525146484375, -0.97845458984375, -0.9399566650390625, -0.901458740234375, -0.8629608154296875, -0.824462890625, -0.7859649658203125, -0.747467041015625, -0.7089691162109375, -0.67047119140625, -0.6319732666015625, -0.593475341796875, -0.5549774169921875, -0.5164794921875, -0.4779815673828125, -0.439483642578125, -0.4009857177734375, -0.36248779296875, -0.3239898681640625, -0.285491943359375, -0.2469940185546875, -0.20849609375, -0.1699981689453125, -0.131500244140625, -0.0930023193359375, -0.05450439453125, -0.0160064697265625, 0.022491455078125, 0.0609893798828125, 0.0994873046875, 0.1379852294921875, 0.176483154296875, 0.2149810791015625, 0.25347900390625, 0.2919769287109375, 0.330474853515625, 0.3689727783203125, 0.407470703125, 0.4459686279296875, 0.484466552734375, 0.5229644775390625, 0.56146240234375, 0.5999603271484375, 0.638458251953125, 0.6769561767578125, 0.7154541015625, 0.7539520263671875, 0.792449951171875, 0.8309478759765625, 0.86944580078125, 0.9079437255859375, 0.946441650390625, 0.9849395751953125, 1.0234375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 18.0, 130.0, 506.0, 292.0, 44.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.57118225097656, -49.567386627197266, -47.56359100341797, -45.55979919433594, -43.55600357055664, -41.552207946777344, -39.54841613769531, -37.544620513916016, -35.54082489013672, -33.53702926635742, -31.533235549926758, -29.529441833496094, -27.525646209716797, -25.5218505859375, -23.518056869506836, -21.514263153076172, -19.510467529296875, -17.506671905517578, -15.502878189086914, -13.499083518981934, -11.495288848876953, -9.491494178771973, -7.487699508666992, -5.483904838562012, -3.4801101684570312, -1.4763154983520508, 0.5274791717529297, 2.53127384185791, 4.535068511962891, 6.538863182067871, 8.542657852172852, 10.546452522277832, 12.550247192382812, 14.554041862487793, 16.557836532592773, 18.561630249023438, 20.565425872802734, 22.56922149658203, 24.573015213012695, 26.57680892944336, 28.580604553222656, 30.584400177001953, 32.58819580078125, 34.59198760986328, 36.59578323364258, 38.599578857421875, 40.603370666503906, 42.6071662902832, 44.6109619140625, 46.6147575378418, 48.618553161621094, 50.622344970703125, 52.62614059448242, 54.62993621826172, 56.63372802734375, 58.63752365112305, 60.641319274902344, 62.64511489868164, 64.64891052246094, 66.65270233154297, 68.656494140625, 70.66029357910156, 72.6640853881836, 74.66788482666016, 76.67167663574219]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 7.0, 7.0, 6.0, 13.0, 15.0, 11.0, 21.0, 23.0, 20.0, 31.0, 28.0, 35.0, 37.0, 34.0, 44.0, 43.0, 51.0, 44.0, 57.0, 45.0, 45.0, 45.0, 46.0, 43.0, 35.0, 31.0, 28.0, 28.0, 27.0, 22.0, 12.0, 11.0, 16.0, 11.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.364089965820312, -13.83922004699707, -13.314350128173828, -12.789480209350586, -12.26461124420166, -11.739741325378418, -11.214871406555176, -10.690001487731934, -10.165132522583008, -9.640262603759766, -9.115392684936523, -8.590522766113281, -8.065653800964355, -7.540783882141113, -7.015913963317871, -6.491044044494629, -5.966174125671387, -5.4413042068481445, -4.9164347648620605, -4.391564846038818, -3.8666951656341553, -3.341825485229492, -2.81695556640625, -2.292085886001587, -1.7672162055969238, -1.2423465251922607, -0.7174767255783081, -0.19260692596435547, 0.3322627544403076, 0.8571324348449707, 1.382002353668213, 1.906872034072876, 2.431741714477539, 2.956611394882202, 3.4814810752868652, 4.006350994110107, 4.531220436096191, 5.056090354919434, 5.580960273742676, 6.105830192565918, 6.630699634552002, 7.155569553375244, 7.680438995361328, 8.20530891418457, 8.730178833007812, 9.255048751831055, 9.779918670654297, 10.304787635803223, 10.829657554626465, 11.354527473449707, 11.87939739227295, 12.404266357421875, 12.929136276245117, 13.45400619506836, 13.978876113891602, 14.503746032714844, 15.028615951538086, 15.553485870361328, 16.07835578918457, 16.603225708007812, 17.128095626831055, 17.652965545654297, 18.177833557128906, 18.70270347595215, 19.22757339477539]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 6.0, 2.0, 9.0, 8.0, 16.0, 17.0, 25.0, 24.0, 36.0, 79.0, 137.0, 248.0, 532.0, 1229.0, 3773.0, 19922.0, 3547816.0, 600984.0, 14576.0, 3012.0, 1001.0, 410.0, 188.0, 89.0, 59.0, 25.0, 17.0, 13.0, 9.0, 9.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.5748291015625, -6.391845703125, -6.2088623046875, -6.02587890625, -5.8428955078125, -5.659912109375, -5.4769287109375, -5.2939453125, -5.1109619140625, -4.927978515625, -4.7449951171875, -4.56201171875, -4.3790283203125, -4.196044921875, -4.0130615234375, -3.830078125, -3.6470947265625, -3.464111328125, -3.2811279296875, -3.09814453125, -2.9151611328125, -2.732177734375, -2.5491943359375, -2.3662109375, -2.1832275390625, -2.000244140625, -1.8172607421875, -1.63427734375, -1.4512939453125, -1.268310546875, -1.0853271484375, -0.90234375, -0.7193603515625, -0.536376953125, -0.3533935546875, -0.17041015625, 0.0125732421875, 0.195556640625, 0.3785400390625, 0.5615234375, 0.7445068359375, 0.927490234375, 1.1104736328125, 1.29345703125, 1.4764404296875, 1.659423828125, 1.8424072265625, 2.025390625, 2.2083740234375, 2.391357421875, 2.5743408203125, 2.75732421875, 2.9403076171875, 3.123291015625, 3.3062744140625, 3.4892578125, 3.6722412109375, 3.855224609375, 4.0382080078125, 4.22119140625, 4.4041748046875, 4.587158203125, 4.7701416015625, 4.953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 5.0, 9.0, 21.0, 19.0, 33.0, 44.0, 64.0, 83.0, 95.0, 91.0, 109.0, 104.0, 87.0, 67.0, 49.0, 31.0, 27.0, 21.0, 9.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.3860549926757812, -1.3521881103515625, -1.3183212280273438, -1.284454345703125, -1.2505874633789062, -1.2167205810546875, -1.1828536987304688, -1.14898681640625, -1.1151199340820312, -1.0812530517578125, -1.0473861694335938, -1.013519287109375, -0.9796524047851562, -0.9457855224609375, -0.9119186401367188, -0.8780517578125, -0.8441848754882812, -0.8103179931640625, -0.7764511108398438, -0.742584228515625, -0.7087173461914062, -0.6748504638671875, -0.6409835815429688, -0.60711669921875, -0.5732498168945312, -0.5393829345703125, -0.5055160522460938, -0.471649169921875, -0.43778228759765625, -0.4039154052734375, -0.37004852294921875, -0.336181640625, -0.30231475830078125, -0.2684478759765625, -0.23458099365234375, -0.200714111328125, -0.16684722900390625, -0.1329803466796875, -0.09911346435546875, -0.06524658203125, -0.03137969970703125, 0.0024871826171875, 0.03635406494140625, 0.070220947265625, 0.10408782958984375, 0.1379547119140625, 0.17182159423828125, 0.2056884765625, 0.23955535888671875, 0.2734222412109375, 0.30728912353515625, 0.341156005859375, 0.37502288818359375, 0.4088897705078125, 0.44275665283203125, 0.47662353515625, 0.5104904174804688, 0.5443572998046875, 0.5782241821289062, 0.612091064453125, 0.6459579467773438, 0.6798248291015625, 0.7136917114257812, 0.74755859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 9.0, 17.0, 50.0, 106.0, 278.0, 1898.0, 3307880.0, 882084.0, 1558.0, 260.0, 93.0, 31.0, 14.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.7308349609375, -15.305419921875, -14.8800048828125, -14.45458984375, -14.0291748046875, -13.603759765625, -13.1783447265625, -12.7529296875, -12.3275146484375, -11.902099609375, -11.4766845703125, -11.05126953125, -10.6258544921875, -10.200439453125, -9.7750244140625, -9.349609375, -8.9241943359375, -8.498779296875, -8.0733642578125, -7.64794921875, -7.2225341796875, -6.797119140625, -6.3717041015625, -5.9462890625, -5.5208740234375, -5.095458984375, -4.6700439453125, -4.24462890625, -3.8192138671875, -3.393798828125, -2.9683837890625, -2.54296875, -2.1175537109375, -1.692138671875, -1.2667236328125, -0.84130859375, -0.4158935546875, 0.009521484375, 0.4349365234375, 0.8603515625, 1.2857666015625, 1.711181640625, 2.1365966796875, 2.56201171875, 2.9874267578125, 3.412841796875, 3.8382568359375, 4.263671875, 4.6890869140625, 5.114501953125, 5.5399169921875, 5.96533203125, 6.3907470703125, 6.816162109375, 7.2415771484375, 7.6669921875, 8.0924072265625, 8.517822265625, 8.9432373046875, 9.36865234375, 9.7940673828125, 10.219482421875, 10.6448974609375, 11.0703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 13.0, 11.0, 10.0, 31.0, 74.0, 167.0, 643.0, 2587.0, 346.0, 96.0, 49.0, 23.0, 12.0, 10.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0546875, -2.0037384033203125, -1.952789306640625, -1.9018402099609375, -1.85089111328125, -1.7999420166015625, -1.748992919921875, -1.6980438232421875, -1.6470947265625, -1.5961456298828125, -1.545196533203125, -1.4942474365234375, -1.44329833984375, -1.3923492431640625, -1.341400146484375, -1.2904510498046875, -1.239501953125, -1.1885528564453125, -1.137603759765625, -1.0866546630859375, -1.03570556640625, -0.9847564697265625, -0.933807373046875, -0.8828582763671875, -0.8319091796875, -0.7809600830078125, -0.730010986328125, -0.6790618896484375, -0.62811279296875, -0.5771636962890625, -0.526214599609375, -0.4752655029296875, -0.42431640625, -0.3733673095703125, -0.322418212890625, -0.2714691162109375, -0.22052001953125, -0.1695709228515625, -0.118621826171875, -0.0676727294921875, -0.0167236328125, 0.0342254638671875, 0.085174560546875, 0.1361236572265625, 0.18707275390625, 0.2380218505859375, 0.288970947265625, 0.3399200439453125, 0.390869140625, 0.4418182373046875, 0.492767333984375, 0.5437164306640625, 0.59466552734375, 0.6456146240234375, 0.696563720703125, 0.7475128173828125, 0.7984619140625, 0.8494110107421875, 0.900360107421875, 0.9513092041015625, 1.00225830078125, 1.0532073974609375, 1.104156494140625, 1.1551055908203125, 1.2060546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 12.0, 518.0, 460.0, 15.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.212550163269043, -9.362979888916016, -8.513410568237305, -7.6638407707214355, -6.814270973205566, -5.964701175689697, -5.115131378173828, -4.265561580657959, -3.41599178314209, -2.5664219856262207, -1.7168521881103516, -0.8672823905944824, -0.01771259307861328, 0.8318572044372559, 1.681427001953125, 2.530996799468994, 3.3805665969848633, 4.230136394500732, 5.079706192016602, 5.929275989532471, 6.77884578704834, 7.628415584564209, 8.477985382080078, 9.327554702758789, 10.177124977111816, 11.026695251464844, 11.876264572143555, 12.725833892822266, 13.575404167175293, 14.42497444152832, 15.274543762207031, 16.124113082885742, 16.973682403564453, 17.823251724243164, 18.672821044921875, 19.52239227294922, 20.37196159362793, 21.22153091430664, 22.071102142333984, 22.920671463012695, 23.770240783691406, 24.619810104370117, 25.469379425048828, 26.318950653076172, 27.168519973754883, 28.018089294433594, 28.867660522460938, 29.71722984313965, 30.56679916381836, 31.41636848449707, 32.26593780517578, 33.115509033203125, 33.96508026123047, 34.81464767456055, 35.66421890258789, 36.51378631591797, 37.36335754394531, 38.212928771972656, 39.062496185302734, 39.91206741333008, 40.761634826660156, 41.6112060546875, 42.460777282714844, 43.31034469604492, 44.159915924072266]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 10.0, 6.0, 4.0, 11.0, 11.0, 18.0, 22.0, 31.0, 31.0, 32.0, 37.0, 45.0, 63.0, 60.0, 66.0, 56.0, 57.0, 72.0, 50.0, 53.0, 38.0, 48.0, 41.0, 32.0, 33.0, 14.0, 20.0, 15.0, 11.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3960537910461426, -2.3008692264556885, -2.2056846618652344, -2.1105000972747803, -2.015315532684326, -1.920130968093872, -1.8249462842941284, -1.7297617197036743, -1.6345771551132202, -1.5393925905227661, -1.444208025932312, -1.3490233421325684, -1.2538387775421143, -1.1586542129516602, -1.063469648361206, -0.968285083770752, -0.8731005191802979, -0.7779159545898438, -0.6827313899993896, -0.5875467658042908, -0.49236220121383667, -0.39717763662338257, -0.3019930124282837, -0.2068084478378296, -0.11162388324737549, -0.016439303755760193, 0.0787452757358551, 0.1739298701286316, 0.2691144347190857, 0.3642989993095398, 0.45948362350463867, 0.5546681880950928, 0.6498527526855469, 0.745037317276001, 0.8402218818664551, 0.935406506061554, 1.0305910110473633, 1.1257755756378174, 1.220960259437561, 1.3161448240280151, 1.4113293886184692, 1.5065139532089233, 1.6016985177993774, 1.696883201599121, 1.7920677661895752, 1.8872523307800293, 1.9824368953704834, 2.0776214599609375, 2.1728060245513916, 2.2679905891418457, 2.3631751537323, 2.458359718322754, 2.553544282913208, 2.648728847503662, 2.7439136505126953, 2.8390979766845703, 2.9342827796936035, 3.0294673442840576, 3.1246519088745117, 3.219836473464966, 3.31502103805542, 3.410205602645874, 3.505390167236328, 3.6005749702453613, 3.6957592964172363]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 6.0, 7.0, 15.0, 13.0, 26.0, 37.0, 50.0, 68.0, 134.0, 232.0, 405.0, 816.0, 1930.0, 4959.0, 19236.0, 144040.0, 688339.0, 158474.0, 20680.0, 5266.0, 1890.0, 890.0, 437.0, 227.0, 128.0, 101.0, 35.0, 36.0, 23.0, 18.0, 6.0, 9.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.62890625, -5.489990234375, -5.35107421875, -5.212158203125, -5.0732421875, -4.934326171875, -4.79541015625, -4.656494140625, -4.517578125, -4.378662109375, -4.23974609375, -4.100830078125, -3.9619140625, -3.822998046875, -3.68408203125, -3.545166015625, -3.40625, -3.267333984375, -3.12841796875, -2.989501953125, -2.8505859375, -2.711669921875, -2.57275390625, -2.433837890625, -2.294921875, -2.156005859375, -2.01708984375, -1.878173828125, -1.7392578125, -1.600341796875, -1.46142578125, -1.322509765625, -1.18359375, -1.044677734375, -0.90576171875, -0.766845703125, -0.6279296875, -0.489013671875, -0.35009765625, -0.211181640625, -0.072265625, 0.066650390625, 0.20556640625, 0.344482421875, 0.4833984375, 0.622314453125, 0.76123046875, 0.900146484375, 1.0390625, 1.177978515625, 1.31689453125, 1.455810546875, 1.5947265625, 1.733642578125, 1.87255859375, 2.011474609375, 2.150390625, 2.289306640625, 2.42822265625, 2.567138671875, 2.7060546875, 2.844970703125, 2.98388671875, 3.122802734375, 3.26171875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 9.0, 12.0, 9.0, 21.0, 33.0, 39.0, 70.0, 79.0, 98.0, 96.0, 110.0, 98.0, 73.0, 81.0, 59.0, 29.0, 24.0, 20.0, 13.0, 4.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3818359375, -1.3481826782226562, -1.3145294189453125, -1.2808761596679688, -1.247222900390625, -1.2135696411132812, -1.1799163818359375, -1.1462631225585938, -1.11260986328125, -1.0789566040039062, -1.0453033447265625, -1.0116500854492188, -0.977996826171875, -0.9443435668945312, -0.9106903076171875, -0.8770370483398438, -0.8433837890625, -0.8097305297851562, -0.7760772705078125, -0.7424240112304688, -0.708770751953125, -0.6751174926757812, -0.6414642333984375, -0.6078109741210938, -0.57415771484375, -0.5405044555664062, -0.5068511962890625, -0.47319793701171875, -0.439544677734375, -0.40589141845703125, -0.3722381591796875, -0.33858489990234375, -0.304931640625, -0.27127838134765625, -0.2376251220703125, -0.20397186279296875, -0.170318603515625, -0.13666534423828125, -0.1030120849609375, -0.06935882568359375, -0.03570556640625, -0.00205230712890625, 0.0316009521484375, 0.06525421142578125, 0.098907470703125, 0.13256072998046875, 0.1662139892578125, 0.19986724853515625, 0.2335205078125, 0.26717376708984375, 0.3008270263671875, 0.33448028564453125, 0.368133544921875, 0.40178680419921875, 0.4354400634765625, 0.46909332275390625, 0.50274658203125, 0.5363998413085938, 0.5700531005859375, 0.6037063598632812, 0.637359619140625, 0.6710128784179688, 0.7046661376953125, 0.7383193969726562, 0.77197265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 10.0, 16.0, 15.0, 29.0, 50.0, 72.0, 113.0, 181.0, 273.0, 547.0, 963.0, 2129.0, 6073.0, 24498.0, 143951.0, 616633.0, 207437.0, 32683.0, 7732.0, 2630.0, 1101.0, 552.0, 349.0, 172.0, 118.0, 67.0, 44.0, 38.0, 29.0, 15.0, 11.0, 7.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.10546875, -2.992919921875, -2.88037109375, -2.767822265625, -2.6552734375, -2.542724609375, -2.43017578125, -2.317626953125, -2.205078125, -2.092529296875, -1.97998046875, -1.867431640625, -1.7548828125, -1.642333984375, -1.52978515625, -1.417236328125, -1.3046875, -1.192138671875, -1.07958984375, -0.967041015625, -0.8544921875, -0.741943359375, -0.62939453125, -0.516845703125, -0.404296875, -0.291748046875, -0.17919921875, -0.066650390625, 0.0458984375, 0.158447265625, 0.27099609375, 0.383544921875, 0.49609375, 0.608642578125, 0.72119140625, 0.833740234375, 0.9462890625, 1.058837890625, 1.17138671875, 1.283935546875, 1.396484375, 1.509033203125, 1.62158203125, 1.734130859375, 1.8466796875, 1.959228515625, 2.07177734375, 2.184326171875, 2.296875, 2.409423828125, 2.52197265625, 2.634521484375, 2.7470703125, 2.859619140625, 2.97216796875, 3.084716796875, 3.197265625, 3.309814453125, 3.42236328125, 3.534912109375, 3.6474609375, 3.760009765625, 3.87255859375, 3.985107421875, 4.09765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 6.0, 6.0, 7.0, 6.0, 10.0, 13.0, 13.0, 11.0, 20.0, 14.0, 20.0, 18.0, 29.0, 39.0, 29.0, 31.0, 45.0, 49.0, 50.0, 58.0, 47.0, 56.0, 51.0, 46.0, 38.0, 37.0, 35.0, 34.0, 32.0, 36.0, 21.0, 15.0, 14.0, 22.0, 8.0, 10.0, 6.0, 7.0, 2.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.548828125, -2.461334228515625, -2.37384033203125, -2.286346435546875, -2.1988525390625, -2.111358642578125, -2.02386474609375, -1.936370849609375, -1.848876953125, -1.761383056640625, -1.67388916015625, -1.586395263671875, -1.4989013671875, -1.411407470703125, -1.32391357421875, -1.236419677734375, -1.14892578125, -1.061431884765625, -0.97393798828125, -0.886444091796875, -0.7989501953125, -0.711456298828125, -0.62396240234375, -0.536468505859375, -0.448974609375, -0.361480712890625, -0.27398681640625, -0.186492919921875, -0.0989990234375, -0.011505126953125, 0.07598876953125, 0.163482666015625, 0.2509765625, 0.338470458984375, 0.42596435546875, 0.513458251953125, 0.6009521484375, 0.688446044921875, 0.77593994140625, 0.863433837890625, 0.950927734375, 1.038421630859375, 1.12591552734375, 1.213409423828125, 1.3009033203125, 1.388397216796875, 1.47589111328125, 1.563385009765625, 1.65087890625, 1.738372802734375, 1.82586669921875, 1.913360595703125, 2.0008544921875, 2.088348388671875, 2.17584228515625, 2.263336181640625, 2.350830078125, 2.438323974609375, 2.52581787109375, 2.613311767578125, 2.7008056640625, 2.788299560546875, 2.87579345703125, 2.963287353515625, 3.05078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0, 9.0, 13.0, 26.0, 37.0, 41.0, 96.0, 157.0, 366.0, 790.0, 2815.0, 16173.0, 354999.0, 640611.0, 26679.0, 3848.0, 1044.0, 386.0, 186.0, 117.0, 54.0, 30.0, 26.0, 13.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9619140625, -1.904388427734375, -1.84686279296875, -1.789337158203125, -1.7318115234375, -1.674285888671875, -1.61676025390625, -1.559234619140625, -1.501708984375, -1.444183349609375, -1.38665771484375, -1.329132080078125, -1.2716064453125, -1.214080810546875, -1.15655517578125, -1.099029541015625, -1.04150390625, -0.983978271484375, -0.92645263671875, -0.868927001953125, -0.8114013671875, -0.753875732421875, -0.69635009765625, -0.638824462890625, -0.581298828125, -0.523773193359375, -0.46624755859375, -0.408721923828125, -0.3511962890625, -0.293670654296875, -0.23614501953125, -0.178619384765625, -0.12109375, -0.063568115234375, -0.00604248046875, 0.051483154296875, 0.1090087890625, 0.166534423828125, 0.22406005859375, 0.281585693359375, 0.339111328125, 0.396636962890625, 0.45416259765625, 0.511688232421875, 0.5692138671875, 0.626739501953125, 0.68426513671875, 0.741790771484375, 0.79931640625, 0.856842041015625, 0.91436767578125, 0.971893310546875, 1.0294189453125, 1.086944580078125, 1.14447021484375, 1.201995849609375, 1.259521484375, 1.317047119140625, 1.37457275390625, 1.432098388671875, 1.4896240234375, 1.547149658203125, 1.60467529296875, 1.662200927734375, 1.7197265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 9.0, 8.0, 25.0, 34.0, 50.0, 67.0, 82.0, 111.0, 122.0, 129.0, 95.0, 67.0, 48.0, 32.0, 25.0, 19.0, 13.0, 10.0, 6.0, 9.0, 4.0, 1.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017189979553222656, -0.0001661144196987152, -0.00016032904386520386, -0.0001545436680316925, -0.00014875829219818115, -0.0001429729163646698, -0.00013718754053115845, -0.0001314021646976471, -0.00012561678886413574, -0.00011983141303062439, -0.00011404603719711304, -0.00010826066136360168, -0.00010247528553009033, -9.668990969657898e-05, -9.090453386306763e-05, -8.511915802955627e-05, -7.933378219604492e-05, -7.354840636253357e-05, -6.776303052902222e-05, -6.197765469551086e-05, -5.619227886199951e-05, -5.040690302848816e-05, -4.462152719497681e-05, -3.8836151361465454e-05, -3.30507755279541e-05, -2.726539969444275e-05, -2.1480023860931396e-05, -1.5694648027420044e-05, -9.909272193908691e-06, -4.123896360397339e-06, 1.6614794731140137e-06, 7.446855306625366e-06, 1.3232231140136719e-05, 1.901760697364807e-05, 2.4802982807159424e-05, 3.0588358640670776e-05, 3.637373447418213e-05, 4.215911030769348e-05, 4.7944486141204834e-05, 5.3729861974716187e-05, 5.951523780822754e-05, 6.530061364173889e-05, 7.108598947525024e-05, 7.68713653087616e-05, 8.265674114227295e-05, 8.84421169757843e-05, 9.422749280929565e-05, 0.00010001286864280701, 0.00010579824447631836, 0.00011158362030982971, 0.00011736899614334106, 0.00012315437197685242, 0.00012893974781036377, 0.00013472512364387512, 0.00014051049947738647, 0.00014629587531089783, 0.00015208125114440918, 0.00015786662697792053, 0.00016365200281143188, 0.00016943737864494324, 0.0001752227544784546, 0.00018100813031196594, 0.0001867935061454773, 0.00019257888197898865, 0.0001983642578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 17.0, 16.0, 21.0, 37.0, 74.0, 141.0, 292.0, 661.0, 1834.0, 7117.0, 56242.0, 774291.0, 188644.0, 14389.0, 2976.0, 975.0, 397.0, 172.0, 87.0, 54.0, 30.0, 23.0, 19.0, 12.0, 6.0, 3.0, 0.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7822265625, -1.730865478515625, -1.67950439453125, -1.628143310546875, -1.5767822265625, -1.525421142578125, -1.47406005859375, -1.422698974609375, -1.371337890625, -1.319976806640625, -1.26861572265625, -1.217254638671875, -1.1658935546875, -1.114532470703125, -1.06317138671875, -1.011810302734375, -0.96044921875, -0.909088134765625, -0.85772705078125, -0.806365966796875, -0.7550048828125, -0.703643798828125, -0.65228271484375, -0.600921630859375, -0.549560546875, -0.498199462890625, -0.44683837890625, -0.395477294921875, -0.3441162109375, -0.292755126953125, -0.24139404296875, -0.190032958984375, -0.138671875, -0.087310791015625, -0.03594970703125, 0.015411376953125, 0.0667724609375, 0.118133544921875, 0.16949462890625, 0.220855712890625, 0.272216796875, 0.323577880859375, 0.37493896484375, 0.426300048828125, 0.4776611328125, 0.529022216796875, 0.58038330078125, 0.631744384765625, 0.68310546875, 0.734466552734375, 0.78582763671875, 0.837188720703125, 0.8885498046875, 0.939910888671875, 0.99127197265625, 1.042633056640625, 1.093994140625, 1.145355224609375, 1.19671630859375, 1.248077392578125, 1.2994384765625, 1.350799560546875, 1.40216064453125, 1.453521728515625, 1.5048828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 8.0, 8.0, 13.0, 20.0, 28.0, 49.0, 54.0, 86.0, 74.0, 89.0, 106.0, 121.0, 93.0, 70.0, 46.0, 30.0, 23.0, 18.0, 11.0, 16.0, 5.0, 7.0, 9.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2119140625, -1.1795578002929688, -1.1472015380859375, -1.1148452758789062, -1.082489013671875, -1.0501327514648438, -1.0177764892578125, -0.9854202270507812, -0.95306396484375, -0.9207077026367188, -0.8883514404296875, -0.8559951782226562, -0.823638916015625, -0.7912826538085938, -0.7589263916015625, -0.7265701293945312, -0.6942138671875, -0.6618576049804688, -0.6295013427734375, -0.5971450805664062, -0.564788818359375, -0.5324325561523438, -0.5000762939453125, -0.46772003173828125, -0.43536376953125, -0.40300750732421875, -0.3706512451171875, -0.33829498291015625, -0.305938720703125, -0.27358245849609375, -0.2412261962890625, -0.20886993408203125, -0.176513671875, -0.14415740966796875, -0.1118011474609375, -0.07944488525390625, -0.047088623046875, -0.01473236083984375, 0.0176239013671875, 0.04998016357421875, 0.08233642578125, 0.11469268798828125, 0.1470489501953125, 0.17940521240234375, 0.211761474609375, 0.24411773681640625, 0.2764739990234375, 0.30883026123046875, 0.3411865234375, 0.37354278564453125, 0.4058990478515625, 0.43825531005859375, 0.470611572265625, 0.5029678344726562, 0.5353240966796875, 0.5676803588867188, 0.60003662109375, 0.6323928833007812, 0.6647491455078125, 0.6971054077148438, 0.729461669921875, 0.7618179321289062, 0.7941741943359375, 0.8265304565429688, 0.85888671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 6.0, 13.0, 27.0, 31.0, 77.0, 140.0, 224.0, 213.0, 144.0, 66.0, 28.0, 13.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.208221435546875, -15.436664581298828, -14.665107727050781, -13.893550872802734, -13.121994018554688, -12.35043716430664, -11.57888126373291, -10.807324409484863, -10.035767555236816, -9.26421070098877, -8.492653846740723, -7.721097469329834, -6.949540615081787, -6.17798376083374, -5.406427383422852, -4.634870529174805, -3.863313674926758, -3.091756820678711, -2.320200204849243, -1.5486435890197754, -0.7770867347717285, -0.005529880523681641, 0.766026496887207, 1.537583351135254, 2.309140205383301, 3.0806970596313477, 3.8522536754608154, 4.623810291290283, 5.39536714553833, 6.166923999786377, 6.938480377197266, 7.7100372314453125, 8.48159408569336, 9.253150939941406, 10.024707794189453, 10.7962646484375, 11.567821502685547, 12.339378356933594, 13.110934257507324, 13.882491111755371, 14.654047966003418, 15.425604820251465, 16.197160720825195, 16.968717575073242, 17.74027442932129, 18.511831283569336, 19.283388137817383, 20.05494499206543, 20.826501846313477, 21.598058700561523, 22.36961555480957, 23.141172409057617, 23.912729263305664, 24.68428611755371, 25.455841064453125, 26.227397918701172, 26.99895477294922, 27.770511627197266, 28.542068481445312, 29.31362533569336, 30.085182189941406, 30.856739044189453, 31.6282958984375, 32.39985275268555, 33.171409606933594]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 6.0, 4.0, 5.0, 6.0, 9.0, 9.0, 16.0, 15.0, 25.0, 26.0, 33.0, 36.0, 41.0, 45.0, 59.0, 63.0, 74.0, 57.0, 59.0, 75.0, 53.0, 47.0, 40.0, 32.0, 30.0, 31.0, 23.0, 15.0, 22.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.58616065979004, -20.995849609375, -20.40553855895996, -19.815227508544922, -19.224918365478516, -18.634607315063477, -18.044296264648438, -17.4539852142334, -16.86367416381836, -16.27336311340332, -15.683052062988281, -15.092741966247559, -14.50243091583252, -13.91211986541748, -13.321809768676758, -12.731498718261719, -12.14118766784668, -11.55087661743164, -10.960565567016602, -10.370255470275879, -9.77994441986084, -9.1896333694458, -8.599323272705078, -8.009012222290039, -7.418701171875, -6.828390121459961, -6.23807954788208, -5.647768974304199, -5.05745792388916, -4.467146873474121, -3.8768362998962402, -3.2865257263183594, -2.6962127685546875, -2.1059019565582275, -1.5155911445617676, -0.9252803325653076, -0.33496952056884766, 0.2553412914276123, 0.8456521034240723, 1.4359626770019531, 2.026273727416992, 2.616584539413452, 3.206895351409912, 3.797206163406372, 4.387516975402832, 4.977828025817871, 5.568138599395752, 6.158449172973633, 6.748760223388672, 7.339071273803711, 7.929381847381592, 8.519692420959473, 9.110003471374512, 9.70031452178955, 10.290624618530273, 10.880935668945312, 11.471246719360352, 12.06155776977539, 12.65186882019043, 13.242178916931152, 13.832489967346191, 14.42280101776123, 15.013111114501953, 15.603422164916992, 16.19373321533203]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 10.0, 9.0, 16.0, 17.0, 18.0, 31.0, 29.0, 59.0, 101.0, 176.0, 306.0, 774.0, 2050.0, 7481.0, 90553.0, 4018341.0, 65049.0, 6191.0, 1724.0, 691.0, 309.0, 136.0, 74.0, 41.0, 28.0, 18.0, 9.0, 8.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.75390625, -7.54119873046875, -7.3284912109375, -7.11578369140625, -6.903076171875, -6.69036865234375, -6.4776611328125, -6.26495361328125, -6.05224609375, -5.83953857421875, -5.6268310546875, -5.41412353515625, -5.201416015625, -4.98870849609375, -4.7760009765625, -4.56329345703125, -4.3505859375, -4.13787841796875, -3.9251708984375, -3.71246337890625, -3.499755859375, -3.28704833984375, -3.0743408203125, -2.86163330078125, -2.64892578125, -2.43621826171875, -2.2235107421875, -2.01080322265625, -1.798095703125, -1.58538818359375, -1.3726806640625, -1.15997314453125, -0.947265625, -0.73455810546875, -0.5218505859375, -0.30914306640625, -0.096435546875, 0.11627197265625, 0.3289794921875, 0.54168701171875, 0.75439453125, 0.96710205078125, 1.1798095703125, 1.39251708984375, 1.605224609375, 1.81793212890625, 2.0306396484375, 2.24334716796875, 2.4560546875, 2.66876220703125, 2.8814697265625, 3.09417724609375, 3.306884765625, 3.51959228515625, 3.7322998046875, 3.94500732421875, 4.15771484375, 4.37042236328125, 4.5831298828125, 4.79583740234375, 5.008544921875, 5.22125244140625, 5.4339599609375, 5.64666748046875, 5.859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 10.0, 17.0, 27.0, 27.0, 39.0, 61.0, 79.0, 121.0, 86.0, 97.0, 106.0, 75.0, 72.0, 47.0, 51.0, 23.0, 11.0, 14.0, 13.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.3112640380859375, -1.276824951171875, -1.2423858642578125, -1.20794677734375, -1.1735076904296875, -1.139068603515625, -1.1046295166015625, -1.0701904296875, -1.0357513427734375, -1.001312255859375, -0.9668731689453125, -0.93243408203125, -0.8979949951171875, -0.863555908203125, -0.8291168212890625, -0.794677734375, -0.7602386474609375, -0.725799560546875, -0.6913604736328125, -0.65692138671875, -0.6224822998046875, -0.588043212890625, -0.5536041259765625, -0.5191650390625, -0.4847259521484375, -0.450286865234375, -0.4158477783203125, -0.38140869140625, -0.3469696044921875, -0.312530517578125, -0.2780914306640625, -0.24365234375, -0.2092132568359375, -0.174774169921875, -0.1403350830078125, -0.10589599609375, -0.0714569091796875, -0.037017822265625, -0.0025787353515625, 0.0318603515625, 0.0662994384765625, 0.100738525390625, 0.1351776123046875, 0.16961669921875, 0.2040557861328125, 0.238494873046875, 0.2729339599609375, 0.307373046875, 0.3418121337890625, 0.376251220703125, 0.4106903076171875, 0.44512939453125, 0.4795684814453125, 0.514007568359375, 0.5484466552734375, 0.5828857421875, 0.6173248291015625, 0.651763916015625, 0.6862030029296875, 0.72064208984375, 0.7550811767578125, 0.789520263671875, 0.8239593505859375, 0.8583984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 13.0, 22.0, 30.0, 30.0, 119.0, 372.0, 1700.0, 15994.0, 4003164.0, 166520.0, 4945.0, 865.0, 287.0, 101.0, 34.0, 27.0, 18.0, 12.0, 9.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.49249267578125, -5.1998291015625, -4.90716552734375, -4.614501953125, -4.32183837890625, -4.0291748046875, -3.73651123046875, -3.44384765625, -3.15118408203125, -2.8585205078125, -2.56585693359375, -2.273193359375, -1.98052978515625, -1.6878662109375, -1.39520263671875, -1.1025390625, -0.80987548828125, -0.5172119140625, -0.22454833984375, 0.068115234375, 0.36077880859375, 0.6534423828125, 0.94610595703125, 1.23876953125, 1.53143310546875, 1.8240966796875, 2.11676025390625, 2.409423828125, 2.70208740234375, 2.9947509765625, 3.28741455078125, 3.580078125, 3.87274169921875, 4.1654052734375, 4.45806884765625, 4.750732421875, 5.04339599609375, 5.3360595703125, 5.62872314453125, 5.92138671875, 6.21405029296875, 6.5067138671875, 6.79937744140625, 7.092041015625, 7.38470458984375, 7.6773681640625, 7.97003173828125, 8.2626953125, 8.55535888671875, 8.8480224609375, 9.14068603515625, 9.433349609375, 9.72601318359375, 10.0186767578125, 10.31134033203125, 10.60400390625, 10.89666748046875, 11.1893310546875, 11.48199462890625, 11.774658203125, 12.06732177734375, 12.3599853515625, 12.65264892578125, 12.9453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 8.0, 12.0, 18.0, 16.0, 35.0, 52.0, 65.0, 175.0, 371.0, 1626.0, 1045.0, 327.0, 136.0, 77.0, 34.0, 14.0, 16.0, 9.0, 11.0, 9.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.5036163330078125, -1.447662353515625, -1.3917083740234375, -1.33575439453125, -1.2798004150390625, -1.223846435546875, -1.1678924560546875, -1.1119384765625, -1.0559844970703125, -1.000030517578125, -0.9440765380859375, -0.88812255859375, -0.8321685791015625, -0.776214599609375, -0.7202606201171875, -0.664306640625, -0.6083526611328125, -0.552398681640625, -0.4964447021484375, -0.44049072265625, -0.3845367431640625, -0.328582763671875, -0.2726287841796875, -0.2166748046875, -0.1607208251953125, -0.104766845703125, -0.0488128662109375, 0.00714111328125, 0.0630950927734375, 0.119049072265625, 0.1750030517578125, 0.23095703125, 0.2869110107421875, 0.342864990234375, 0.3988189697265625, 0.45477294921875, 0.5107269287109375, 0.566680908203125, 0.6226348876953125, 0.6785888671875, 0.7345428466796875, 0.790496826171875, 0.8464508056640625, 0.90240478515625, 0.9583587646484375, 1.014312744140625, 1.0702667236328125, 1.126220703125, 1.1821746826171875, 1.238128662109375, 1.2940826416015625, 1.35003662109375, 1.4059906005859375, 1.461944580078125, 1.5178985595703125, 1.5738525390625, 1.6298065185546875, 1.685760498046875, 1.7417144775390625, 1.79766845703125, 1.8536224365234375, 1.909576416015625, 1.9655303955078125, 2.021484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 23.0, 96.0, 409.0, 352.0, 91.0, 14.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.163129806518555, -25.474000930786133, -24.78487205505371, -24.095741271972656, -23.406612396240234, -22.717483520507812, -22.02835464477539, -21.33922576904297, -20.650096893310547, -19.960968017578125, -19.271839141845703, -18.58271026611328, -17.893579483032227, -17.204450607299805, -16.515321731567383, -15.826192855834961, -15.137062072753906, -14.447933197021484, -13.758803367614746, -13.069674491882324, -12.380544662475586, -11.691415786743164, -11.002286911010742, -10.31315803527832, -9.624028205871582, -8.93489933013916, -8.245769500732422, -7.556640625, -6.86751127243042, -6.17838191986084, -5.489253044128418, -4.800123691558838, -4.110992431640625, -3.421863079071045, -2.732733964920044, -2.043604850769043, -1.354475498199463, -0.6653461456298828, 0.023782730102539062, 0.7129120826721191, 1.4020414352416992, 2.0911707878112793, 2.7802999019622803, 3.4694290161132812, 4.158558368682861, 4.847687721252441, 5.536816596984863, 6.225945949554443, 6.915075302124023, 7.6042046546936035, 8.293334007263184, 8.982462882995605, 9.671592712402344, 10.360721588134766, 11.049850463867188, 11.73897933959961, 12.428109169006348, 13.11723804473877, 13.806367874145508, 14.49549674987793, 15.184625625610352, 15.87375545501709, 16.562885284423828, 17.25201416015625, 17.941143035888672]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 16.0, 18.0, 29.0, 30.0, 36.0, 52.0, 66.0, 79.0, 91.0, 81.0, 73.0, 76.0, 72.0, 66.0, 53.0, 43.0, 29.0, 23.0, 19.0, 12.0, 11.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.126326084136963, -5.882452964782715, -5.638579845428467, -5.394706726074219, -5.150833606719971, -4.906960487365723, -4.663087368011475, -4.419214248657227, -4.1753411293029785, -3.9314680099487305, -3.6875948905944824, -3.4437217712402344, -3.1998486518859863, -2.9559755325317383, -2.7121024131774902, -2.468229293823242, -2.224356174468994, -1.980483055114746, -1.736609935760498, -1.49273681640625, -1.248863697052002, -1.004990577697754, -0.7611174583435059, -0.5172443389892578, -0.27337121963500977, -0.02949810028076172, 0.21437501907348633, 0.4582481384277344, 0.7021212577819824, 0.9459943771362305, 1.1898674964904785, 1.4337406158447266, 1.6776142120361328, 1.9214873313903809, 2.165360450744629, 2.409233570098877, 2.653106689453125, 2.896979808807373, 3.140852928161621, 3.384726047515869, 3.628599166870117, 3.8724722862243652, 4.116345405578613, 4.360218524932861, 4.604091644287109, 4.847964763641357, 5.0918378829956055, 5.3357110023498535, 5.579584121704102, 5.82345724105835, 6.067330360412598, 6.311203479766846, 6.555076599121094, 6.798949718475342, 7.04282283782959, 7.286695957183838, 7.530569076538086, 7.774442195892334, 8.018315315246582, 8.262187957763672, 8.506061553955078, 8.749935150146484, 8.993807792663574, 9.237680435180664, 9.48155403137207]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 8.0, 14.0, 11.0, 19.0, 26.0, 40.0, 48.0, 73.0, 79.0, 104.0, 177.0, 265.0, 365.0, 544.0, 1065.0, 1701.0, 3519.0, 8426.0, 28388.0, 142199.0, 565145.0, 232258.0, 42645.0, 11630.0, 4495.0, 2157.0, 1125.0, 737.0, 354.0, 285.0, 187.0, 123.0, 89.0, 66.0, 52.0, 28.0, 29.0, 16.0, 21.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-3.587890625, -3.47796630859375, -3.3680419921875, -3.25811767578125, -3.148193359375, -3.03826904296875, -2.9283447265625, -2.81842041015625, -2.70849609375, -2.59857177734375, -2.4886474609375, -2.37872314453125, -2.268798828125, -2.15887451171875, -2.0489501953125, -1.93902587890625, -1.8291015625, -1.71917724609375, -1.6092529296875, -1.49932861328125, -1.389404296875, -1.27947998046875, -1.1695556640625, -1.05963134765625, -0.94970703125, -0.83978271484375, -0.7298583984375, -0.61993408203125, -0.510009765625, -0.40008544921875, -0.2901611328125, -0.18023681640625, -0.0703125, 0.03961181640625, 0.1495361328125, 0.25946044921875, 0.369384765625, 0.47930908203125, 0.5892333984375, 0.69915771484375, 0.80908203125, 0.91900634765625, 1.0289306640625, 1.13885498046875, 1.248779296875, 1.35870361328125, 1.4686279296875, 1.57855224609375, 1.6884765625, 1.79840087890625, 1.9083251953125, 2.01824951171875, 2.128173828125, 2.23809814453125, 2.3480224609375, 2.45794677734375, 2.56787109375, 2.67779541015625, 2.7877197265625, 2.89764404296875, 3.007568359375, 3.11749267578125, 3.2274169921875, 3.33734130859375, 3.447265625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 14.0, 18.0, 19.0, 36.0, 34.0, 53.0, 77.0, 101.0, 104.0, 93.0, 93.0, 86.0, 69.0, 48.0, 37.0, 34.0, 20.0, 16.0, 5.0, 8.0, 4.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09375, -1.0618057250976562, -1.0298614501953125, -0.9979171752929688, -0.965972900390625, -0.9340286254882812, -0.9020843505859375, -0.8701400756835938, -0.83819580078125, -0.8062515258789062, -0.7743072509765625, -0.7423629760742188, -0.710418701171875, -0.6784744262695312, -0.6465301513671875, -0.6145858764648438, -0.5826416015625, -0.5506973266601562, -0.5187530517578125, -0.48680877685546875, -0.454864501953125, -0.42292022705078125, -0.3909759521484375, -0.35903167724609375, -0.32708740234375, -0.29514312744140625, -0.2631988525390625, -0.23125457763671875, -0.199310302734375, -0.16736602783203125, -0.1354217529296875, -0.10347747802734375, -0.071533203125, -0.03958892822265625, -0.0076446533203125, 0.02429962158203125, 0.056243896484375, 0.08818817138671875, 0.1201324462890625, 0.15207672119140625, 0.18402099609375, 0.21596527099609375, 0.2479095458984375, 0.27985382080078125, 0.311798095703125, 0.34374237060546875, 0.3756866455078125, 0.40763092041015625, 0.4395751953125, 0.47151947021484375, 0.5034637451171875, 0.5354080200195312, 0.567352294921875, 0.5992965698242188, 0.6312408447265625, 0.6631851196289062, 0.69512939453125, 0.7270736694335938, 0.7590179443359375, 0.7909622192382812, 0.822906494140625, 0.8548507690429688, 0.8867950439453125, 0.9187393188476562, 0.95068359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 3.0, 8.0, 8.0, 13.0, 18.0, 27.0, 39.0, 66.0, 88.0, 119.0, 228.0, 425.0, 809.0, 1545.0, 3461.0, 10395.0, 39503.0, 190236.0, 546540.0, 196814.0, 40625.0, 10655.0, 3600.0, 1560.0, 752.0, 399.0, 212.0, 143.0, 90.0, 56.0, 32.0, 25.0, 19.0, 12.0, 7.0, 14.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.576629638671875, -2.47943115234375, -2.382232666015625, -2.2850341796875, -2.187835693359375, -2.09063720703125, -1.993438720703125, -1.896240234375, -1.799041748046875, -1.70184326171875, -1.604644775390625, -1.5074462890625, -1.410247802734375, -1.31304931640625, -1.215850830078125, -1.11865234375, -1.021453857421875, -0.92425537109375, -0.827056884765625, -0.7298583984375, -0.632659912109375, -0.53546142578125, -0.438262939453125, -0.341064453125, -0.243865966796875, -0.14666748046875, -0.049468994140625, 0.0477294921875, 0.144927978515625, 0.24212646484375, 0.339324951171875, 0.4365234375, 0.533721923828125, 0.63092041015625, 0.728118896484375, 0.8253173828125, 0.922515869140625, 1.01971435546875, 1.116912841796875, 1.214111328125, 1.311309814453125, 1.40850830078125, 1.505706787109375, 1.6029052734375, 1.700103759765625, 1.79730224609375, 1.894500732421875, 1.99169921875, 2.088897705078125, 2.18609619140625, 2.283294677734375, 2.3804931640625, 2.477691650390625, 2.57489013671875, 2.672088623046875, 2.769287109375, 2.866485595703125, 2.96368408203125, 3.060882568359375, 3.1580810546875, 3.255279541015625, 3.35247802734375, 3.449676513671875, 3.546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 13.0, 8.0, 7.0, 16.0, 16.0, 18.0, 12.0, 22.0, 27.0, 34.0, 32.0, 36.0, 44.0, 41.0, 45.0, 42.0, 47.0, 40.0, 37.0, 38.0, 48.0, 34.0, 44.0, 34.0, 31.0, 31.0, 33.0, 28.0, 18.0, 23.0, 14.0, 15.0, 17.0, 9.0, 9.0, 7.0, 8.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.51953125, -2.4354248046875, -2.351318359375, -2.2672119140625, -2.18310546875, -2.0989990234375, -2.014892578125, -1.9307861328125, -1.8466796875, -1.7625732421875, -1.678466796875, -1.5943603515625, -1.51025390625, -1.4261474609375, -1.342041015625, -1.2579345703125, -1.173828125, -1.0897216796875, -1.005615234375, -0.9215087890625, -0.83740234375, -0.7532958984375, -0.669189453125, -0.5850830078125, -0.5009765625, -0.4168701171875, -0.332763671875, -0.2486572265625, -0.16455078125, -0.0804443359375, 0.003662109375, 0.0877685546875, 0.171875, 0.2559814453125, 0.340087890625, 0.4241943359375, 0.50830078125, 0.5924072265625, 0.676513671875, 0.7606201171875, 0.8447265625, 0.9288330078125, 1.012939453125, 1.0970458984375, 1.18115234375, 1.2652587890625, 1.349365234375, 1.4334716796875, 1.517578125, 1.6016845703125, 1.685791015625, 1.7698974609375, 1.85400390625, 1.9381103515625, 2.022216796875, 2.1063232421875, 2.1904296875, 2.2745361328125, 2.358642578125, 2.4427490234375, 2.52685546875, 2.6109619140625, 2.695068359375, 2.7791748046875, 2.86328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 2.0, 6.0, 7.0, 12.0, 10.0, 21.0, 32.0, 45.0, 88.0, 145.0, 337.0, 769.0, 2519.0, 13318.0, 182368.0, 778226.0, 60888.0, 7067.0, 1647.0, 541.0, 220.0, 110.0, 54.0, 43.0, 25.0, 11.0, 11.0, 6.0, 9.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7255859375, -1.6704864501953125, -1.615386962890625, -1.5602874755859375, -1.50518798828125, -1.4500885009765625, -1.394989013671875, -1.3398895263671875, -1.2847900390625, -1.2296905517578125, -1.174591064453125, -1.1194915771484375, -1.06439208984375, -1.0092926025390625, -0.954193115234375, -0.8990936279296875, -0.843994140625, -0.7888946533203125, -0.733795166015625, -0.6786956787109375, -0.62359619140625, -0.5684967041015625, -0.513397216796875, -0.4582977294921875, -0.4031982421875, -0.3480987548828125, -0.292999267578125, -0.2378997802734375, -0.18280029296875, -0.1277008056640625, -0.072601318359375, -0.0175018310546875, 0.03759765625, 0.0926971435546875, 0.147796630859375, 0.2028961181640625, 0.25799560546875, 0.3130950927734375, 0.368194580078125, 0.4232940673828125, 0.4783935546875, 0.5334930419921875, 0.588592529296875, 0.6436920166015625, 0.69879150390625, 0.7538909912109375, 0.808990478515625, 0.8640899658203125, 0.919189453125, 0.9742889404296875, 1.029388427734375, 1.0844879150390625, 1.13958740234375, 1.1946868896484375, 1.249786376953125, 1.3048858642578125, 1.3599853515625, 1.4150848388671875, 1.470184326171875, 1.5252838134765625, 1.58038330078125, 1.6354827880859375, 1.690582275390625, 1.7456817626953125, 1.80078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 7.0, 9.0, 10.0, 22.0, 21.0, 34.0, 51.0, 48.0, 68.0, 95.0, 97.0, 110.0, 94.0, 66.0, 66.0, 38.0, 32.0, 25.0, 22.0, 19.0, 10.0, 7.0, 7.0, 8.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012421607971191406, -0.00011980906128883362, -0.00011540204286575317, -0.00011099502444267273, -0.00010658800601959229, -0.00010218098759651184, -9.77739691734314e-05, -9.336695075035095e-05, -8.895993232727051e-05, -8.455291390419006e-05, -8.014589548110962e-05, -7.573887705802917e-05, -7.133185863494873e-05, -6.692484021186829e-05, -6.251782178878784e-05, -5.81108033657074e-05, -5.370378494262695e-05, -4.929676651954651e-05, -4.4889748096466064e-05, -4.048272967338562e-05, -3.6075711250305176e-05, -3.166869282722473e-05, -2.7261674404144287e-05, -2.2854655981063843e-05, -1.84476375579834e-05, -1.4040619134902954e-05, -9.63360071182251e-06, -5.2265822887420654e-06, -8.195638656616211e-07, 3.5874545574188232e-06, 7.994472980499268e-06, 1.2401491403579712e-05, 1.6808509826660156e-05, 2.12155282497406e-05, 2.5622546672821045e-05, 3.002956509590149e-05, 3.4436583518981934e-05, 3.884360194206238e-05, 4.325062036514282e-05, 4.7657638788223267e-05, 5.206465721130371e-05, 5.6471675634384155e-05, 6.08786940574646e-05, 6.528571248054504e-05, 6.969273090362549e-05, 7.409974932670593e-05, 7.850676774978638e-05, 8.291378617286682e-05, 8.732080459594727e-05, 9.172782301902771e-05, 9.613484144210815e-05, 0.0001005418598651886, 0.00010494887828826904, 0.00010935589671134949, 0.00011376291513442993, 0.00011816993355751038, 0.00012257695198059082, 0.00012698397040367126, 0.0001313909888267517, 0.00013579800724983215, 0.0001402050256729126, 0.00014461204409599304, 0.00014901906251907349, 0.00015342608094215393, 0.00015783309936523438]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 6.0, 5.0, 13.0, 9.0, 30.0, 51.0, 73.0, 135.0, 244.0, 540.0, 1432.0, 4979.0, 31034.0, 497536.0, 475465.0, 29827.0, 4676.0, 1398.0, 566.0, 236.0, 107.0, 72.0, 51.0, 28.0, 16.0, 5.0, 6.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9794921875, -1.92999267578125, -1.8804931640625, -1.83099365234375, -1.781494140625, -1.73199462890625, -1.6824951171875, -1.63299560546875, -1.58349609375, -1.53399658203125, -1.4844970703125, -1.43499755859375, -1.385498046875, -1.33599853515625, -1.2864990234375, -1.23699951171875, -1.1875, -1.13800048828125, -1.0885009765625, -1.03900146484375, -0.989501953125, -0.94000244140625, -0.8905029296875, -0.84100341796875, -0.79150390625, -0.74200439453125, -0.6925048828125, -0.64300537109375, -0.593505859375, -0.54400634765625, -0.4945068359375, -0.44500732421875, -0.3955078125, -0.34600830078125, -0.2965087890625, -0.24700927734375, -0.197509765625, -0.14801025390625, -0.0985107421875, -0.04901123046875, 0.00048828125, 0.04998779296875, 0.0994873046875, 0.14898681640625, 0.198486328125, 0.24798583984375, 0.2974853515625, 0.34698486328125, 0.396484375, 0.44598388671875, 0.4954833984375, 0.54498291015625, 0.594482421875, 0.64398193359375, 0.6934814453125, 0.74298095703125, 0.79248046875, 0.84197998046875, 0.8914794921875, 0.94097900390625, 0.990478515625, 1.03997802734375, 1.0894775390625, 1.13897705078125, 1.1884765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 14.0, 12.0, 19.0, 35.0, 42.0, 69.0, 78.0, 104.0, 134.0, 112.0, 115.0, 77.0, 59.0, 39.0, 24.0, 15.0, 14.0, 12.0, 7.0, 6.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.28515625, -1.24609375, -1.20703125, -1.16796875, -1.12890625, -1.08984375, -1.05078125, -1.01171875, -0.97265625, -0.93359375, -0.89453125, -0.85546875, -0.81640625, -0.77734375, -0.73828125, -0.69921875, -0.66015625, -0.62109375, -0.58203125, -0.54296875, -0.50390625, -0.46484375, -0.42578125, -0.38671875, -0.34765625, -0.30859375, -0.26953125, -0.23046875, -0.19140625, -0.15234375, -0.11328125, -0.07421875, -0.03515625, 0.00390625, 0.04296875, 0.08203125, 0.12109375, 0.16015625, 0.19921875, 0.23828125, 0.27734375, 0.31640625, 0.35546875, 0.39453125, 0.43359375, 0.47265625, 0.51171875, 0.55078125, 0.58984375, 0.62890625, 0.66796875, 0.70703125, 0.74609375, 0.78515625, 0.82421875, 0.86328125, 0.90234375, 0.94140625, 0.98046875, 1.01953125, 1.05859375, 1.09765625, 1.13671875, 1.17578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 12.0, 14.0, 31.0, 62.0, 119.0, 185.0, 229.0, 163.0, 83.0, 41.0, 23.0, 12.0, 12.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.986242294311523, -21.236927032470703, -20.487613677978516, -19.738300323486328, -18.988985061645508, -18.239669799804688, -17.4903564453125, -16.741043090820312, -15.991727828979492, -15.242413520812988, -14.493099212646484, -13.74378490447998, -12.994470596313477, -12.245156288146973, -11.495841979980469, -10.746527671813965, -9.997213363647461, -9.247899055480957, -8.498584747314453, -7.749270439147949, -6.999956130981445, -6.250641822814941, -5.5013275146484375, -4.752013206481934, -4.00269889831543, -3.253384590148926, -2.504070281982422, -1.754755973815918, -1.005441665649414, -0.25612735748291016, 0.49318695068359375, 1.2425012588500977, 1.9918174743652344, 2.7411317825317383, 3.490446090698242, 4.239760398864746, 4.98907470703125, 5.738389015197754, 6.487703323364258, 7.237017631530762, 7.986331939697266, 8.73564624786377, 9.484960556030273, 10.234274864196777, 10.983589172363281, 11.732903480529785, 12.482217788696289, 13.231532096862793, 13.980846405029297, 14.7301607131958, 15.479475021362305, 16.228790283203125, 16.978103637695312, 17.7274169921875, 18.47673225402832, 19.22604751586914, 19.975360870361328, 20.724674224853516, 21.473989486694336, 22.223304748535156, 22.972618103027344, 23.72193145751953, 24.47124671936035, 25.220561981201172, 25.96987533569336]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 6.0, 7.0, 12.0, 16.0, 14.0, 13.0, 24.0, 30.0, 34.0, 29.0, 37.0, 47.0, 44.0, 50.0, 57.0, 61.0, 56.0, 48.0, 65.0, 55.0, 45.0, 41.0, 41.0, 32.0, 32.0, 27.0, 14.0, 12.0, 14.0, 8.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.992145538330078, -18.393766403198242, -17.795387268066406, -17.19700813293457, -16.598628997802734, -16.00025177001953, -15.401871681213379, -14.80349349975586, -14.205114364624023, -13.606735229492188, -13.008356094360352, -12.409976959228516, -11.811598777770996, -11.21321964263916, -10.614840507507324, -10.016462326049805, -9.418082237243652, -8.819703102111816, -8.22132396697998, -7.622945308685303, -7.024566650390625, -6.426187515258789, -5.827808380126953, -5.229429721832275, -4.6310505867004395, -4.0326714515686035, -3.434292793273926, -2.83591365814209, -2.237534761428833, -1.6391558647155762, -1.0407767295837402, -0.4423980712890625, 0.15598106384277344, 0.754360020160675, 1.3527389764785767, 1.951117992401123, 2.54949688911438, 3.1478757858276367, 3.7462549209594727, 4.34463357925415, 4.943012714385986, 5.541391849517822, 6.1397705078125, 6.738149642944336, 7.336528778076172, 7.93490743637085, 8.533287048339844, 9.131665229797363, 9.7300443649292, 10.328423500061035, 10.926802635192871, 11.52518081665039, 12.123559951782227, 12.721939086914062, 13.320318222045898, 13.918697357177734, 14.51707649230957, 15.115455627441406, 15.713834762573242, 16.312213897705078, 16.910593032836914, 17.50897216796875, 18.107349395751953, 18.70572853088379, 19.304107666015625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 14.0, 11.0, 11.0, 14.0, 24.0, 38.0, 66.0, 99.0, 132.0, 319.0, 592.0, 1338.0, 3634.0, 17272.0, 313272.0, 3808762.0, 38905.0, 6181.0, 1871.0, 801.0, 391.0, 204.0, 111.0, 68.0, 36.0, 37.0, 16.0, 18.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.62890625, -4.49737548828125, -4.3658447265625, -4.23431396484375, -4.102783203125, -3.97125244140625, -3.8397216796875, -3.70819091796875, -3.57666015625, -3.44512939453125, -3.3135986328125, -3.18206787109375, -3.050537109375, -2.91900634765625, -2.7874755859375, -2.65594482421875, -2.5244140625, -2.39288330078125, -2.2613525390625, -2.12982177734375, -1.998291015625, -1.86676025390625, -1.7352294921875, -1.60369873046875, -1.47216796875, -1.34063720703125, -1.2091064453125, -1.07757568359375, -0.946044921875, -0.81451416015625, -0.6829833984375, -0.55145263671875, -0.419921875, -0.28839111328125, -0.1568603515625, -0.02532958984375, 0.106201171875, 0.23773193359375, 0.3692626953125, 0.50079345703125, 0.63232421875, 0.76385498046875, 0.8953857421875, 1.02691650390625, 1.158447265625, 1.28997802734375, 1.4215087890625, 1.55303955078125, 1.6845703125, 1.81610107421875, 1.9476318359375, 2.07916259765625, 2.210693359375, 2.34222412109375, 2.4737548828125, 2.60528564453125, 2.73681640625, 2.86834716796875, 2.9998779296875, 3.13140869140625, 3.262939453125, 3.39447021484375, 3.5260009765625, 3.65753173828125, 3.7890625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 6.0, 12.0, 15.0, 23.0, 28.0, 39.0, 44.0, 67.0, 79.0, 73.0, 102.0, 77.0, 75.0, 74.0, 65.0, 52.0, 46.0, 20.0, 24.0, 23.0, 9.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.034942626953125, -1.00347900390625, -0.972015380859375, -0.9405517578125, -0.909088134765625, -0.87762451171875, -0.846160888671875, -0.814697265625, -0.783233642578125, -0.75177001953125, -0.720306396484375, -0.6888427734375, -0.657379150390625, -0.62591552734375, -0.594451904296875, -0.56298828125, -0.531524658203125, -0.50006103515625, -0.468597412109375, -0.4371337890625, -0.405670166015625, -0.37420654296875, -0.342742919921875, -0.311279296875, -0.279815673828125, -0.24835205078125, -0.216888427734375, -0.1854248046875, -0.153961181640625, -0.12249755859375, -0.091033935546875, -0.0595703125, -0.028106689453125, 0.00335693359375, 0.034820556640625, 0.0662841796875, 0.097747802734375, 0.12921142578125, 0.160675048828125, 0.192138671875, 0.223602294921875, 0.25506591796875, 0.286529541015625, 0.3179931640625, 0.349456787109375, 0.38092041015625, 0.412384033203125, 0.44384765625, 0.475311279296875, 0.50677490234375, 0.538238525390625, 0.5697021484375, 0.601165771484375, 0.63262939453125, 0.664093017578125, 0.695556640625, 0.727020263671875, 0.75848388671875, 0.789947509765625, 0.8214111328125, 0.852874755859375, 0.88433837890625, 0.915802001953125, 0.947265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 3.0, 8.0, 6.0, 10.0, 19.0, 45.0, 68.0, 158.0, 471.0, 1493.0, 6184.0, 40551.0, 2933109.0, 1171860.0, 32812.0, 5310.0, 1386.0, 448.0, 175.0, 59.0, 30.0, 25.0, 17.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.0748291015625, -3.958251953125, -3.8416748046875, -3.72509765625, -3.6085205078125, -3.491943359375, -3.3753662109375, -3.2587890625, -3.1422119140625, -3.025634765625, -2.9090576171875, -2.79248046875, -2.6759033203125, -2.559326171875, -2.4427490234375, -2.326171875, -2.2095947265625, -2.093017578125, -1.9764404296875, -1.85986328125, -1.7432861328125, -1.626708984375, -1.5101318359375, -1.3935546875, -1.2769775390625, -1.160400390625, -1.0438232421875, -0.92724609375, -0.8106689453125, -0.694091796875, -0.5775146484375, -0.4609375, -0.3443603515625, -0.227783203125, -0.1112060546875, 0.00537109375, 0.1219482421875, 0.238525390625, 0.3551025390625, 0.4716796875, 0.5882568359375, 0.704833984375, 0.8214111328125, 0.93798828125, 1.0545654296875, 1.171142578125, 1.2877197265625, 1.404296875, 1.5208740234375, 1.637451171875, 1.7540283203125, 1.87060546875, 1.9871826171875, 2.103759765625, 2.2203369140625, 2.3369140625, 2.4534912109375, 2.570068359375, 2.6866455078125, 2.80322265625, 2.9197998046875, 3.036376953125, 3.1529541015625, 3.26953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 8.0, 9.0, 16.0, 24.0, 24.0, 32.0, 69.0, 90.0, 137.0, 240.0, 627.0, 1625.0, 541.0, 226.0, 120.0, 91.0, 37.0, 26.0, 28.0, 32.0, 14.0, 5.0, 12.0, 3.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74658203125, -0.7212371826171875, -0.695892333984375, -0.6705474853515625, -0.64520263671875, -0.6198577880859375, -0.594512939453125, -0.5691680908203125, -0.5438232421875, -0.5184783935546875, -0.493133544921875, -0.4677886962890625, -0.44244384765625, -0.4170989990234375, -0.391754150390625, -0.3664093017578125, -0.341064453125, -0.3157196044921875, -0.290374755859375, -0.2650299072265625, -0.23968505859375, -0.2143402099609375, -0.188995361328125, -0.1636505126953125, -0.1383056640625, -0.1129608154296875, -0.087615966796875, -0.0622711181640625, -0.03692626953125, -0.0115814208984375, 0.013763427734375, 0.0391082763671875, 0.064453125, 0.0897979736328125, 0.115142822265625, 0.1404876708984375, 0.16583251953125, 0.1911773681640625, 0.216522216796875, 0.2418670654296875, 0.2672119140625, 0.2925567626953125, 0.317901611328125, 0.3432464599609375, 0.36859130859375, 0.3939361572265625, 0.419281005859375, 0.4446258544921875, 0.469970703125, 0.4953155517578125, 0.520660400390625, 0.5460052490234375, 0.57135009765625, 0.5966949462890625, 0.622039794921875, 0.6473846435546875, 0.6727294921875, 0.6980743408203125, 0.723419189453125, 0.7487640380859375, 0.77410888671875, 0.7994537353515625, 0.824798583984375, 0.8501434326171875, 0.87548828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 12.0, 42.0, 138.0, 304.0, 295.0, 154.0, 43.0, 10.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9529218673706055, -3.622502088546753, -3.2920823097229004, -2.9616622924804688, -2.631242513656616, -2.3008227348327637, -1.9704028367996216, -1.6399829387664795, -1.309563159942627, -0.9791433215141296, -0.6487234830856323, -0.318303644657135, 0.012116193771362305, 0.34253597259521484, 0.6729558706283569, 1.003375768661499, 1.3337955474853516, 1.664215326309204, 1.9946352243423462, 2.3250551223754883, 2.655474901199341, 2.9858946800231934, 3.316314697265625, 3.6467344760894775, 3.97715425491333, 4.307574272155762, 4.637993812561035, 4.968413829803467, 5.298833847045898, 5.629253387451172, 5.9596734046936035, 6.290093421936035, 6.620513916015625, 6.950933933258057, 7.28135347366333, 7.611773490905762, 7.942193031311035, 8.272613525390625, 8.603033065795898, 8.933452606201172, 9.263872146606445, 9.594291687011719, 9.924712181091309, 10.255131721496582, 10.585551261901855, 10.915971755981445, 11.246391296386719, 11.576810836791992, 11.907231330871582, 12.237650871276855, 12.568071365356445, 12.898490905761719, 13.228910446166992, 13.559329986572266, 13.889750480651855, 14.220170021057129, 14.550590515136719, 14.881010055541992, 15.211430549621582, 15.541850090026855, 15.872269630432129, 16.20269012451172, 16.533109664916992, 16.863529205322266, 17.19394874572754]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 4.0, 2.0, 5.0, 7.0, 9.0, 13.0, 16.0, 18.0, 20.0, 15.0, 22.0, 36.0, 34.0, 33.0, 37.0, 47.0, 51.0, 35.0, 52.0, 44.0, 47.0, 51.0, 49.0, 41.0, 30.0, 41.0, 35.0, 37.0, 24.0, 25.0, 29.0, 12.0, 15.0, 16.0, 15.0, 7.0, 9.0, 1.0, 5.0, 4.0, 10.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7082347869873047, -2.6209793090820312, -2.533723831176758, -2.4464683532714844, -2.359212875366211, -2.2719573974609375, -2.184701919555664, -2.0974464416503906, -2.010190963745117, -1.9229354858398438, -1.8356800079345703, -1.7484245300292969, -1.6611690521240234, -1.57391357421875, -1.4866582155227661, -1.3994027376174927, -1.3121473789215088, -1.2248919010162354, -1.137636423110962, -1.0503809452056885, -0.9631255269050598, -0.8758700489997864, -0.7886146306991577, -0.7013591527938843, -0.6141036748886108, -0.5268481969833374, -0.43959274888038635, -0.3523373007774353, -0.26508182287216187, -0.17782634496688843, -0.09057092666625977, -0.003315448760986328, 0.08394002914428711, 0.17119549214839935, 0.2584509551525116, 0.34570640325546265, 0.4329618811607361, 0.5202173590660095, 0.6074727773666382, 0.6947282552719116, 0.7819837331771851, 0.8692392110824585, 0.9564946889877319, 1.0437500476837158, 1.1310055255889893, 1.2182610034942627, 1.3055164813995361, 1.3927719593048096, 1.480027437210083, 1.5672829151153564, 1.6545383930206299, 1.7417938709259033, 1.8290493488311768, 1.9163048267364502, 2.0035600662231445, 2.090815544128418, 2.1780710220336914, 2.265326499938965, 2.3525819778442383, 2.4398374557495117, 2.527092933654785, 2.6143484115600586, 2.701603889465332, 2.7888593673706055, 2.876114845275879]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 9.0, 10.0, 16.0, 30.0, 30.0, 50.0, 79.0, 104.0, 163.0, 233.0, 351.0, 588.0, 1061.0, 2087.0, 4869.0, 14599.0, 63445.0, 412615.0, 452243.0, 69951.0, 15544.0, 5306.0, 2188.0, 1161.0, 627.0, 395.0, 263.0, 153.0, 108.0, 84.0, 41.0, 35.0, 24.0, 25.0, 7.0, 14.0, 10.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.05255126953125, -3.9176025390625, -3.78265380859375, -3.647705078125, -3.51275634765625, -3.3778076171875, -3.24285888671875, -3.10791015625, -2.97296142578125, -2.8380126953125, -2.70306396484375, -2.568115234375, -2.43316650390625, -2.2982177734375, -2.16326904296875, -2.0283203125, -1.89337158203125, -1.7584228515625, -1.62347412109375, -1.488525390625, -1.35357666015625, -1.2186279296875, -1.08367919921875, -0.94873046875, -0.81378173828125, -0.6788330078125, -0.54388427734375, -0.408935546875, -0.27398681640625, -0.1390380859375, -0.00408935546875, 0.130859375, 0.26580810546875, 0.4007568359375, 0.53570556640625, 0.670654296875, 0.80560302734375, 0.9405517578125, 1.07550048828125, 1.21044921875, 1.34539794921875, 1.4803466796875, 1.61529541015625, 1.750244140625, 1.88519287109375, 2.0201416015625, 2.15509033203125, 2.2900390625, 2.42498779296875, 2.5599365234375, 2.69488525390625, 2.829833984375, 2.96478271484375, 3.0997314453125, 3.23468017578125, 3.36962890625, 3.50457763671875, 3.6395263671875, 3.77447509765625, 3.909423828125, 4.04437255859375, 4.1793212890625, 4.31427001953125, 4.44921875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 15.0, 19.0, 26.0, 35.0, 43.0, 59.0, 76.0, 72.0, 100.0, 88.0, 71.0, 88.0, 63.0, 62.0, 42.0, 17.0, 31.0, 13.0, 15.0, 9.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0869140625, -1.0550689697265625, -1.023223876953125, -0.9913787841796875, -0.95953369140625, -0.9276885986328125, -0.895843505859375, -0.8639984130859375, -0.8321533203125, -0.8003082275390625, -0.768463134765625, -0.7366180419921875, -0.70477294921875, -0.6729278564453125, -0.641082763671875, -0.6092376708984375, -0.577392578125, -0.5455474853515625, -0.513702392578125, -0.4818572998046875, -0.45001220703125, -0.4181671142578125, -0.386322021484375, -0.3544769287109375, -0.3226318359375, -0.2907867431640625, -0.258941650390625, -0.2270965576171875, -0.19525146484375, -0.1634063720703125, -0.131561279296875, -0.0997161865234375, -0.06787109375, -0.0360260009765625, -0.004180908203125, 0.0276641845703125, 0.05950927734375, 0.0913543701171875, 0.123199462890625, 0.1550445556640625, 0.1868896484375, 0.2187347412109375, 0.250579833984375, 0.2824249267578125, 0.31427001953125, 0.3461151123046875, 0.377960205078125, 0.4098052978515625, 0.441650390625, 0.4734954833984375, 0.505340576171875, 0.5371856689453125, 0.56903076171875, 0.6008758544921875, 0.632720947265625, 0.6645660400390625, 0.6964111328125, 0.7282562255859375, 0.760101318359375, 0.7919464111328125, 0.82379150390625, 0.8556365966796875, 0.887481689453125, 0.9193267822265625, 0.951171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 9.0, 14.0, 26.0, 27.0, 44.0, 53.0, 66.0, 120.0, 160.0, 239.0, 335.0, 526.0, 859.0, 1509.0, 2835.0, 6117.0, 15182.0, 44225.0, 146206.0, 412249.0, 285795.0, 85430.0, 26980.0, 10021.0, 4231.0, 2114.0, 1123.0, 682.0, 393.0, 309.0, 194.0, 122.0, 104.0, 65.0, 55.0, 40.0, 21.0, 16.0, 14.0, 15.0, 10.0, 7.0, 4.0, 7.0, 1.0, 4.0, 0.0, 1.0], "bins": [-2.5, -2.4301300048828125, -2.360260009765625, -2.2903900146484375, -2.22052001953125, -2.1506500244140625, -2.080780029296875, -2.0109100341796875, -1.9410400390625, -1.8711700439453125, -1.801300048828125, -1.7314300537109375, -1.66156005859375, -1.5916900634765625, -1.521820068359375, -1.4519500732421875, -1.382080078125, -1.3122100830078125, -1.242340087890625, -1.1724700927734375, -1.10260009765625, -1.0327301025390625, -0.962860107421875, -0.8929901123046875, -0.8231201171875, -0.7532501220703125, -0.683380126953125, -0.6135101318359375, -0.54364013671875, -0.4737701416015625, -0.403900146484375, -0.3340301513671875, -0.26416015625, -0.1942901611328125, -0.124420166015625, -0.0545501708984375, 0.01531982421875, 0.0851898193359375, 0.155059814453125, 0.2249298095703125, 0.2947998046875, 0.3646697998046875, 0.434539794921875, 0.5044097900390625, 0.57427978515625, 0.6441497802734375, 0.714019775390625, 0.7838897705078125, 0.853759765625, 0.9236297607421875, 0.993499755859375, 1.0633697509765625, 1.13323974609375, 1.2031097412109375, 1.272979736328125, 1.3428497314453125, 1.4127197265625, 1.4825897216796875, 1.552459716796875, 1.6223297119140625, 1.69219970703125, 1.7620697021484375, 1.831939697265625, 1.9018096923828125, 1.9716796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 4.0, 8.0, 11.0, 11.0, 8.0, 14.0, 15.0, 23.0, 25.0, 28.0, 27.0, 18.0, 39.0, 44.0, 38.0, 32.0, 40.0, 47.0, 57.0, 42.0, 40.0, 47.0, 44.0, 51.0, 45.0, 29.0, 28.0, 27.0, 22.0, 26.0, 18.0, 11.0, 11.0, 11.0, 11.0, 11.0, 8.0, 3.0, 2.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.84375, -2.755615234375, -2.66748046875, -2.579345703125, -2.4912109375, -2.403076171875, -2.31494140625, -2.226806640625, -2.138671875, -2.050537109375, -1.96240234375, -1.874267578125, -1.7861328125, -1.697998046875, -1.60986328125, -1.521728515625, -1.43359375, -1.345458984375, -1.25732421875, -1.169189453125, -1.0810546875, -0.992919921875, -0.90478515625, -0.816650390625, -0.728515625, -0.640380859375, -0.55224609375, -0.464111328125, -0.3759765625, -0.287841796875, -0.19970703125, -0.111572265625, -0.0234375, 0.064697265625, 0.15283203125, 0.240966796875, 0.3291015625, 0.417236328125, 0.50537109375, 0.593505859375, 0.681640625, 0.769775390625, 0.85791015625, 0.946044921875, 1.0341796875, 1.122314453125, 1.21044921875, 1.298583984375, 1.38671875, 1.474853515625, 1.56298828125, 1.651123046875, 1.7392578125, 1.827392578125, 1.91552734375, 2.003662109375, 2.091796875, 2.179931640625, 2.26806640625, 2.356201171875, 2.4443359375, 2.532470703125, 2.62060546875, 2.708740234375, 2.796875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 8.0, 5.0, 22.0, 27.0, 49.0, 103.0, 235.0, 533.0, 1638.0, 8812.0, 147972.0, 825632.0, 56752.0, 4929.0, 1109.0, 378.0, 158.0, 66.0, 45.0, 30.0, 18.0, 15.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3442840576171875, -1.281341552734375, -1.2183990478515625, -1.15545654296875, -1.0925140380859375, -1.029571533203125, -0.9666290283203125, -0.9036865234375, -0.8407440185546875, -0.777801513671875, -0.7148590087890625, -0.65191650390625, -0.5889739990234375, -0.526031494140625, -0.4630889892578125, -0.400146484375, -0.3372039794921875, -0.274261474609375, -0.2113189697265625, -0.14837646484375, -0.0854339599609375, -0.022491455078125, 0.0404510498046875, 0.1033935546875, 0.1663360595703125, 0.229278564453125, 0.2922210693359375, 0.35516357421875, 0.4181060791015625, 0.481048583984375, 0.5439910888671875, 0.60693359375, 0.6698760986328125, 0.732818603515625, 0.7957611083984375, 0.85870361328125, 0.9216461181640625, 0.984588623046875, 1.0475311279296875, 1.1104736328125, 1.1734161376953125, 1.236358642578125, 1.2993011474609375, 1.36224365234375, 1.4251861572265625, 1.488128662109375, 1.5510711669921875, 1.614013671875, 1.6769561767578125, 1.739898681640625, 1.8028411865234375, 1.86578369140625, 1.9287261962890625, 1.991668701171875, 2.0546112060546875, 2.1175537109375, 2.1804962158203125, 2.243438720703125, 2.3063812255859375, 2.36932373046875, 2.4322662353515625, 2.495208740234375, 2.5581512451171875, 2.62109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 8.0, 11.0, 13.0, 12.0, 21.0, 14.0, 25.0, 42.0, 56.0, 65.0, 76.0, 83.0, 105.0, 102.0, 90.0, 63.0, 67.0, 49.0, 27.0, 15.0, 14.0, 8.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017523765563964844, -0.00017056986689567566, -0.00016590207815170288, -0.0001612342894077301, -0.00015656650066375732, -0.00015189871191978455, -0.00014723092317581177, -0.000142563134431839, -0.0001378953456878662, -0.00013322755694389343, -0.00012855976819992065, -0.00012389197945594788, -0.0001192241907119751, -0.00011455640196800232, -0.00010988861322402954, -0.00010522082448005676, -0.00010055303573608398, -9.58852469921112e-05, -9.121745824813843e-05, -8.654966950416565e-05, -8.188188076019287e-05, -7.721409201622009e-05, -7.254630327224731e-05, -6.787851452827454e-05, -6.321072578430176e-05, -5.854293704032898e-05, -5.38751482963562e-05, -4.920735955238342e-05, -4.4539570808410645e-05, -3.9871782064437866e-05, -3.520399332046509e-05, -3.053620457649231e-05, -2.586841583251953e-05, -2.1200627088546753e-05, -1.6532838344573975e-05, -1.1865049600601196e-05, -7.197260856628418e-06, -2.5294721126556396e-06, 2.1383166313171387e-06, 6.806105375289917e-06, 1.1473894119262695e-05, 1.6141682863235474e-05, 2.0809471607208252e-05, 2.547726035118103e-05, 3.014504909515381e-05, 3.481283783912659e-05, 3.9480626583099365e-05, 4.4148415327072144e-05, 4.881620407104492e-05, 5.34839928150177e-05, 5.815178155899048e-05, 6.281957030296326e-05, 6.748735904693604e-05, 7.215514779090881e-05, 7.682293653488159e-05, 8.149072527885437e-05, 8.615851402282715e-05, 9.082630276679993e-05, 9.54940915107727e-05, 0.00010016188025474548, 0.00010482966899871826, 0.00010949745774269104, 0.00011416524648666382, 0.0001188330352306366, 0.00012350082397460938]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 11.0, 9.0, 25.0, 31.0, 54.0, 144.0, 261.0, 654.0, 2105.0, 11771.0, 226951.0, 760295.0, 40058.0, 4334.0, 1095.0, 386.0, 169.0, 82.0, 41.0, 22.0, 13.0, 8.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.677734375, -2.6143341064453125, -2.550933837890625, -2.4875335693359375, -2.42413330078125, -2.3607330322265625, -2.297332763671875, -2.2339324951171875, -2.1705322265625, -2.1071319580078125, -2.043731689453125, -1.9803314208984375, -1.91693115234375, -1.8535308837890625, -1.790130615234375, -1.7267303466796875, -1.663330078125, -1.5999298095703125, -1.536529541015625, -1.4731292724609375, -1.40972900390625, -1.3463287353515625, -1.282928466796875, -1.2195281982421875, -1.1561279296875, -1.0927276611328125, -1.029327392578125, -0.9659271240234375, -0.90252685546875, -0.8391265869140625, -0.775726318359375, -0.7123260498046875, -0.64892578125, -0.5855255126953125, -0.522125244140625, -0.4587249755859375, -0.39532470703125, -0.3319244384765625, -0.268524169921875, -0.2051239013671875, -0.1417236328125, -0.0783233642578125, -0.014923095703125, 0.0484771728515625, 0.11187744140625, 0.1752777099609375, 0.238677978515625, 0.3020782470703125, 0.365478515625, 0.4288787841796875, 0.492279052734375, 0.5556793212890625, 0.61907958984375, 0.6824798583984375, 0.745880126953125, 0.8092803955078125, 0.8726806640625, 0.9360809326171875, 0.999481201171875, 1.0628814697265625, 1.12628173828125, 1.1896820068359375, 1.253082275390625, 1.3164825439453125, 1.3798828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 17.0, 26.0, 44.0, 56.0, 59.0, 92.0, 108.0, 124.0, 119.0, 105.0, 73.0, 54.0, 34.0, 21.0, 15.0, 7.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8310546875, -1.7810821533203125, -1.731109619140625, -1.6811370849609375, -1.63116455078125, -1.5811920166015625, -1.531219482421875, -1.4812469482421875, -1.4312744140625, -1.3813018798828125, -1.331329345703125, -1.2813568115234375, -1.23138427734375, -1.1814117431640625, -1.131439208984375, -1.0814666748046875, -1.031494140625, -0.9815216064453125, -0.931549072265625, -0.8815765380859375, -0.83160400390625, -0.7816314697265625, -0.731658935546875, -0.6816864013671875, -0.6317138671875, -0.5817413330078125, -0.531768798828125, -0.4817962646484375, -0.43182373046875, -0.3818511962890625, -0.331878662109375, -0.2819061279296875, -0.23193359375, -0.1819610595703125, -0.131988525390625, -0.0820159912109375, -0.03204345703125, 0.0179290771484375, 0.067901611328125, 0.1178741455078125, 0.1678466796875, 0.2178192138671875, 0.267791748046875, 0.3177642822265625, 0.36773681640625, 0.4177093505859375, 0.467681884765625, 0.5176544189453125, 0.567626953125, 0.6175994873046875, 0.667572021484375, 0.7175445556640625, 0.76751708984375, 0.8174896240234375, 0.867462158203125, 0.9174346923828125, 0.9674072265625, 1.0173797607421875, 1.067352294921875, 1.1173248291015625, 1.16729736328125, 1.2172698974609375, 1.267242431640625, 1.3172149658203125, 1.3671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 14.0, 14.0, 17.0, 30.0, 83.0, 112.0, 183.0, 184.0, 181.0, 96.0, 40.0, 16.0, 13.0, 7.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.089115142822266, -21.336265563964844, -20.583415985107422, -19.83056640625, -19.077716827392578, -18.324867248535156, -17.572017669677734, -16.81916618347168, -16.066316604614258, -15.313467025756836, -14.560617446899414, -13.807767868041992, -13.054917335510254, -12.302067756652832, -11.54921817779541, -10.796367645263672, -10.043519020080566, -9.290669441223145, -8.537819862365723, -7.784969806671143, -7.0321197509765625, -6.279270172119141, -5.526420593261719, -4.773570537567139, -4.020720958709717, -3.267871141433716, -2.515021324157715, -1.762171745300293, -1.009321928024292, -0.256472110748291, 0.49637746810913086, 1.249227523803711, 2.002077102661133, 2.754926919937134, 3.5077767372131348, 4.260626316070557, 5.013476371765137, 5.766325950622559, 6.5191755294799805, 7.2720255851745605, 8.02487564086914, 8.777725219726562, 9.530574798583984, 10.283424377441406, 11.036274909973145, 11.789124488830566, 12.541974067687988, 13.294824600219727, 14.047673225402832, 14.800522804260254, 15.553372383117676, 16.306222915649414, 17.059072494506836, 17.811922073364258, 18.56477165222168, 19.3176212310791, 20.070470809936523, 20.823320388793945, 21.576169967651367, 22.32901954650879, 23.08186912536621, 23.834720611572266, 24.587570190429688, 25.34041976928711, 26.09326934814453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 10.0, 5.0, 11.0, 16.0, 14.0, 25.0, 21.0, 35.0, 26.0, 31.0, 28.0, 35.0, 40.0, 34.0, 37.0, 44.0, 50.0, 54.0, 35.0, 40.0, 43.0, 39.0, 36.0, 43.0, 34.0, 27.0, 25.0, 16.0, 18.0, 16.0, 19.0, 17.0, 14.0, 10.0, 5.0, 10.0, 6.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.71651554107666, -13.220603942871094, -12.724691390991211, -12.228779792785645, -11.732868194580078, -11.236956596374512, -10.741044998168945, -10.245132446289062, -9.749220848083496, -9.25330924987793, -8.757396697998047, -8.26148509979248, -7.765573501586914, -7.269661903381348, -6.773749828338623, -6.277837753295898, -5.781926155090332, -5.286014556884766, -4.790102481842041, -4.294190406799316, -3.79827880859375, -3.3023669719696045, -2.806455135345459, -2.3105432987213135, -1.814631462097168, -1.3187196254730225, -0.822807788848877, -0.32689595222473145, 0.16901588439941406, 0.6649277210235596, 1.160839557647705, 1.6567513942718506, 2.1526641845703125, 2.648576021194458, 3.1444878578186035, 3.640399694442749, 4.1363115310668945, 4.632223129272461, 5.1281352043151855, 5.62404727935791, 6.119958877563477, 6.615870475769043, 7.111782550811768, 7.607694625854492, 8.103606224060059, 8.599517822265625, 9.095430374145508, 9.591341972351074, 10.08725357055664, 10.583165168762207, 11.079076766967773, 11.574989318847656, 12.070900917053223, 12.566812515258789, 13.062725067138672, 13.558636665344238, 14.054548263549805, 14.550459861755371, 15.046371459960938, 15.54228401184082, 16.038196563720703, 16.534107208251953, 17.030019760131836, 17.525930404663086, 18.02184295654297]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 6.0, 9.0, 6.0, 9.0, 15.0, 12.0, 22.0, 31.0, 30.0, 36.0, 69.0, 83.0, 143.0, 244.0, 405.0, 763.0, 1562.0, 3470.0, 9715.0, 38949.0, 671496.0, 3387197.0, 59003.0, 12655.0, 4340.0, 1882.0, 883.0, 460.0, 276.0, 181.0, 102.0, 89.0, 38.0, 24.0, 15.0, 16.0, 10.0, 8.0, 7.0, 4.0, 9.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.537109375, -3.436370849609375, -3.33563232421875, -3.234893798828125, -3.1341552734375, -3.033416748046875, -2.93267822265625, -2.831939697265625, -2.731201171875, -2.630462646484375, -2.52972412109375, -2.428985595703125, -2.3282470703125, -2.227508544921875, -2.12677001953125, -2.026031494140625, -1.92529296875, -1.824554443359375, -1.72381591796875, -1.623077392578125, -1.5223388671875, -1.421600341796875, -1.32086181640625, -1.220123291015625, -1.119384765625, -1.018646240234375, -0.91790771484375, -0.817169189453125, -0.7164306640625, -0.615692138671875, -0.51495361328125, -0.414215087890625, -0.3134765625, -0.212738037109375, -0.11199951171875, -0.011260986328125, 0.0894775390625, 0.190216064453125, 0.29095458984375, 0.391693115234375, 0.492431640625, 0.593170166015625, 0.69390869140625, 0.794647216796875, 0.8953857421875, 0.996124267578125, 1.09686279296875, 1.197601318359375, 1.29833984375, 1.399078369140625, 1.49981689453125, 1.600555419921875, 1.7012939453125, 1.802032470703125, 1.90277099609375, 2.003509521484375, 2.104248046875, 2.204986572265625, 2.30572509765625, 2.406463623046875, 2.5072021484375, 2.607940673828125, 2.70867919921875, 2.809417724609375, 2.91015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 9.0, 7.0, 18.0, 10.0, 26.0, 28.0, 43.0, 54.0, 58.0, 80.0, 67.0, 70.0, 82.0, 72.0, 75.0, 64.0, 48.0, 33.0, 44.0, 22.0, 24.0, 10.0, 13.0, 11.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.21484375, -1.1820602416992188, -1.1492767333984375, -1.1164932250976562, -1.083709716796875, -1.0509262084960938, -1.0181427001953125, -0.9853591918945312, -0.95257568359375, -0.9197921752929688, -0.8870086669921875, -0.8542251586914062, -0.821441650390625, -0.7886581420898438, -0.7558746337890625, -0.7230911254882812, -0.6903076171875, -0.6575241088867188, -0.6247406005859375, -0.5919570922851562, -0.559173583984375, -0.5263900756835938, -0.4936065673828125, -0.46082305908203125, -0.42803955078125, -0.39525604248046875, -0.3624725341796875, -0.32968902587890625, -0.296905517578125, -0.26412200927734375, -0.2313385009765625, -0.19855499267578125, -0.165771484375, -0.13298797607421875, -0.1002044677734375, -0.06742095947265625, -0.034637451171875, -0.00185394287109375, 0.0309295654296875, 0.06371307373046875, 0.09649658203125, 0.12928009033203125, 0.1620635986328125, 0.19484710693359375, 0.227630615234375, 0.26041412353515625, 0.2931976318359375, 0.32598114013671875, 0.3587646484375, 0.39154815673828125, 0.4243316650390625, 0.45711517333984375, 0.489898681640625, 0.5226821899414062, 0.5554656982421875, 0.5882492065429688, 0.62103271484375, 0.6538162231445312, 0.6865997314453125, 0.7193832397460938, 0.752166748046875, 0.7849502563476562, 0.8177337646484375, 0.8505172729492188, 0.88330078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 12.0, 6.0, 19.0, 27.0, 53.0, 114.0, 248.0, 672.0, 2218.0, 13409.0, 345962.0, 3788249.0, 37372.0, 4242.0, 1028.0, 356.0, 124.0, 80.0, 40.0, 21.0, 7.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8125, -4.6531982421875, -4.493896484375, -4.3345947265625, -4.17529296875, -4.0159912109375, -3.856689453125, -3.6973876953125, -3.5380859375, -3.3787841796875, -3.219482421875, -3.0601806640625, -2.90087890625, -2.7415771484375, -2.582275390625, -2.4229736328125, -2.263671875, -2.1043701171875, -1.945068359375, -1.7857666015625, -1.62646484375, -1.4671630859375, -1.307861328125, -1.1485595703125, -0.9892578125, -0.8299560546875, -0.670654296875, -0.5113525390625, -0.35205078125, -0.1927490234375, -0.033447265625, 0.1258544921875, 0.28515625, 0.4444580078125, 0.603759765625, 0.7630615234375, 0.92236328125, 1.0816650390625, 1.240966796875, 1.4002685546875, 1.5595703125, 1.7188720703125, 1.878173828125, 2.0374755859375, 2.19677734375, 2.3560791015625, 2.515380859375, 2.6746826171875, 2.833984375, 2.9932861328125, 3.152587890625, 3.3118896484375, 3.47119140625, 3.6304931640625, 3.789794921875, 3.9490966796875, 4.1083984375, 4.2677001953125, 4.427001953125, 4.5863037109375, 4.74560546875, 4.9049072265625, 5.064208984375, 5.2235107421875, 5.3828125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 10.0, 6.0, 21.0, 26.0, 43.0, 86.0, 163.0, 517.0, 2017.0, 734.0, 222.0, 82.0, 64.0, 29.0, 21.0, 11.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.98150634765625, -1.9259033203125, -1.87030029296875, -1.814697265625, -1.75909423828125, -1.7034912109375, -1.64788818359375, -1.59228515625, -1.53668212890625, -1.4810791015625, -1.42547607421875, -1.369873046875, -1.31427001953125, -1.2586669921875, -1.20306396484375, -1.1474609375, -1.09185791015625, -1.0362548828125, -0.98065185546875, -0.925048828125, -0.86944580078125, -0.8138427734375, -0.75823974609375, -0.70263671875, -0.64703369140625, -0.5914306640625, -0.53582763671875, -0.480224609375, -0.42462158203125, -0.3690185546875, -0.31341552734375, -0.2578125, -0.20220947265625, -0.1466064453125, -0.09100341796875, -0.035400390625, 0.02020263671875, 0.0758056640625, 0.13140869140625, 0.18701171875, 0.24261474609375, 0.2982177734375, 0.35382080078125, 0.409423828125, 0.46502685546875, 0.5206298828125, 0.57623291015625, 0.6318359375, 0.68743896484375, 0.7430419921875, 0.79864501953125, 0.854248046875, 0.90985107421875, 0.9654541015625, 1.02105712890625, 1.07666015625, 1.13226318359375, 1.1878662109375, 1.24346923828125, 1.299072265625, 1.35467529296875, 1.4102783203125, 1.46588134765625, 1.521484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 18.0, 574.0, 407.0, 9.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.823486328125, -84.31658172607422, -82.8096694946289, -81.30276489257812, -79.79585266113281, -78.28894805908203, -76.78203582763672, -75.27513122558594, -73.76821899414062, -72.26131439208984, -70.75440216064453, -69.24749755859375, -67.74058532714844, -66.23368072509766, -64.72676849365234, -63.21986389160156, -61.712955474853516, -60.20604705810547, -58.69913864135742, -57.192230224609375, -55.68532180786133, -54.17841339111328, -52.6715087890625, -51.16459655761719, -49.657691955566406, -48.15078353881836, -46.64387512207031, -45.136966705322266, -43.63005828857422, -42.12314987182617, -40.616241455078125, -39.109336853027344, -37.6024284362793, -36.09552001953125, -34.5886116027832, -33.081703186035156, -31.57479476928711, -30.067886352539062, -28.56097984313965, -27.0540714263916, -25.547163009643555, -24.040254592895508, -22.53334617614746, -21.026439666748047, -19.51953125, -18.012622833251953, -16.505714416503906, -14.99880599975586, -13.491897583007812, -11.984989166259766, -10.478080749511719, -8.971173286437988, -7.464264869689941, -5.9573564529418945, -4.450448989868164, -2.943540573120117, -1.4366321563720703, 0.07027602195739746, 1.5771842002868652, 3.084092140197754, 4.591000556945801, 6.097908973693848, 7.604816436767578, 9.111724853515625, 10.618633270263672]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 9.0, 7.0, 11.0, 14.0, 22.0, 28.0, 39.0, 33.0, 52.0, 60.0, 65.0, 57.0, 70.0, 65.0, 80.0, 63.0, 62.0, 36.0, 49.0, 26.0, 36.0, 24.0, 17.0, 24.0, 12.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.981032848358154, -5.809842586517334, -5.638652324676514, -5.467462062835693, -5.296271800994873, -5.125082015991211, -4.953891754150391, -4.78270149230957, -4.61151123046875, -4.44032096862793, -4.269130706787109, -4.097940444946289, -3.926750421524048, -3.7555601596832275, -3.5843698978424072, -3.413179874420166, -3.2419893741607666, -3.0707991123199463, -2.899608850479126, -2.7284188270568848, -2.5572285652160645, -2.386038303375244, -2.214848041534424, -2.0436577796936035, -1.8724676370620728, -1.7012773752212524, -1.5300872325897217, -1.3588969707489014, -1.187706708908081, -1.0165165662765503, -0.84532630443573, -0.6741361618041992, -0.5029458999633789, -0.33175569772720337, -0.16056546568870544, 0.01062476634979248, 0.18181496858596802, 0.35300517082214355, 0.5241954326629639, 0.6953855752944946, 0.8665758371353149, 1.0377660989761353, 1.208956241607666, 1.3801465034484863, 1.5513367652893066, 1.7225269079208374, 1.8937171697616577, 2.0649073123931885, 2.236097574234009, 2.407287836074829, 2.5784780979156494, 2.7496681213378906, 2.920858383178711, 3.0920486450195312, 3.2632389068603516, 3.434429168701172, 3.605619430541992, 3.7768096923828125, 3.947999954223633, 4.119190216064453, 4.290380477905273, 4.461570739746094, 4.632761001586914, 4.803950786590576, 4.9751410484313965]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 2.0, 7.0, 7.0, 8.0, 11.0, 12.0, 19.0, 28.0, 29.0, 47.0, 72.0, 86.0, 129.0, 204.0, 277.0, 451.0, 858.0, 1653.0, 3603.0, 8975.0, 27559.0, 129690.0, 662432.0, 161923.0, 32332.0, 9860.0, 3929.0, 1850.0, 941.0, 542.0, 317.0, 226.0, 123.0, 104.0, 61.0, 60.0, 40.0, 22.0, 17.0, 15.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.05078125, -3.933563232421875, -3.81634521484375, -3.699127197265625, -3.5819091796875, -3.464691162109375, -3.34747314453125, -3.230255126953125, -3.113037109375, -2.995819091796875, -2.87860107421875, -2.761383056640625, -2.6441650390625, -2.526947021484375, -2.40972900390625, -2.292510986328125, -2.17529296875, -2.058074951171875, -1.94085693359375, -1.823638916015625, -1.7064208984375, -1.589202880859375, -1.47198486328125, -1.354766845703125, -1.237548828125, -1.120330810546875, -1.00311279296875, -0.885894775390625, -0.7686767578125, -0.651458740234375, -0.53424072265625, -0.417022705078125, -0.2998046875, -0.182586669921875, -0.06536865234375, 0.051849365234375, 0.1690673828125, 0.286285400390625, 0.40350341796875, 0.520721435546875, 0.637939453125, 0.755157470703125, 0.87237548828125, 0.989593505859375, 1.1068115234375, 1.224029541015625, 1.34124755859375, 1.458465576171875, 1.57568359375, 1.692901611328125, 1.81011962890625, 1.927337646484375, 2.0445556640625, 2.161773681640625, 2.27899169921875, 2.396209716796875, 2.513427734375, 2.630645751953125, 2.74786376953125, 2.865081787109375, 2.9822998046875, 3.099517822265625, 3.21673583984375, 3.333953857421875, 3.451171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 3.0, 5.0, 15.0, 14.0, 16.0, 14.0, 36.0, 44.0, 48.0, 62.0, 66.0, 73.0, 83.0, 71.0, 85.0, 81.0, 53.0, 50.0, 32.0, 36.0, 27.0, 19.0, 12.0, 16.0, 9.0, 6.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2236328125, -1.1905746459960938, -1.1575164794921875, -1.1244583129882812, -1.091400146484375, -1.0583419799804688, -1.0252838134765625, -0.9922256469726562, -0.95916748046875, -0.9261093139648438, -0.8930511474609375, -0.8599929809570312, -0.826934814453125, -0.7938766479492188, -0.7608184814453125, -0.7277603149414062, -0.6947021484375, -0.6616439819335938, -0.6285858154296875, -0.5955276489257812, -0.562469482421875, -0.5294113159179688, -0.4963531494140625, -0.46329498291015625, -0.43023681640625, -0.39717864990234375, -0.3641204833984375, -0.33106231689453125, -0.298004150390625, -0.26494598388671875, -0.2318878173828125, -0.19882965087890625, -0.165771484375, -0.13271331787109375, -0.0996551513671875, -0.06659698486328125, -0.033538818359375, -0.00048065185546875, 0.0325775146484375, 0.06563568115234375, 0.09869384765625, 0.13175201416015625, 0.1648101806640625, 0.19786834716796875, 0.230926513671875, 0.26398468017578125, 0.2970428466796875, 0.33010101318359375, 0.3631591796875, 0.39621734619140625, 0.4292755126953125, 0.46233367919921875, 0.495391845703125, 0.5284500122070312, 0.5615081787109375, 0.5945663452148438, 0.62762451171875, 0.6606826782226562, 0.6937408447265625, 0.7267990112304688, 0.759857177734375, 0.7929153442382812, 0.8259735107421875, 0.8590316772460938, 0.89208984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 0.0, 4.0, 6.0, 11.0, 11.0, 16.0, 14.0, 27.0, 51.0, 56.0, 73.0, 122.0, 164.0, 248.0, 384.0, 660.0, 1215.0, 2537.0, 5994.0, 17798.0, 64206.0, 349383.0, 481042.0, 87585.0, 22884.0, 7644.0, 2953.0, 1399.0, 724.0, 447.0, 271.0, 173.0, 117.0, 85.0, 55.0, 46.0, 31.0, 35.0, 19.0, 12.0, 14.0, 9.0, 7.0, 10.0, 3.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0], "bins": [-3.005859375, -2.92022705078125, -2.8345947265625, -2.74896240234375, -2.663330078125, -2.57769775390625, -2.4920654296875, -2.40643310546875, -2.32080078125, -2.23516845703125, -2.1495361328125, -2.06390380859375, -1.978271484375, -1.89263916015625, -1.8070068359375, -1.72137451171875, -1.6357421875, -1.55010986328125, -1.4644775390625, -1.37884521484375, -1.293212890625, -1.20758056640625, -1.1219482421875, -1.03631591796875, -0.95068359375, -0.86505126953125, -0.7794189453125, -0.69378662109375, -0.608154296875, -0.52252197265625, -0.4368896484375, -0.35125732421875, -0.265625, -0.17999267578125, -0.0943603515625, -0.00872802734375, 0.076904296875, 0.16253662109375, 0.2481689453125, 0.33380126953125, 0.41943359375, 0.50506591796875, 0.5906982421875, 0.67633056640625, 0.761962890625, 0.84759521484375, 0.9332275390625, 1.01885986328125, 1.1044921875, 1.19012451171875, 1.2757568359375, 1.36138916015625, 1.447021484375, 1.53265380859375, 1.6182861328125, 1.70391845703125, 1.78955078125, 1.87518310546875, 1.9608154296875, 2.04644775390625, 2.132080078125, 2.21771240234375, 2.3033447265625, 2.38897705078125, 2.474609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 4.0, 3.0, 12.0, 11.0, 11.0, 20.0, 8.0, 18.0, 32.0, 27.0, 29.0, 31.0, 32.0, 34.0, 37.0, 37.0, 52.0, 37.0, 36.0, 40.0, 34.0, 38.0, 41.0, 32.0, 34.0, 37.0, 39.0, 30.0, 24.0, 18.0, 23.0, 23.0, 17.0, 16.0, 18.0, 6.0, 11.0, 10.0, 4.0, 6.0, 4.0, 3.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.541015625, -2.457489013671875, -2.37396240234375, -2.290435791015625, -2.2069091796875, -2.123382568359375, -2.03985595703125, -1.956329345703125, -1.872802734375, -1.789276123046875, -1.70574951171875, -1.622222900390625, -1.5386962890625, -1.455169677734375, -1.37164306640625, -1.288116455078125, -1.20458984375, -1.121063232421875, -1.03753662109375, -0.954010009765625, -0.8704833984375, -0.786956787109375, -0.70343017578125, -0.619903564453125, -0.536376953125, -0.452850341796875, -0.36932373046875, -0.285797119140625, -0.2022705078125, -0.118743896484375, -0.03521728515625, 0.048309326171875, 0.1318359375, 0.215362548828125, 0.29888916015625, 0.382415771484375, 0.4659423828125, 0.549468994140625, 0.63299560546875, 0.716522216796875, 0.800048828125, 0.883575439453125, 0.96710205078125, 1.050628662109375, 1.1341552734375, 1.217681884765625, 1.30120849609375, 1.384735107421875, 1.46826171875, 1.551788330078125, 1.63531494140625, 1.718841552734375, 1.8023681640625, 1.885894775390625, 1.96942138671875, 2.052947998046875, 2.136474609375, 2.220001220703125, 2.30352783203125, 2.387054443359375, 2.4705810546875, 2.554107666015625, 2.63763427734375, 2.721160888671875, 2.8046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 18.0, 15.0, 20.0, 38.0, 72.0, 144.0, 275.0, 609.0, 1814.0, 8160.0, 75054.0, 851853.0, 97552.0, 9515.0, 2019.0, 680.0, 323.0, 148.0, 102.0, 40.0, 31.0, 19.0, 9.0, 8.0, 7.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4677734375, -1.41448974609375, -1.3612060546875, -1.30792236328125, -1.254638671875, -1.20135498046875, -1.1480712890625, -1.09478759765625, -1.04150390625, -0.98822021484375, -0.9349365234375, -0.88165283203125, -0.828369140625, -0.77508544921875, -0.7218017578125, -0.66851806640625, -0.615234375, -0.56195068359375, -0.5086669921875, -0.45538330078125, -0.402099609375, -0.34881591796875, -0.2955322265625, -0.24224853515625, -0.18896484375, -0.13568115234375, -0.0823974609375, -0.02911376953125, 0.024169921875, 0.07745361328125, 0.1307373046875, 0.18402099609375, 0.2373046875, 0.29058837890625, 0.3438720703125, 0.39715576171875, 0.450439453125, 0.50372314453125, 0.5570068359375, 0.61029052734375, 0.66357421875, 0.71685791015625, 0.7701416015625, 0.82342529296875, 0.876708984375, 0.92999267578125, 0.9832763671875, 1.03656005859375, 1.08984375, 1.14312744140625, 1.1964111328125, 1.24969482421875, 1.302978515625, 1.35626220703125, 1.4095458984375, 1.46282958984375, 1.51611328125, 1.56939697265625, 1.6226806640625, 1.67596435546875, 1.729248046875, 1.78253173828125, 1.8358154296875, 1.88909912109375, 1.9423828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 5.0, 6.0, 2.0, 11.0, 8.0, 9.0, 16.0, 17.0, 34.0, 53.0, 57.0, 101.0, 144.0, 171.0, 121.0, 74.0, 43.0, 37.0, 18.0, 15.0, 11.0, 10.0, 6.0, 7.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002048015594482422, -0.00019959546625614166, -0.00019438937306404114, -0.0001891832798719406, -0.0001839771866798401, -0.00017877109348773956, -0.00017356500029563904, -0.0001683589071035385, -0.000163152813911438, -0.00015794672071933746, -0.00015274062752723694, -0.00014753453433513641, -0.0001423284411430359, -0.00013712234795093536, -0.00013191625475883484, -0.00012671016156673431, -0.00012150406837463379, -0.00011629797518253326, -0.00011109188199043274, -0.00010588578879833221, -0.00010067969560623169, -9.547360241413116e-05, -9.026750922203064e-05, -8.506141602993011e-05, -7.985532283782959e-05, -7.464922964572906e-05, -6.944313645362854e-05, -6.423704326152802e-05, -5.903095006942749e-05, -5.3824856877326965e-05, -4.861876368522644e-05, -4.3412670493125916e-05, -3.820657730102539e-05, -3.3000484108924866e-05, -2.779439091682434e-05, -2.2588297724723816e-05, -1.738220453262329e-05, -1.2176111340522766e-05, -6.970018148422241e-06, -1.7639249563217163e-06, 3.4421682357788086e-06, 8.648261427879333e-06, 1.3854354619979858e-05, 1.9060447812080383e-05, 2.4266541004180908e-05, 2.9472634196281433e-05, 3.467872738838196e-05, 3.988482058048248e-05, 4.509091377258301e-05, 5.029700696468353e-05, 5.550310015678406e-05, 6.070919334888458e-05, 6.591528654098511e-05, 7.112137973308563e-05, 7.632747292518616e-05, 8.153356611728668e-05, 8.673965930938721e-05, 9.194575250148773e-05, 9.715184569358826e-05, 0.00010235793888568878, 0.0001075640320777893, 0.00011277012526988983, 0.00011797621846199036, 0.00012318231165409088, 0.0001283884048461914]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 7.0, 11.0, 33.0, 52.0, 123.0, 244.0, 1035.0, 6589.0, 149965.0, 868278.0, 19436.0, 2031.0, 426.0, 169.0, 66.0, 28.0, 16.0, 12.0, 7.0, 2.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.06695556640625, -1.9815673828125, -1.89617919921875, -1.810791015625, -1.72540283203125, -1.6400146484375, -1.55462646484375, -1.46923828125, -1.38385009765625, -1.2984619140625, -1.21307373046875, -1.127685546875, -1.04229736328125, -0.9569091796875, -0.87152099609375, -0.7861328125, -0.70074462890625, -0.6153564453125, -0.52996826171875, -0.444580078125, -0.35919189453125, -0.2738037109375, -0.18841552734375, -0.10302734375, -0.01763916015625, 0.0677490234375, 0.15313720703125, 0.238525390625, 0.32391357421875, 0.4093017578125, 0.49468994140625, 0.580078125, 0.66546630859375, 0.7508544921875, 0.83624267578125, 0.921630859375, 1.00701904296875, 1.0924072265625, 1.17779541015625, 1.26318359375, 1.34857177734375, 1.4339599609375, 1.51934814453125, 1.604736328125, 1.69012451171875, 1.7755126953125, 1.86090087890625, 1.9462890625, 2.03167724609375, 2.1170654296875, 2.20245361328125, 2.287841796875, 2.37322998046875, 2.4586181640625, 2.54400634765625, 2.62939453125, 2.71478271484375, 2.8001708984375, 2.88555908203125, 2.970947265625, 3.05633544921875, 3.1417236328125, 3.22711181640625, 3.3125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 5.0, 3.0, 3.0, 4.0, 4.0, 7.0, 15.0, 8.0, 22.0, 17.0, 15.0, 19.0, 40.0, 72.0, 82.0, 117.0, 140.0, 104.0, 87.0, 46.0, 39.0, 33.0, 28.0, 15.0, 12.0, 10.0, 10.0, 8.0, 6.0, 2.0, 6.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8515625, -0.819366455078125, -0.78717041015625, -0.754974365234375, -0.7227783203125, -0.690582275390625, -0.65838623046875, -0.626190185546875, -0.593994140625, -0.561798095703125, -0.52960205078125, -0.497406005859375, -0.4652099609375, -0.433013916015625, -0.40081787109375, -0.368621826171875, -0.33642578125, -0.304229736328125, -0.27203369140625, -0.239837646484375, -0.2076416015625, -0.175445556640625, -0.14324951171875, -0.111053466796875, -0.078857421875, -0.046661376953125, -0.01446533203125, 0.017730712890625, 0.0499267578125, 0.082122802734375, 0.11431884765625, 0.146514892578125, 0.1787109375, 0.210906982421875, 0.24310302734375, 0.275299072265625, 0.3074951171875, 0.339691162109375, 0.37188720703125, 0.404083251953125, 0.436279296875, 0.468475341796875, 0.50067138671875, 0.532867431640625, 0.5650634765625, 0.597259521484375, 0.62945556640625, 0.661651611328125, 0.69384765625, 0.726043701171875, 0.75823974609375, 0.790435791015625, 0.8226318359375, 0.854827880859375, 0.88702392578125, 0.919219970703125, 0.951416015625, 0.983612060546875, 1.01580810546875, 1.048004150390625, 1.0802001953125, 1.112396240234375, 1.14459228515625, 1.176788330078125, 1.208984375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 105.0, 739.0, 157.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-193.56809997558594, -190.08590698242188, -186.6037139892578, -183.1215362548828, -179.63934326171875, -176.1571502685547, -172.67495727539062, -169.19277954101562, -165.71058654785156, -162.2283935546875, -158.74620056152344, -155.26402282714844, -151.78182983398438, -148.2996368408203, -144.81744384765625, -141.33526611328125, -137.85305786132812, -134.37086486816406, -130.888671875, -127.40648651123047, -123.92430114746094, -120.44210815429688, -116.95991516113281, -113.47772979736328, -109.99554443359375, -106.51335144042969, -103.03116607666016, -99.5489730834961, -96.06678771972656, -92.5845947265625, -89.10240173339844, -85.6202163696289, -82.13803100585938, -78.65583801269531, -75.17365264892578, -71.69145965576172, -68.20927429199219, -64.72708129882812, -61.24489212036133, -57.76270294189453, -54.280513763427734, -50.79832458496094, -47.31613540649414, -43.833946228027344, -40.35175323486328, -36.86956787109375, -33.38737487792969, -29.90518569946289, -26.422996520996094, -22.940807342529297, -19.4586181640625, -15.97642707824707, -12.494237899780273, -9.012048721313477, -5.529857635498047, -2.04766845703125, 1.4345207214355469, 4.916710376739502, 8.398900032043457, 11.88109016418457, 15.363279342651367, 18.845468521118164, 22.327659606933594, 25.80984878540039, 29.292037963867188]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 6.0, 4.0, 6.0, 9.0, 12.0, 9.0, 17.0, 15.0, 26.0, 31.0, 41.0, 33.0, 34.0, 46.0, 32.0, 33.0, 51.0, 51.0, 33.0, 36.0, 34.0, 45.0, 44.0, 41.0, 43.0, 42.0, 29.0, 43.0, 31.0, 24.0, 19.0, 13.0, 12.0, 10.0, 8.0, 9.0, 10.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.28242301940918, -15.79780101776123, -15.313179016113281, -14.828557014465332, -14.343935012817383, -13.859313011169434, -13.374691009521484, -12.890069007873535, -12.405447006225586, -11.920825004577637, -11.436203002929688, -10.951581001281738, -10.466958999633789, -9.98233699798584, -9.49771499633789, -9.013092994689941, -8.528470993041992, -8.043848991394043, -7.559226989746094, -7.0746049880981445, -6.589982986450195, -6.105360984802246, -5.620738983154297, -5.136116981506348, -4.651494979858398, -4.166872978210449, -3.6822509765625, -3.197628974914551, -2.7130069732666016, -2.2283849716186523, -1.7437629699707031, -1.259140968322754, -0.7745189666748047, -0.28989696502685547, 0.19472503662109375, 0.679347038269043, 1.1639690399169922, 1.6485910415649414, 2.1332130432128906, 2.61783504486084, 3.102457046508789, 3.5870790481567383, 4.0717010498046875, 4.556323051452637, 5.040945053100586, 5.525567054748535, 6.010189056396484, 6.494811058044434, 6.979433059692383, 7.464055061340332, 7.948677062988281, 8.43329906463623, 8.91792106628418, 9.402543067932129, 9.887165069580078, 10.371787071228027, 10.856409072875977, 11.341031074523926, 11.825653076171875, 12.310275077819824, 12.794897079467773, 13.279519081115723, 13.764141082763672, 14.248763084411621, 14.73338508605957]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 6.0, 13.0, 8.0, 9.0, 15.0, 18.0, 19.0, 32.0, 52.0, 77.0, 95.0, 203.0, 305.0, 672.0, 1369.0, 3233.0, 9966.0, 47879.0, 3569763.0, 516230.0, 31449.0, 7596.0, 2767.0, 1184.0, 558.0, 305.0, 169.0, 80.0, 73.0, 41.0, 24.0, 19.0, 22.0, 12.0, 2.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.21240234375, -3.1083984375, -3.00439453125, -2.900390625, -2.79638671875, -2.6923828125, -2.58837890625, -2.484375, -2.38037109375, -2.2763671875, -2.17236328125, -2.068359375, -1.96435546875, -1.8603515625, -1.75634765625, -1.65234375, -1.54833984375, -1.4443359375, -1.34033203125, -1.236328125, -1.13232421875, -1.0283203125, -0.92431640625, -0.8203125, -0.71630859375, -0.6123046875, -0.50830078125, -0.404296875, -0.30029296875, -0.1962890625, -0.09228515625, 0.01171875, 0.11572265625, 0.2197265625, 0.32373046875, 0.427734375, 0.53173828125, 0.6357421875, 0.73974609375, 0.84375, 0.94775390625, 1.0517578125, 1.15576171875, 1.259765625, 1.36376953125, 1.4677734375, 1.57177734375, 1.67578125, 1.77978515625, 1.8837890625, 1.98779296875, 2.091796875, 2.19580078125, 2.2998046875, 2.40380859375, 2.5078125, 2.61181640625, 2.7158203125, 2.81982421875, 2.923828125, 3.02783203125, 3.1318359375, 3.23583984375, 3.33984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 11.0, 11.0, 24.0, 23.0, 25.0, 52.0, 52.0, 54.0, 70.0, 68.0, 82.0, 81.0, 75.0, 64.0, 66.0, 42.0, 47.0, 33.0, 23.0, 28.0, 11.0, 11.0, 9.0, 8.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3234939575195312, -1.2866363525390625, -1.2497787475585938, -1.212921142578125, -1.1760635375976562, -1.1392059326171875, -1.1023483276367188, -1.06549072265625, -1.0286331176757812, -0.9917755126953125, -0.9549179077148438, -0.918060302734375, -0.8812026977539062, -0.8443450927734375, -0.8074874877929688, -0.7706298828125, -0.7337722778320312, -0.6969146728515625, -0.6600570678710938, -0.623199462890625, -0.5863418579101562, -0.5494842529296875, -0.5126266479492188, -0.47576904296875, -0.43891143798828125, -0.4020538330078125, -0.36519622802734375, -0.328338623046875, -0.29148101806640625, -0.2546234130859375, -0.21776580810546875, -0.180908203125, -0.14405059814453125, -0.1071929931640625, -0.07033538818359375, -0.033477783203125, 0.00337982177734375, 0.0402374267578125, 0.07709503173828125, 0.11395263671875, 0.15081024169921875, 0.1876678466796875, 0.22452545166015625, 0.261383056640625, 0.29824066162109375, 0.3350982666015625, 0.37195587158203125, 0.4088134765625, 0.44567108154296875, 0.4825286865234375, 0.5193862915039062, 0.556243896484375, 0.5931015014648438, 0.6299591064453125, 0.6668167114257812, 0.70367431640625, 0.7405319213867188, 0.7773895263671875, 0.8142471313476562, 0.851104736328125, 0.8879623413085938, 0.9248199462890625, 0.9616775512695312, 0.99853515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 16.0, 25.0, 48.0, 59.0, 106.0, 224.0, 581.0, 2359.0, 16270.0, 1309433.0, 2844499.0, 17278.0, 2365.0, 568.0, 207.0, 100.0, 54.0, 30.0, 18.0, 11.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -3.9637451171875, -3.775146484375, -3.5865478515625, -3.39794921875, -3.2093505859375, -3.020751953125, -2.8321533203125, -2.6435546875, -2.4549560546875, -2.266357421875, -2.0777587890625, -1.88916015625, -1.7005615234375, -1.511962890625, -1.3233642578125, -1.134765625, -0.9461669921875, -0.757568359375, -0.5689697265625, -0.38037109375, -0.1917724609375, -0.003173828125, 0.1854248046875, 0.3740234375, 0.5626220703125, 0.751220703125, 0.9398193359375, 1.12841796875, 1.3170166015625, 1.505615234375, 1.6942138671875, 1.8828125, 2.0714111328125, 2.260009765625, 2.4486083984375, 2.63720703125, 2.8258056640625, 3.014404296875, 3.2030029296875, 3.3916015625, 3.5802001953125, 3.768798828125, 3.9573974609375, 4.14599609375, 4.3345947265625, 4.523193359375, 4.7117919921875, 4.900390625, 5.0889892578125, 5.277587890625, 5.4661865234375, 5.65478515625, 5.8433837890625, 6.031982421875, 6.2205810546875, 6.4091796875, 6.5977783203125, 6.786376953125, 6.9749755859375, 7.16357421875, 7.3521728515625, 7.540771484375, 7.7293701171875, 7.91796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 14.0, 13.0, 25.0, 34.0, 88.0, 219.0, 1616.0, 1696.0, 203.0, 74.0, 41.0, 21.0, 13.0, 5.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.591796875, -2.527008056640625, -2.46221923828125, -2.397430419921875, -2.3326416015625, -2.267852783203125, -2.20306396484375, -2.138275146484375, -2.073486328125, -2.008697509765625, -1.94390869140625, -1.879119873046875, -1.8143310546875, -1.749542236328125, -1.68475341796875, -1.619964599609375, -1.55517578125, -1.490386962890625, -1.42559814453125, -1.360809326171875, -1.2960205078125, -1.231231689453125, -1.16644287109375, -1.101654052734375, -1.036865234375, -0.972076416015625, -0.90728759765625, -0.842498779296875, -0.7777099609375, -0.712921142578125, -0.64813232421875, -0.583343505859375, -0.5185546875, -0.453765869140625, -0.38897705078125, -0.324188232421875, -0.2593994140625, -0.194610595703125, -0.12982177734375, -0.065032958984375, -0.000244140625, 0.064544677734375, 0.12933349609375, 0.194122314453125, 0.2589111328125, 0.323699951171875, 0.38848876953125, 0.453277587890625, 0.51806640625, 0.582855224609375, 0.64764404296875, 0.712432861328125, 0.7772216796875, 0.842010498046875, 0.90679931640625, 0.971588134765625, 1.036376953125, 1.101165771484375, 1.16595458984375, 1.230743408203125, 1.2955322265625, 1.360321044921875, 1.42510986328125, 1.489898681640625, 1.5546875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 13.0, 43.0, 111.0, 236.0, 305.0, 183.0, 73.0, 18.0, 10.0, 3.0, 2.0, 1.0, 3.0], "bins": [-21.966527938842773, -21.569799423217773, -21.173070907592773, -20.776342391967773, -20.379613876342773, -19.98288345336914, -19.58615493774414, -19.18942642211914, -18.79269790649414, -18.39596939086914, -17.99924087524414, -17.60251235961914, -17.20578384399414, -16.809053421020508, -16.412324905395508, -16.015596389770508, -15.618867874145508, -15.222139358520508, -14.825410842895508, -14.428681373596191, -14.031952857971191, -13.635224342346191, -13.238495826721191, -12.841766357421875, -12.445038795471191, -12.048310279846191, -11.651581764221191, -11.254852294921875, -10.858123779296875, -10.461395263671875, -10.064666748046875, -9.667938232421875, -9.271209716796875, -8.874481201171875, -8.477752685546875, -8.081023216247559, -7.684294700622559, -7.287566184997559, -6.890837669372559, -6.4941086769104, -6.097379684448242, -5.700651168823242, -5.303922176361084, -4.907193660736084, -4.510464668273926, -4.113736152648926, -3.7170073986053467, -3.3202786445617676, -2.9235496520996094, -2.5268208980560303, -2.130092144012451, -1.7333635091781616, -1.3366347551345825, -0.9399060010910034, -0.5431773662567139, -0.14644861221313477, 0.25028014183044434, 0.6470088958740234, 1.0437376499176025, 1.440466284751892, 1.8371950387954712, 2.23392391204834, 2.63065242767334, 3.027381181716919, 3.424109935760498]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 13.0, 6.0, 14.0, 15.0, 27.0, 24.0, 32.0, 32.0, 44.0, 41.0, 50.0, 36.0, 66.0, 46.0, 54.0, 40.0, 40.0, 59.0, 36.0, 45.0, 27.0, 30.0, 29.0, 28.0, 29.0, 17.0, 24.0, 19.0, 8.0, 9.0, 9.0, 7.0, 4.0, 7.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.06730842590332, -3.9501895904541016, -3.833070755004883, -3.715952157974243, -3.5988333225250244, -3.4817144870758057, -3.364595890045166, -3.2474770545959473, -3.1303582191467285, -3.0132393836975098, -2.896120548248291, -2.7790019512176514, -2.6618831157684326, -2.544764280319214, -2.427645683288574, -2.3105268478393555, -2.1934080123901367, -2.076289176940918, -1.9591704607009888, -1.8420517444610596, -1.7249329090118408, -1.607814073562622, -1.4906953573226929, -1.3735766410827637, -1.256457805633545, -1.1393389701843262, -1.022220253944397, -0.905101478099823, -0.787982702255249, -0.670863926410675, -0.5537451505661011, -0.4366263747215271, -0.3195078372955322, -0.20238906145095825, -0.08527028560638428, 0.0318484902381897, 0.14896726608276367, 0.26608604192733765, 0.3832048177719116, 0.5003235936164856, 0.6174423694610596, 0.7345611453056335, 0.8516799211502075, 0.9687986969947815, 1.0859174728393555, 1.2030363082885742, 1.3201550245285034, 1.4372737407684326, 1.5543925762176514, 1.6715114116668701, 1.7886301279067993, 1.9057488441467285, 2.0228676795959473, 2.139986515045166, 2.2571053504943848, 2.3742239475250244, 2.491342782974243, 2.608461618423462, 2.7255802154541016, 2.8426990509033203, 2.959817886352539, 3.076936721801758, 3.1940555572509766, 3.311174154281616, 3.428292989730835]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 13.0, 17.0, 25.0, 32.0, 60.0, 72.0, 123.0, 159.0, 284.0, 484.0, 1003.0, 2137.0, 6409.0, 25381.0, 151599.0, 675845.0, 149219.0, 25035.0, 6271.0, 2128.0, 967.0, 510.0, 257.0, 175.0, 114.0, 94.0, 40.0, 25.0, 22.0, 14.0, 6.0, 8.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.484375, -4.34637451171875, -4.2083740234375, -4.07037353515625, -3.932373046875, -3.79437255859375, -3.6563720703125, -3.51837158203125, -3.38037109375, -3.24237060546875, -3.1043701171875, -2.96636962890625, -2.828369140625, -2.69036865234375, -2.5523681640625, -2.41436767578125, -2.2763671875, -2.13836669921875, -2.0003662109375, -1.86236572265625, -1.724365234375, -1.58636474609375, -1.4483642578125, -1.31036376953125, -1.17236328125, -1.03436279296875, -0.8963623046875, -0.75836181640625, -0.620361328125, -0.48236083984375, -0.3443603515625, -0.20635986328125, -0.068359375, 0.06964111328125, 0.2076416015625, 0.34564208984375, 0.483642578125, 0.62164306640625, 0.7596435546875, 0.89764404296875, 1.03564453125, 1.17364501953125, 1.3116455078125, 1.44964599609375, 1.587646484375, 1.72564697265625, 1.8636474609375, 2.00164794921875, 2.1396484375, 2.27764892578125, 2.4156494140625, 2.55364990234375, 2.691650390625, 2.82965087890625, 2.9676513671875, 3.10565185546875, 3.24365234375, 3.38165283203125, 3.5196533203125, 3.65765380859375, 3.795654296875, 3.93365478515625, 4.0716552734375, 4.20965576171875, 4.34765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 9.0, 10.0, 16.0, 26.0, 25.0, 38.0, 38.0, 51.0, 60.0, 66.0, 64.0, 84.0, 97.0, 63.0, 59.0, 68.0, 57.0, 43.0, 25.0, 23.0, 15.0, 18.0, 11.0, 6.0, 7.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.349609375, -1.311859130859375, -1.27410888671875, -1.236358642578125, -1.1986083984375, -1.160858154296875, -1.12310791015625, -1.085357666015625, -1.047607421875, -1.009857177734375, -0.97210693359375, -0.934356689453125, -0.8966064453125, -0.858856201171875, -0.82110595703125, -0.783355712890625, -0.74560546875, -0.707855224609375, -0.67010498046875, -0.632354736328125, -0.5946044921875, -0.556854248046875, -0.51910400390625, -0.481353759765625, -0.443603515625, -0.405853271484375, -0.36810302734375, -0.330352783203125, -0.2926025390625, -0.254852294921875, -0.21710205078125, -0.179351806640625, -0.1416015625, -0.103851318359375, -0.06610107421875, -0.028350830078125, 0.0093994140625, 0.047149658203125, 0.08489990234375, 0.122650146484375, 0.160400390625, 0.198150634765625, 0.23590087890625, 0.273651123046875, 0.3114013671875, 0.349151611328125, 0.38690185546875, 0.424652099609375, 0.46240234375, 0.500152587890625, 0.53790283203125, 0.575653076171875, 0.6134033203125, 0.651153564453125, 0.68890380859375, 0.726654052734375, 0.764404296875, 0.802154541015625, 0.83990478515625, 0.877655029296875, 0.9154052734375, 0.953155517578125, 0.99090576171875, 1.028656005859375, 1.06640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 7.0, 9.0, 12.0, 11.0, 21.0, 23.0, 39.0, 42.0, 64.0, 109.0, 162.0, 224.0, 440.0, 892.0, 1986.0, 5381.0, 17006.0, 70601.0, 478360.0, 389609.0, 60125.0, 14945.0, 4709.0, 1802.0, 811.0, 446.0, 264.0, 135.0, 92.0, 65.0, 39.0, 36.0, 26.0, 17.0, 6.0, 8.0, 12.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.5625, -3.45098876953125, -3.3394775390625, -3.22796630859375, -3.116455078125, -3.00494384765625, -2.8934326171875, -2.78192138671875, -2.67041015625, -2.55889892578125, -2.4473876953125, -2.33587646484375, -2.224365234375, -2.11285400390625, -2.0013427734375, -1.88983154296875, -1.7783203125, -1.66680908203125, -1.5552978515625, -1.44378662109375, -1.332275390625, -1.22076416015625, -1.1092529296875, -0.99774169921875, -0.88623046875, -0.77471923828125, -0.6632080078125, -0.55169677734375, -0.440185546875, -0.32867431640625, -0.2171630859375, -0.10565185546875, 0.005859375, 0.11737060546875, 0.2288818359375, 0.34039306640625, 0.451904296875, 0.56341552734375, 0.6749267578125, 0.78643798828125, 0.89794921875, 1.00946044921875, 1.1209716796875, 1.23248291015625, 1.343994140625, 1.45550537109375, 1.5670166015625, 1.67852783203125, 1.7900390625, 1.90155029296875, 2.0130615234375, 2.12457275390625, 2.236083984375, 2.34759521484375, 2.4591064453125, 2.57061767578125, 2.68212890625, 2.79364013671875, 2.9051513671875, 3.01666259765625, 3.128173828125, 3.23968505859375, 3.3511962890625, 3.46270751953125, 3.57421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 11.0, 9.0, 8.0, 10.0, 12.0, 16.0, 17.0, 21.0, 18.0, 13.0, 25.0, 29.0, 36.0, 51.0, 43.0, 54.0, 60.0, 42.0, 49.0, 36.0, 34.0, 48.0, 47.0, 39.0, 36.0, 47.0, 24.0, 21.0, 21.0, 14.0, 20.0, 13.0, 22.0, 11.0, 10.0, 8.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.9207763671875, -2.820068359375, -2.7193603515625, -2.61865234375, -2.5179443359375, -2.417236328125, -2.3165283203125, -2.2158203125, -2.1151123046875, -2.014404296875, -1.9136962890625, -1.81298828125, -1.7122802734375, -1.611572265625, -1.5108642578125, -1.41015625, -1.3094482421875, -1.208740234375, -1.1080322265625, -1.00732421875, -0.9066162109375, -0.805908203125, -0.7052001953125, -0.6044921875, -0.5037841796875, -0.403076171875, -0.3023681640625, -0.20166015625, -0.1009521484375, -0.000244140625, 0.1004638671875, 0.201171875, 0.3018798828125, 0.402587890625, 0.5032958984375, 0.60400390625, 0.7047119140625, 0.805419921875, 0.9061279296875, 1.0068359375, 1.1075439453125, 1.208251953125, 1.3089599609375, 1.40966796875, 1.5103759765625, 1.611083984375, 1.7117919921875, 1.8125, 1.9132080078125, 2.013916015625, 2.1146240234375, 2.21533203125, 2.3160400390625, 2.416748046875, 2.5174560546875, 2.6181640625, 2.7188720703125, 2.819580078125, 2.9202880859375, 3.02099609375, 3.1217041015625, 3.222412109375, 3.3231201171875, 3.423828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 12.0, 19.0, 30.0, 51.0, 122.0, 266.0, 772.0, 3127.0, 24526.0, 743335.0, 261891.0, 11425.0, 1994.0, 578.0, 200.0, 78.0, 54.0, 20.0, 14.0, 7.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7607421875, -1.7036590576171875, -1.646575927734375, -1.5894927978515625, -1.53240966796875, -1.4753265380859375, -1.418243408203125, -1.3611602783203125, -1.3040771484375, -1.2469940185546875, -1.189910888671875, -1.1328277587890625, -1.07574462890625, -1.0186614990234375, -0.961578369140625, -0.9044952392578125, -0.847412109375, -0.7903289794921875, -0.733245849609375, -0.6761627197265625, -0.61907958984375, -0.5619964599609375, -0.504913330078125, -0.4478302001953125, -0.3907470703125, -0.3336639404296875, -0.276580810546875, -0.2194976806640625, -0.16241455078125, -0.1053314208984375, -0.048248291015625, 0.0088348388671875, 0.06591796875, 0.1230010986328125, 0.180084228515625, 0.2371673583984375, 0.29425048828125, 0.3513336181640625, 0.408416748046875, 0.4654998779296875, 0.5225830078125, 0.5796661376953125, 0.636749267578125, 0.6938323974609375, 0.75091552734375, 0.8079986572265625, 0.865081787109375, 0.9221649169921875, 0.979248046875, 1.0363311767578125, 1.093414306640625, 1.1504974365234375, 1.20758056640625, 1.2646636962890625, 1.321746826171875, 1.3788299560546875, 1.4359130859375, 1.4929962158203125, 1.550079345703125, 1.6071624755859375, 1.66424560546875, 1.7213287353515625, 1.778411865234375, 1.8354949951171875, 1.892578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 11.0, 9.0, 7.0, 10.0, 24.0, 36.0, 49.0, 59.0, 105.0, 149.0, 164.0, 124.0, 89.0, 42.0, 30.0, 34.0, 16.0, 5.0, 6.0, 7.0, 3.0, 4.0, 7.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00022649765014648438, -0.00022042728960514069, -0.000214356929063797, -0.0002082865685224533, -0.00020221620798110962, -0.00019614584743976593, -0.00019007548689842224, -0.00018400512635707855, -0.00017793476581573486, -0.00017186440527439117, -0.00016579404473304749, -0.0001597236841917038, -0.0001536533236503601, -0.00014758296310901642, -0.00014151260256767273, -0.00013544224202632904, -0.00012937188148498535, -0.00012330152094364166, -0.00011723116040229797, -0.00011116079986095428, -0.0001050904393196106, -9.90200787782669e-05, -9.294971823692322e-05, -8.687935769557953e-05, -8.080899715423584e-05, -7.473863661289215e-05, -6.866827607154846e-05, -6.259791553020477e-05, -5.6527554988861084e-05, -5.0457194447517395e-05, -4.4386833906173706e-05, -3.831647336483002e-05, -3.224611282348633e-05, -2.617575228214264e-05, -2.010539174079895e-05, -1.4035031199455261e-05, -7.964670658111572e-06, -1.8943101167678833e-06, 4.176050424575806e-06, 1.0246410965919495e-05, 1.6316771507263184e-05, 2.2387132048606873e-05, 2.845749258995056e-05, 3.452785313129425e-05, 4.059821367263794e-05, 4.666857421398163e-05, 5.273893475532532e-05, 5.8809295296669006e-05, 6.48796558380127e-05, 7.095001637935638e-05, 7.702037692070007e-05, 8.309073746204376e-05, 8.916109800338745e-05, 9.523145854473114e-05, 0.00010130181908607483, 0.00010737217962741852, 0.00011344254016876221, 0.0001195129007101059, 0.00012558326125144958, 0.00013165362179279327, 0.00013772398233413696, 0.00014379434287548065, 0.00014986470341682434, 0.00015593506395816803, 0.00016200542449951172]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 14.0, 31.0, 66.0, 137.0, 357.0, 1119.0, 6299.0, 109992.0, 891617.0, 34344.0, 3338.0, 745.0, 271.0, 86.0, 52.0, 24.0, 9.0, 13.0, 6.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0859375, -2.0233612060546875, -1.960784912109375, -1.8982086181640625, -1.83563232421875, -1.7730560302734375, -1.710479736328125, -1.6479034423828125, -1.5853271484375, -1.5227508544921875, -1.460174560546875, -1.3975982666015625, -1.33502197265625, -1.2724456787109375, -1.209869384765625, -1.1472930908203125, -1.084716796875, -1.0221405029296875, -0.959564208984375, -0.8969879150390625, -0.83441162109375, -0.7718353271484375, -0.709259033203125, -0.6466827392578125, -0.5841064453125, -0.5215301513671875, -0.458953857421875, -0.3963775634765625, -0.33380126953125, -0.2712249755859375, -0.208648681640625, -0.1460723876953125, -0.08349609375, -0.0209197998046875, 0.041656494140625, 0.1042327880859375, 0.16680908203125, 0.2293853759765625, 0.291961669921875, 0.3545379638671875, 0.4171142578125, 0.4796905517578125, 0.542266845703125, 0.6048431396484375, 0.66741943359375, 0.7299957275390625, 0.792572021484375, 0.8551483154296875, 0.917724609375, 0.9803009033203125, 1.042877197265625, 1.1054534912109375, 1.16802978515625, 1.2306060791015625, 1.293182373046875, 1.3557586669921875, 1.4183349609375, 1.4809112548828125, 1.543487548828125, 1.6060638427734375, 1.66864013671875, 1.7312164306640625, 1.793792724609375, 1.8563690185546875, 1.9189453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 12.0, 8.0, 18.0, 24.0, 26.0, 36.0, 41.0, 70.0, 98.0, 138.0, 143.0, 111.0, 57.0, 47.0, 52.0, 32.0, 13.0, 22.0, 9.0, 9.0, 9.0, 4.0, 0.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.2607421875, -1.2282562255859375, -1.195770263671875, -1.1632843017578125, -1.13079833984375, -1.0983123779296875, -1.065826416015625, -1.0333404541015625, -1.0008544921875, -0.9683685302734375, -0.935882568359375, -0.9033966064453125, -0.87091064453125, -0.8384246826171875, -0.805938720703125, -0.7734527587890625, -0.740966796875, -0.7084808349609375, -0.675994873046875, -0.6435089111328125, -0.61102294921875, -0.5785369873046875, -0.546051025390625, -0.5135650634765625, -0.4810791015625, -0.4485931396484375, -0.416107177734375, -0.3836212158203125, -0.35113525390625, -0.3186492919921875, -0.286163330078125, -0.2536773681640625, -0.22119140625, -0.1887054443359375, -0.156219482421875, -0.1237335205078125, -0.09124755859375, -0.0587615966796875, -0.026275634765625, 0.0062103271484375, 0.0386962890625, 0.0711822509765625, 0.103668212890625, 0.1361541748046875, 0.16864013671875, 0.2011260986328125, 0.233612060546875, 0.2660980224609375, 0.298583984375, 0.3310699462890625, 0.363555908203125, 0.3960418701171875, 0.42852783203125, 0.4610137939453125, 0.493499755859375, 0.5259857177734375, 0.5584716796875, 0.5909576416015625, 0.623443603515625, 0.6559295654296875, 0.68841552734375, 0.7209014892578125, 0.753387451171875, 0.7858734130859375, 0.818359375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 20.0, 309.0, 627.0, 55.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-193.10693359375, -189.7327117919922, -186.35848999023438, -182.9842529296875, -179.6100311279297, -176.23580932617188, -172.86158752441406, -169.48736572265625, -166.11314392089844, -162.73892211914062, -159.3647003173828, -155.990478515625, -152.61624145507812, -149.2420196533203, -145.8677978515625, -142.4935760498047, -139.1193389892578, -135.7451171875, -132.3708953857422, -128.99667358398438, -125.62244415283203, -122.24821472167969, -118.87399291992188, -115.49977111816406, -112.12554931640625, -108.75132751464844, -105.3770980834961, -102.00287628173828, -98.62865447998047, -95.25442504882812, -91.88020324707031, -88.5059814453125, -85.13175964355469, -81.75753784179688, -78.38330841064453, -75.00908660888672, -71.6348648071289, -68.26063537597656, -64.88641357421875, -61.51218795776367, -58.137962341308594, -54.763736724853516, -51.3895149230957, -48.015289306640625, -44.64106369018555, -41.26683807373047, -37.892616271972656, -34.51839065551758, -31.144166946411133, -27.769943237304688, -24.39571762084961, -21.021493911743164, -17.64727020263672, -14.27304458618164, -10.898820877075195, -7.524595260620117, -4.150371551513672, -0.7761471271514893, 2.5980772972106934, 5.972301483154297, 9.346526145935059, 12.72075080871582, 16.094974517822266, 19.469200134277344, 22.84342384338379]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 5.0, 7.0, 8.0, 14.0, 16.0, 15.0, 16.0, 22.0, 27.0, 24.0, 28.0, 26.0, 38.0, 41.0, 34.0, 38.0, 44.0, 63.0, 39.0, 54.0, 34.0, 44.0, 41.0, 48.0, 30.0, 38.0, 34.0, 16.0, 18.0, 16.0, 13.0, 25.0, 13.0, 12.0, 9.0, 8.0, 9.0, 4.0, 4.0, 2.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.780782699584961, -13.335488319396973, -12.890193939208984, -12.444899559020996, -11.999605178833008, -11.554309844970703, -11.109015464782715, -10.663721084594727, -10.218426704406738, -9.77313232421875, -9.327837944030762, -8.882543563842773, -8.437248229980469, -7.991954326629639, -7.546659469604492, -7.101365089416504, -6.656070709228516, -6.210776329040527, -5.765481948852539, -5.320187091827393, -4.874892711639404, -4.429598331451416, -3.9843037128448486, -3.5390090942382812, -3.093714714050293, -2.6484203338623047, -2.2031257152557373, -1.7578312158584595, -1.3125367164611816, -0.8672423362731934, -0.421947717666626, 0.023346900939941406, 0.4686412811279297, 0.9139357805252075, 1.3592302799224854, 1.8045247793197632, 2.249819278717041, 2.6951136589050293, 3.1404082775115967, 3.585702896118164, 4.030997276306152, 4.476291656494141, 4.921586036682129, 5.366880893707275, 5.812175273895264, 6.257469654083252, 6.702764511108398, 7.148058891296387, 7.593353271484375, 8.038647651672363, 8.483942031860352, 8.92923641204834, 9.374530792236328, 9.819826126098633, 10.265120506286621, 10.71041488647461, 11.155709266662598, 11.601003646850586, 12.046298027038574, 12.491592407226562, 12.936887741088867, 13.382181167602539, 13.827476501464844, 14.272770881652832, 14.71806526184082]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 4.0, 2.0, 5.0, 10.0, 3.0, 8.0, 21.0, 18.0, 43.0, 34.0, 53.0, 64.0, 116.0, 218.0, 342.0, 592.0, 1174.0, 2443.0, 6495.0, 22224.0, 183341.0, 3889350.0, 66191.0, 13104.0, 4372.0, 1911.0, 888.0, 491.0, 278.0, 167.0, 109.0, 67.0, 42.0, 30.0, 20.0, 13.0, 7.0, 7.0, 1.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.56512451171875, -4.4193115234375, -4.27349853515625, -4.127685546875, -3.98187255859375, -3.8360595703125, -3.69024658203125, -3.54443359375, -3.39862060546875, -3.2528076171875, -3.10699462890625, -2.961181640625, -2.81536865234375, -2.6695556640625, -2.52374267578125, -2.3779296875, -2.23211669921875, -2.0863037109375, -1.94049072265625, -1.794677734375, -1.64886474609375, -1.5030517578125, -1.35723876953125, -1.21142578125, -1.06561279296875, -0.9197998046875, -0.77398681640625, -0.628173828125, -0.48236083984375, -0.3365478515625, -0.19073486328125, -0.044921875, 0.10089111328125, 0.2467041015625, 0.39251708984375, 0.538330078125, 0.68414306640625, 0.8299560546875, 0.97576904296875, 1.12158203125, 1.26739501953125, 1.4132080078125, 1.55902099609375, 1.704833984375, 1.85064697265625, 1.9964599609375, 2.14227294921875, 2.2880859375, 2.43389892578125, 2.5797119140625, 2.72552490234375, 2.871337890625, 3.01715087890625, 3.1629638671875, 3.30877685546875, 3.45458984375, 3.60040283203125, 3.7462158203125, 3.89202880859375, 4.037841796875, 4.18365478515625, 4.3294677734375, 4.47528076171875, 4.62109375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 11.0, 11.0, 11.0, 16.0, 23.0, 26.0, 38.0, 36.0, 54.0, 57.0, 61.0, 78.0, 80.0, 68.0, 75.0, 60.0, 53.0, 53.0, 41.0, 29.0, 26.0, 22.0, 17.0, 13.0, 11.0, 5.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3662109375, -1.328033447265625, -1.28985595703125, -1.251678466796875, -1.2135009765625, -1.175323486328125, -1.13714599609375, -1.098968505859375, -1.060791015625, -1.022613525390625, -0.98443603515625, -0.946258544921875, -0.9080810546875, -0.869903564453125, -0.83172607421875, -0.793548583984375, -0.75537109375, -0.717193603515625, -0.67901611328125, -0.640838623046875, -0.6026611328125, -0.564483642578125, -0.52630615234375, -0.488128662109375, -0.449951171875, -0.411773681640625, -0.37359619140625, -0.335418701171875, -0.2972412109375, -0.259063720703125, -0.22088623046875, -0.182708740234375, -0.14453125, -0.106353759765625, -0.06817626953125, -0.029998779296875, 0.0081787109375, 0.046356201171875, 0.08453369140625, 0.122711181640625, 0.160888671875, 0.199066162109375, 0.23724365234375, 0.275421142578125, 0.3135986328125, 0.351776123046875, 0.38995361328125, 0.428131103515625, 0.46630859375, 0.504486083984375, 0.54266357421875, 0.580841064453125, 0.6190185546875, 0.657196044921875, 0.69537353515625, 0.733551025390625, 0.771728515625, 0.809906005859375, 0.84808349609375, 0.886260986328125, 0.9244384765625, 0.962615966796875, 1.00079345703125, 1.038970947265625, 1.0771484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 25.0, 45.0, 98.0, 197.0, 547.0, 1419.0, 4592.0, 21127.0, 263116.0, 3837485.0, 53041.0, 8776.0, 2370.0, 807.0, 355.0, 138.0, 55.0, 35.0, 12.0, 10.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.59765625, -6.4049072265625, -6.212158203125, -6.0194091796875, -5.82666015625, -5.6339111328125, -5.441162109375, -5.2484130859375, -5.0556640625, -4.8629150390625, -4.670166015625, -4.4774169921875, -4.28466796875, -4.0919189453125, -3.899169921875, -3.7064208984375, -3.513671875, -3.3209228515625, -3.128173828125, -2.9354248046875, -2.74267578125, -2.5499267578125, -2.357177734375, -2.1644287109375, -1.9716796875, -1.7789306640625, -1.586181640625, -1.3934326171875, -1.20068359375, -1.0079345703125, -0.815185546875, -0.6224365234375, -0.4296875, -0.2369384765625, -0.044189453125, 0.1485595703125, 0.34130859375, 0.5340576171875, 0.726806640625, 0.9195556640625, 1.1123046875, 1.3050537109375, 1.497802734375, 1.6905517578125, 1.88330078125, 2.0760498046875, 2.268798828125, 2.4615478515625, 2.654296875, 2.8470458984375, 3.039794921875, 3.2325439453125, 3.42529296875, 3.6180419921875, 3.810791015625, 4.0035400390625, 4.1962890625, 4.3890380859375, 4.581787109375, 4.7745361328125, 4.96728515625, 5.1600341796875, 5.352783203125, 5.5455322265625, 5.73828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 9.0, 20.0, 18.0, 21.0, 47.0, 110.0, 235.0, 2284.0, 836.0, 207.0, 97.0, 49.0, 34.0, 14.0, 21.0, 21.0, 7.0, 11.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.097442626953125, -2.04058837890625, -1.983734130859375, -1.9268798828125, -1.870025634765625, -1.81317138671875, -1.756317138671875, -1.699462890625, -1.642608642578125, -1.58575439453125, -1.528900146484375, -1.4720458984375, -1.415191650390625, -1.35833740234375, -1.301483154296875, -1.24462890625, -1.187774658203125, -1.13092041015625, -1.074066162109375, -1.0172119140625, -0.960357666015625, -0.90350341796875, -0.846649169921875, -0.789794921875, -0.732940673828125, -0.67608642578125, -0.619232177734375, -0.5623779296875, -0.505523681640625, -0.44866943359375, -0.391815185546875, -0.3349609375, -0.278106689453125, -0.22125244140625, -0.164398193359375, -0.1075439453125, -0.050689697265625, 0.00616455078125, 0.063018798828125, 0.119873046875, 0.176727294921875, 0.23358154296875, 0.290435791015625, 0.3472900390625, 0.404144287109375, 0.46099853515625, 0.517852783203125, 0.57470703125, 0.631561279296875, 0.68841552734375, 0.745269775390625, 0.8021240234375, 0.858978271484375, 0.91583251953125, 0.972686767578125, 1.029541015625, 1.086395263671875, 1.14324951171875, 1.200103759765625, 1.2569580078125, 1.313812255859375, 1.37066650390625, 1.427520751953125, 1.484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 33.0, 325.0, 488.0, 125.0, 21.0, 11.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.38621997833252, -10.344137191772461, -9.302054405212402, -8.259971618652344, -7.217888355255127, -6.175805568695068, -5.133722305297852, -4.091639518737793, -3.0495567321777344, -2.007473945617676, -0.9653909206390381, 0.07669210433959961, 1.1187748908996582, 2.160857677459717, 3.2029409408569336, 4.245023727416992, 5.287106513977051, 6.329189300537109, 7.371272087097168, 8.413354873657227, 9.455438613891602, 10.497520446777344, 11.539604187011719, 12.581686973571777, 13.623769760131836, 14.665852546691895, 15.707935333251953, 16.750019073486328, 17.79210090637207, 18.834184646606445, 19.876266479492188, 20.918350219726562, 21.960433959960938, 23.002517700195312, 24.044599533081055, 25.08668327331543, 26.128765106201172, 27.170848846435547, 28.212932586669922, 29.255014419555664, 30.297096252441406, 31.33917999267578, 32.381263732910156, 33.423343658447266, 34.46542739868164, 35.507511138916016, 36.54959487915039, 37.5916748046875, 38.633758544921875, 39.67584228515625, 40.717926025390625, 41.760005950927734, 42.80208969116211, 43.844173431396484, 44.88625717163086, 45.92833709716797, 46.97042465209961, 48.012508392333984, 49.05459213256836, 50.09667205810547, 51.138755798339844, 52.18083953857422, 53.222923278808594, 54.26500701904297, 55.30708694458008]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 10.0, 10.0, 14.0, 16.0, 15.0, 27.0, 29.0, 38.0, 37.0, 35.0, 43.0, 49.0, 48.0, 51.0, 32.0, 51.0, 55.0, 49.0, 46.0, 38.0, 39.0, 38.0, 40.0, 23.0, 36.0, 28.0, 21.0, 17.0, 18.0, 9.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-7.671318054199219, -7.475038051605225, -7.278757572174072, -7.082477569580078, -6.886197090148926, -6.689917087554932, -6.4936370849609375, -6.297356605529785, -6.101076126098633, -5.904796123504639, -5.708515644073486, -5.512235641479492, -5.31595516204834, -5.119675159454346, -4.923395156860352, -4.727114677429199, -4.530834674835205, -4.334554672241211, -4.138274192810059, -3.9419941902160645, -3.745713710784912, -3.549433708190918, -3.3531534671783447, -3.1568732261657715, -2.9605929851531982, -2.764312744140625, -2.5680325031280518, -2.3717522621154785, -2.1754722595214844, -1.9791918992996216, -1.782911777496338, -1.5866315364837646, -1.3903512954711914, -1.1940710544586182, -0.9977908730506897, -0.8015106916427612, -0.605230450630188, -0.40895020961761475, -0.21267008781433105, -0.016389846801757812, 0.17989039421081543, 0.3761706054210663, 0.5724508166313171, 0.7687309980392456, 0.9650112390518188, 1.161291480064392, 1.3575716018676758, 1.553851842880249, 1.7501320838928223, 1.9464123249053955, 2.1426925659179688, 2.338972568511963, 2.5352530479431152, 2.7315330505371094, 2.9278132915496826, 3.124093532562256, 3.320373773574829, 3.5166540145874023, 3.7129342555999756, 3.909214496612549, 4.105494499206543, 4.301774978637695, 4.4980549812316895, 4.694334983825684, 4.890615463256836]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 0.0, 3.0, 8.0, 10.0, 15.0, 18.0, 28.0, 38.0, 51.0, 74.0, 91.0, 106.0, 195.0, 281.0, 478.0, 854.0, 1678.0, 3838.0, 9716.0, 31442.0, 138010.0, 555264.0, 234226.0, 48535.0, 13776.0, 4966.0, 2137.0, 1037.0, 617.0, 339.0, 202.0, 149.0, 118.0, 65.0, 52.0, 29.0, 29.0, 22.0, 13.0, 16.0, 10.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.3125, -5.1546630859375, -4.996826171875, -4.8389892578125, -4.68115234375, -4.5233154296875, -4.365478515625, -4.2076416015625, -4.0498046875, -3.8919677734375, -3.734130859375, -3.5762939453125, -3.41845703125, -3.2606201171875, -3.102783203125, -2.9449462890625, -2.787109375, -2.6292724609375, -2.471435546875, -2.3135986328125, -2.15576171875, -1.9979248046875, -1.840087890625, -1.6822509765625, -1.5244140625, -1.3665771484375, -1.208740234375, -1.0509033203125, -0.89306640625, -0.7352294921875, -0.577392578125, -0.4195556640625, -0.26171875, -0.1038818359375, 0.053955078125, 0.2117919921875, 0.36962890625, 0.5274658203125, 0.685302734375, 0.8431396484375, 1.0009765625, 1.1588134765625, 1.316650390625, 1.4744873046875, 1.63232421875, 1.7901611328125, 1.947998046875, 2.1058349609375, 2.263671875, 2.4215087890625, 2.579345703125, 2.7371826171875, 2.89501953125, 3.0528564453125, 3.210693359375, 3.3685302734375, 3.5263671875, 3.6842041015625, 3.842041015625, 3.9998779296875, 4.15771484375, 4.3155517578125, 4.473388671875, 4.6312255859375, 4.7890625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 8.0, 8.0, 16.0, 24.0, 26.0, 27.0, 37.0, 52.0, 51.0, 49.0, 74.0, 62.0, 69.0, 82.0, 75.0, 50.0, 50.0, 54.0, 36.0, 25.0, 19.0, 33.0, 13.0, 15.0, 13.0, 4.0, 8.0, 2.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.390625, -1.3526153564453125, -1.314605712890625, -1.2765960693359375, -1.23858642578125, -1.2005767822265625, -1.162567138671875, -1.1245574951171875, -1.0865478515625, -1.0485382080078125, -1.010528564453125, -0.9725189208984375, -0.93450927734375, -0.8964996337890625, -0.858489990234375, -0.8204803466796875, -0.782470703125, -0.7444610595703125, -0.706451416015625, -0.6684417724609375, -0.63043212890625, -0.5924224853515625, -0.554412841796875, -0.5164031982421875, -0.4783935546875, -0.4403839111328125, -0.402374267578125, -0.3643646240234375, -0.32635498046875, -0.2883453369140625, -0.250335693359375, -0.2123260498046875, -0.17431640625, -0.1363067626953125, -0.098297119140625, -0.0602874755859375, -0.02227783203125, 0.0157318115234375, 0.053741455078125, 0.0917510986328125, 0.1297607421875, 0.1677703857421875, 0.205780029296875, 0.2437896728515625, 0.28179931640625, 0.3198089599609375, 0.357818603515625, 0.3958282470703125, 0.433837890625, 0.4718475341796875, 0.509857177734375, 0.5478668212890625, 0.58587646484375, 0.6238861083984375, 0.661895751953125, 0.6999053955078125, 0.7379150390625, 0.7759246826171875, 0.813934326171875, 0.8519439697265625, 0.88995361328125, 0.9279632568359375, 0.965972900390625, 1.0039825439453125, 1.0419921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 15.0, 13.0, 14.0, 17.0, 51.0, 57.0, 115.0, 179.0, 325.0, 628.0, 1364.0, 3142.0, 7750.0, 27045.0, 132343.0, 589267.0, 225869.0, 41784.0, 11039.0, 3979.0, 1676.0, 873.0, 404.0, 224.0, 122.0, 88.0, 42.0, 27.0, 27.0, 19.0, 10.0, 6.0, 6.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.83673095703125, -4.6929931640625, -4.54925537109375, -4.405517578125, -4.26177978515625, -4.1180419921875, -3.97430419921875, -3.83056640625, -3.68682861328125, -3.5430908203125, -3.39935302734375, -3.255615234375, -3.11187744140625, -2.9681396484375, -2.82440185546875, -2.6806640625, -2.53692626953125, -2.3931884765625, -2.24945068359375, -2.105712890625, -1.96197509765625, -1.8182373046875, -1.67449951171875, -1.53076171875, -1.38702392578125, -1.2432861328125, -1.09954833984375, -0.955810546875, -0.81207275390625, -0.6683349609375, -0.52459716796875, -0.380859375, -0.23712158203125, -0.0933837890625, 0.05035400390625, 0.194091796875, 0.33782958984375, 0.4815673828125, 0.62530517578125, 0.76904296875, 0.91278076171875, 1.0565185546875, 1.20025634765625, 1.343994140625, 1.48773193359375, 1.6314697265625, 1.77520751953125, 1.9189453125, 2.06268310546875, 2.2064208984375, 2.35015869140625, 2.493896484375, 2.63763427734375, 2.7813720703125, 2.92510986328125, 3.06884765625, 3.21258544921875, 3.3563232421875, 3.50006103515625, 3.643798828125, 3.78753662109375, 3.9312744140625, 4.07501220703125, 4.21875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 7.0, 9.0, 8.0, 9.0, 12.0, 15.0, 24.0, 25.0, 25.0, 31.0, 47.0, 45.0, 42.0, 48.0, 55.0, 62.0, 53.0, 58.0, 64.0, 46.0, 49.0, 24.0, 40.0, 41.0, 34.0, 30.0, 32.0, 16.0, 14.0, 9.0, 5.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.6484375, -4.49285888671875, -4.3372802734375, -4.18170166015625, -4.026123046875, -3.87054443359375, -3.7149658203125, -3.55938720703125, -3.40380859375, -3.24822998046875, -3.0926513671875, -2.93707275390625, -2.781494140625, -2.62591552734375, -2.4703369140625, -2.31475830078125, -2.1591796875, -2.00360107421875, -1.8480224609375, -1.69244384765625, -1.536865234375, -1.38128662109375, -1.2257080078125, -1.07012939453125, -0.91455078125, -0.75897216796875, -0.6033935546875, -0.44781494140625, -0.292236328125, -0.13665771484375, 0.0189208984375, 0.17449951171875, 0.330078125, 0.48565673828125, 0.6412353515625, 0.79681396484375, 0.952392578125, 1.10797119140625, 1.2635498046875, 1.41912841796875, 1.57470703125, 1.73028564453125, 1.8858642578125, 2.04144287109375, 2.197021484375, 2.35260009765625, 2.5081787109375, 2.66375732421875, 2.8193359375, 2.97491455078125, 3.1304931640625, 3.28607177734375, 3.441650390625, 3.59722900390625, 3.7528076171875, 3.90838623046875, 4.06396484375, 4.21954345703125, 4.3751220703125, 4.53070068359375, 4.686279296875, 4.84185791015625, 4.9974365234375, 5.15301513671875, 5.30859375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 10.0, 3.0, 17.0, 18.0, 26.0, 38.0, 58.0, 90.0, 133.0, 238.0, 416.0, 731.0, 1503.0, 3637.0, 12516.0, 125881.0, 838340.0, 51387.0, 8156.0, 2681.0, 1158.0, 569.0, 376.0, 215.0, 96.0, 85.0, 57.0, 34.0, 26.0, 17.0, 12.0, 11.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.9375, -3.82916259765625, -3.7208251953125, -3.61248779296875, -3.504150390625, -3.39581298828125, -3.2874755859375, -3.17913818359375, -3.07080078125, -2.96246337890625, -2.8541259765625, -2.74578857421875, -2.637451171875, -2.52911376953125, -2.4207763671875, -2.31243896484375, -2.2041015625, -2.09576416015625, -1.9874267578125, -1.87908935546875, -1.770751953125, -1.66241455078125, -1.5540771484375, -1.44573974609375, -1.33740234375, -1.22906494140625, -1.1207275390625, -1.01239013671875, -0.904052734375, -0.79571533203125, -0.6873779296875, -0.57904052734375, -0.470703125, -0.36236572265625, -0.2540283203125, -0.14569091796875, -0.037353515625, 0.07098388671875, 0.1793212890625, 0.28765869140625, 0.39599609375, 0.50433349609375, 0.6126708984375, 0.72100830078125, 0.829345703125, 0.93768310546875, 1.0460205078125, 1.15435791015625, 1.2626953125, 1.37103271484375, 1.4793701171875, 1.58770751953125, 1.696044921875, 1.80438232421875, 1.9127197265625, 2.02105712890625, 2.12939453125, 2.23773193359375, 2.3460693359375, 2.45440673828125, 2.562744140625, 2.67108154296875, 2.7794189453125, 2.88775634765625, 2.99609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 6.0, 12.0, 17.0, 19.0, 30.0, 48.0, 71.0, 117.0, 162.0, 154.0, 115.0, 81.0, 53.0, 36.0, 25.0, 12.0, 7.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002970695495605469, -0.00028610602021217346, -0.00027514249086380005, -0.00026417896151542664, -0.0002532154321670532, -0.0002422519028186798, -0.0002312883734703064, -0.00022032484412193298, -0.00020936131477355957, -0.00019839778542518616, -0.00018743425607681274, -0.00017647072672843933, -0.00016550719738006592, -0.0001545436680316925, -0.0001435801386833191, -0.00013261660933494568, -0.00012165307998657227, -0.00011068955063819885, -9.972602128982544e-05, -8.876249194145203e-05, -7.779896259307861e-05, -6.68354332447052e-05, -5.587190389633179e-05, -4.4908374547958374e-05, -3.394484519958496e-05, -2.2981315851211548e-05, -1.2017786502838135e-05, -1.0542571544647217e-06, 9.909272193908691e-06, 2.0872801542282104e-05, 3.183633089065552e-05, 4.279986023902893e-05, 5.3763389587402344e-05, 6.472691893577576e-05, 7.569044828414917e-05, 8.665397763252258e-05, 9.7617506980896e-05, 0.00010858103632926941, 0.00011954456567764282, 0.00013050809502601624, 0.00014147162437438965, 0.00015243515372276306, 0.00016339868307113647, 0.0001743622124195099, 0.0001853257417678833, 0.00019628927111625671, 0.00020725280046463013, 0.00021821632981300354, 0.00022917985916137695, 0.00024014338850975037, 0.0002511069178581238, 0.0002620704472064972, 0.0002730339765548706, 0.000283997505903244, 0.00029496103525161743, 0.00030592456459999084, 0.00031688809394836426, 0.00032785162329673767, 0.0003388151526451111, 0.0003497786819934845, 0.0003607422113418579, 0.0003717057406902313, 0.00038266927003860474, 0.00039363279938697815, 0.00040459632873535156]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 21.0, 19.0, 22.0, 41.0, 71.0, 96.0, 176.0, 414.0, 1186.0, 8046.0, 726467.0, 304752.0, 5440.0, 996.0, 324.0, 164.0, 91.0, 77.0, 38.0, 29.0, 18.0, 10.0, 13.0, 15.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.35009765625, -6.1572265625, -5.96435546875, -5.771484375, -5.57861328125, -5.3857421875, -5.19287109375, -5.0, -4.80712890625, -4.6142578125, -4.42138671875, -4.228515625, -4.03564453125, -3.8427734375, -3.64990234375, -3.45703125, -3.26416015625, -3.0712890625, -2.87841796875, -2.685546875, -2.49267578125, -2.2998046875, -2.10693359375, -1.9140625, -1.72119140625, -1.5283203125, -1.33544921875, -1.142578125, -0.94970703125, -0.7568359375, -0.56396484375, -0.37109375, -0.17822265625, 0.0146484375, 0.20751953125, 0.400390625, 0.59326171875, 0.7861328125, 0.97900390625, 1.171875, 1.36474609375, 1.5576171875, 1.75048828125, 1.943359375, 2.13623046875, 2.3291015625, 2.52197265625, 2.71484375, 2.90771484375, 3.1005859375, 3.29345703125, 3.486328125, 3.67919921875, 3.8720703125, 4.06494140625, 4.2578125, 4.45068359375, 4.6435546875, 4.83642578125, 5.029296875, 5.22216796875, 5.4150390625, 5.60791015625, 5.80078125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 7.0, 11.0, 21.0, 66.0, 151.0, 356.0, 234.0, 76.0, 48.0, 16.0, 9.0, 9.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7734375, -6.5291748046875, -6.284912109375, -6.0406494140625, -5.79638671875, -5.5521240234375, -5.307861328125, -5.0635986328125, -4.8193359375, -4.5750732421875, -4.330810546875, -4.0865478515625, -3.84228515625, -3.5980224609375, -3.353759765625, -3.1094970703125, -2.865234375, -2.6209716796875, -2.376708984375, -2.1324462890625, -1.88818359375, -1.6439208984375, -1.399658203125, -1.1553955078125, -0.9111328125, -0.6668701171875, -0.422607421875, -0.1783447265625, 0.06591796875, 0.3101806640625, 0.554443359375, 0.7987060546875, 1.04296875, 1.2872314453125, 1.531494140625, 1.7757568359375, 2.02001953125, 2.2642822265625, 2.508544921875, 2.7528076171875, 2.9970703125, 3.2413330078125, 3.485595703125, 3.7298583984375, 3.97412109375, 4.2183837890625, 4.462646484375, 4.7069091796875, 4.951171875, 5.1954345703125, 5.439697265625, 5.6839599609375, 5.92822265625, 6.1724853515625, 6.416748046875, 6.6610107421875, 6.9052734375, 7.1495361328125, 7.393798828125, 7.6380615234375, 7.88232421875, 8.1265869140625, 8.370849609375, 8.6151123046875, 8.859375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 5.0, 8.0, 24.0, 17.0, 54.0, 130.0, 207.0, 229.0, 166.0, 78.0, 48.0, 25.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.90658950805664, -17.215009689331055, -15.523430824279785, -13.831851959228516, -12.14027214050293, -10.448692321777344, -8.757113456726074, -7.065534591674805, -5.373954772949219, -3.682375431060791, -1.9907960891723633, -0.29921674728393555, 1.3923625946044922, 3.083942413330078, 4.775521278381348, 6.467100143432617, 8.158679962158203, 9.850259780883789, 11.541838645935059, 13.233417510986328, 14.924997329711914, 16.6165771484375, 18.308155059814453, 19.99973487854004, 21.691314697265625, 23.38289451599121, 25.074474334716797, 26.76605224609375, 28.457632064819336, 30.149211883544922, 31.840789794921875, 33.532371520996094, 35.22395324707031, 36.915531158447266, 38.607112884521484, 40.29869079589844, 41.990272521972656, 43.68185043334961, 45.37342834472656, 47.06501007080078, 48.756587982177734, 50.44816589355469, 52.139747619628906, 53.83132553100586, 55.52290344238281, 57.21448516845703, 58.906063079833984, 60.59764099121094, 62.289222717285156, 63.98080062866211, 65.67237854003906, 67.36396026611328, 69.0555419921875, 70.74711608886719, 72.4386978149414, 74.13027954101562, 75.82185363769531, 77.51343536376953, 79.20500946044922, 80.89659118652344, 82.58817291259766, 84.27975463867188, 85.97132873535156, 87.66291046142578, 89.3544921875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 10.0, 14.0, 16.0, 20.0, 20.0, 17.0, 31.0, 32.0, 34.0, 46.0, 41.0, 41.0, 36.0, 52.0, 54.0, 41.0, 36.0, 57.0, 47.0, 50.0, 41.0, 31.0, 31.0, 34.0, 26.0, 23.0, 24.0, 18.0, 7.0, 10.0, 13.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.955293655395508, -24.15846824645996, -23.361642837524414, -22.564817428588867, -21.767990112304688, -20.97116470336914, -20.174339294433594, -19.377513885498047, -18.5806884765625, -17.783863067626953, -16.987037658691406, -16.19021224975586, -15.393385887145996, -14.59656047821045, -13.799734115600586, -13.002908706665039, -12.206083297729492, -11.409257888793945, -10.612432479858398, -9.815606117248535, -9.018780708312988, -8.221955299377441, -7.425129413604736, -6.628303527832031, -5.831478118896484, -5.0346527099609375, -4.237826824188232, -3.4410011768341064, -2.6441755294799805, -1.8473498821258545, -1.0505242347717285, -0.25369834899902344, 0.5431251525878906, 1.3399507999420166, 2.1367764472961426, 2.9336020946502686, 3.7304277420043945, 4.527253150939941, 5.3240790367126465, 6.120904922485352, 6.917730331420898, 7.714555740356445, 8.511381149291992, 9.308207511901855, 10.105032920837402, 10.90185832977295, 11.698684692382812, 12.49551010131836, 13.292335510253906, 14.089160919189453, 14.885986328125, 15.682812690734863, 16.479637145996094, 17.276464462280273, 18.07328987121582, 18.870115280151367, 19.666940689086914, 20.46376609802246, 21.260591506958008, 22.057416915893555, 22.854244232177734, 23.65106964111328, 24.447895050048828, 25.244720458984375, 26.041545867919922]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 11.0, 18.0, 13.0, 24.0, 34.0, 57.0, 80.0, 199.0, 351.0, 861.0, 3134.0, 22462.0, 3982653.0, 172741.0, 8632.0, 1798.0, 570.0, 286.0, 132.0, 73.0, 35.0, 35.0, 26.0, 13.0, 10.0, 9.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4765625, -11.1368408203125, -10.797119140625, -10.4573974609375, -10.11767578125, -9.7779541015625, -9.438232421875, -9.0985107421875, -8.7587890625, -8.4190673828125, -8.079345703125, -7.7396240234375, -7.39990234375, -7.0601806640625, -6.720458984375, -6.3807373046875, -6.041015625, -5.7012939453125, -5.361572265625, -5.0218505859375, -4.68212890625, -4.3424072265625, -4.002685546875, -3.6629638671875, -3.3232421875, -2.9835205078125, -2.643798828125, -2.3040771484375, -1.96435546875, -1.6246337890625, -1.284912109375, -0.9451904296875, -0.60546875, -0.2657470703125, 0.073974609375, 0.4136962890625, 0.75341796875, 1.0931396484375, 1.432861328125, 1.7725830078125, 2.1123046875, 2.4520263671875, 2.791748046875, 3.1314697265625, 3.47119140625, 3.8109130859375, 4.150634765625, 4.4903564453125, 4.830078125, 5.1697998046875, 5.509521484375, 5.8492431640625, 6.18896484375, 6.5286865234375, 6.868408203125, 7.2081298828125, 7.5478515625, 7.8875732421875, 8.227294921875, 8.5670166015625, 8.90673828125, 9.2464599609375, 9.586181640625, 9.9259033203125, 10.265625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 11.0, 7.0, 15.0, 14.0, 14.0, 23.0, 29.0, 35.0, 42.0, 53.0, 48.0, 55.0, 56.0, 65.0, 65.0, 65.0, 63.0, 51.0, 42.0, 48.0, 26.0, 43.0, 30.0, 17.0, 19.0, 16.0, 12.0, 9.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.388671875, -1.34814453125, -1.3076171875, -1.26708984375, -1.2265625, -1.18603515625, -1.1455078125, -1.10498046875, -1.064453125, -1.02392578125, -0.9833984375, -0.94287109375, -0.90234375, -0.86181640625, -0.8212890625, -0.78076171875, -0.740234375, -0.69970703125, -0.6591796875, -0.61865234375, -0.578125, -0.53759765625, -0.4970703125, -0.45654296875, -0.416015625, -0.37548828125, -0.3349609375, -0.29443359375, -0.25390625, -0.21337890625, -0.1728515625, -0.13232421875, -0.091796875, -0.05126953125, -0.0107421875, 0.02978515625, 0.0703125, 0.11083984375, 0.1513671875, 0.19189453125, 0.232421875, 0.27294921875, 0.3134765625, 0.35400390625, 0.39453125, 0.43505859375, 0.4755859375, 0.51611328125, 0.556640625, 0.59716796875, 0.6376953125, 0.67822265625, 0.71875, 0.75927734375, 0.7998046875, 0.84033203125, 0.880859375, 0.92138671875, 0.9619140625, 1.00244140625, 1.04296875, 1.08349609375, 1.1240234375, 1.16455078125, 1.205078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 10.0, 12.0, 8.0, 20.0, 29.0, 33.0, 42.0, 81.0, 124.0, 181.0, 352.0, 603.0, 1194.0, 2782.0, 8240.0, 40677.0, 3026179.0, 1066894.0, 34446.0, 7290.0, 2549.0, 1180.0, 612.0, 262.0, 151.0, 111.0, 61.0, 55.0, 26.0, 24.0, 23.0, 13.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53125, -7.2879638671875, -7.044677734375, -6.8013916015625, -6.55810546875, -6.3148193359375, -6.071533203125, -5.8282470703125, -5.5849609375, -5.3416748046875, -5.098388671875, -4.8551025390625, -4.61181640625, -4.3685302734375, -4.125244140625, -3.8819580078125, -3.638671875, -3.3953857421875, -3.152099609375, -2.9088134765625, -2.66552734375, -2.4222412109375, -2.178955078125, -1.9356689453125, -1.6923828125, -1.4490966796875, -1.205810546875, -0.9625244140625, -0.71923828125, -0.4759521484375, -0.232666015625, 0.0106201171875, 0.25390625, 0.4971923828125, 0.740478515625, 0.9837646484375, 1.22705078125, 1.4703369140625, 1.713623046875, 1.9569091796875, 2.2001953125, 2.4434814453125, 2.686767578125, 2.9300537109375, 3.17333984375, 3.4166259765625, 3.659912109375, 3.9031982421875, 4.146484375, 4.3897705078125, 4.633056640625, 4.8763427734375, 5.11962890625, 5.3629150390625, 5.606201171875, 5.8494873046875, 6.0927734375, 6.3360595703125, 6.579345703125, 6.8226318359375, 7.06591796875, 7.3092041015625, 7.552490234375, 7.7957763671875, 8.0390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 7.0, 10.0, 15.0, 23.0, 35.0, 67.0, 161.0, 627.0, 2610.0, 319.0, 88.0, 62.0, 17.0, 10.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2578125, -6.113311767578125, -5.96881103515625, -5.824310302734375, -5.6798095703125, -5.535308837890625, -5.39080810546875, -5.246307373046875, -5.101806640625, -4.957305908203125, -4.81280517578125, -4.668304443359375, -4.5238037109375, -4.379302978515625, -4.23480224609375, -4.090301513671875, -3.94580078125, -3.801300048828125, -3.65679931640625, -3.512298583984375, -3.3677978515625, -3.223297119140625, -3.07879638671875, -2.934295654296875, -2.789794921875, -2.645294189453125, -2.50079345703125, -2.356292724609375, -2.2117919921875, -2.067291259765625, -1.92279052734375, -1.778289794921875, -1.6337890625, -1.489288330078125, -1.34478759765625, -1.200286865234375, -1.0557861328125, -0.911285400390625, -0.76678466796875, -0.622283935546875, -0.477783203125, -0.333282470703125, -0.18878173828125, -0.044281005859375, 0.1002197265625, 0.244720458984375, 0.38922119140625, 0.533721923828125, 0.67822265625, 0.822723388671875, 0.96722412109375, 1.111724853515625, 1.2562255859375, 1.400726318359375, 1.54522705078125, 1.689727783203125, 1.834228515625, 1.978729248046875, 2.12322998046875, 2.267730712890625, 2.4122314453125, 2.556732177734375, 2.70123291015625, 2.845733642578125, 2.990234375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 8.0, 36.0, 104.0, 335.0, 394.0, 96.0, 19.0, 8.0, 3.0, 2.0, 1.0], "bins": [-92.97163391113281, -91.34947967529297, -89.72732543945312, -88.10517120361328, -86.48301696777344, -84.8608627319336, -83.23870849609375, -81.6165542602539, -79.99440002441406, -78.37224578857422, -76.75009155273438, -75.12793731689453, -73.50578308105469, -71.88362884521484, -70.261474609375, -68.63932037353516, -67.01716613769531, -65.39501190185547, -63.772857666015625, -62.15070343017578, -60.52854919433594, -58.906394958496094, -57.28424072265625, -55.662086486816406, -54.03993225097656, -52.41777801513672, -50.795623779296875, -49.17346954345703, -47.55131530761719, -45.929161071777344, -44.3070068359375, -42.684852600097656, -41.06269836425781, -39.44054412841797, -37.818389892578125, -36.19623565673828, -34.57408142089844, -32.951927185058594, -31.32977294921875, -29.707618713378906, -28.085464477539062, -26.46331024169922, -24.841156005859375, -23.21900177001953, -21.596847534179688, -19.974693298339844, -18.3525390625, -16.730384826660156, -15.108230590820312, -13.486076354980469, -11.863922119140625, -10.241767883300781, -8.619613647460938, -6.997459411621094, -5.37530517578125, -3.7531509399414062, -2.1309967041015625, -0.5088424682617188, 1.113311767578125, 2.7354660034179688, 4.3576202392578125, 5.979774475097656, 7.6019287109375, 9.224082946777344, 10.846237182617188]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 13.0, 10.0, 11.0, 11.0, 15.0, 14.0, 18.0, 27.0, 44.0, 43.0, 36.0, 49.0, 47.0, 59.0, 46.0, 37.0, 48.0, 32.0, 45.0, 46.0, 45.0, 39.0, 28.0, 30.0, 31.0, 30.0, 26.0, 22.0, 18.0, 21.0, 10.0, 12.0, 10.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.471174240112305, -12.124832153320312, -11.77849006652832, -11.432147979736328, -11.085805892944336, -10.739463806152344, -10.393121719360352, -10.046778678894043, -9.70043659210205, -9.354094505310059, -9.007752418518066, -8.661410331726074, -8.315068244934082, -7.968725681304932, -7.6223835945129395, -7.276041030883789, -6.929699420928955, -6.583357334136963, -6.237015247344971, -5.89067268371582, -5.544330596923828, -5.197988510131836, -4.851646423339844, -4.505304336547852, -4.158962249755859, -3.812620162963867, -3.466277837753296, -3.1199357509613037, -2.7735934257507324, -2.4272513389587402, -2.080909252166748, -1.7345669269561768, -1.3882246017456055, -1.0418823957443237, -0.6955402493476868, -0.3491981029510498, -0.0028558969497680664, 0.34348630905151367, 0.6898283958435059, 1.0361707210540771, 1.3825128078460693, 1.728855013847351, 2.075197219848633, 2.421539306640625, 2.767881393432617, 3.1142237186431885, 3.4605658054351807, 3.806908130645752, 4.153250217437744, 4.499592304229736, 4.8459343910217285, 5.192276954650879, 5.538619041442871, 5.884961128234863, 6.2313032150268555, 6.577645301818848, 6.92398738861084, 7.270329475402832, 7.616671562194824, 7.963013648986816, 8.309355735778809, 8.655698776245117, 9.00204086303711, 9.348382949829102, 9.694725036621094]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 7.0, 10.0, 11.0, 16.0, 19.0, 33.0, 36.0, 50.0, 70.0, 119.0, 166.0, 254.0, 376.0, 642.0, 1073.0, 1958.0, 3742.0, 7096.0, 15794.0, 38895.0, 110121.0, 313546.0, 346374.0, 128630.0, 44437.0, 17864.0, 7955.0, 3975.0, 2123.0, 1204.0, 683.0, 441.0, 276.0, 162.0, 121.0, 83.0, 54.0, 37.0, 24.0, 25.0, 14.0, 15.0, 12.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.52734375, -4.39044189453125, -4.2535400390625, -4.11663818359375, -3.979736328125, -3.84283447265625, -3.7059326171875, -3.56903076171875, -3.43212890625, -3.29522705078125, -3.1583251953125, -3.02142333984375, -2.884521484375, -2.74761962890625, -2.6107177734375, -2.47381591796875, -2.3369140625, -2.20001220703125, -2.0631103515625, -1.92620849609375, -1.789306640625, -1.65240478515625, -1.5155029296875, -1.37860107421875, -1.24169921875, -1.10479736328125, -0.9678955078125, -0.83099365234375, -0.694091796875, -0.55718994140625, -0.4202880859375, -0.28338623046875, -0.146484375, -0.00958251953125, 0.1273193359375, 0.26422119140625, 0.401123046875, 0.53802490234375, 0.6749267578125, 0.81182861328125, 0.94873046875, 1.08563232421875, 1.2225341796875, 1.35943603515625, 1.496337890625, 1.63323974609375, 1.7701416015625, 1.90704345703125, 2.0439453125, 2.18084716796875, 2.3177490234375, 2.45465087890625, 2.591552734375, 2.72845458984375, 2.8653564453125, 3.00225830078125, 3.13916015625, 3.27606201171875, 3.4129638671875, 3.54986572265625, 3.686767578125, 3.82366943359375, 3.9605712890625, 4.09747314453125, 4.234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 5.0, 12.0, 6.0, 12.0, 17.0, 11.0, 14.0, 24.0, 29.0, 24.0, 35.0, 48.0, 52.0, 49.0, 68.0, 61.0, 54.0, 60.0, 60.0, 59.0, 44.0, 40.0, 40.0, 36.0, 22.0, 24.0, 22.0, 19.0, 10.0, 12.0, 5.0, 7.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4091796875, -1.3671722412109375, -1.325164794921875, -1.2831573486328125, -1.24114990234375, -1.1991424560546875, -1.157135009765625, -1.1151275634765625, -1.0731201171875, -1.0311126708984375, -0.989105224609375, -0.9470977783203125, -0.90509033203125, -0.8630828857421875, -0.821075439453125, -0.7790679931640625, -0.737060546875, -0.6950531005859375, -0.653045654296875, -0.6110382080078125, -0.56903076171875, -0.5270233154296875, -0.485015869140625, -0.4430084228515625, -0.4010009765625, -0.3589935302734375, -0.316986083984375, -0.2749786376953125, -0.23297119140625, -0.1909637451171875, -0.148956298828125, -0.1069488525390625, -0.06494140625, -0.0229339599609375, 0.019073486328125, 0.0610809326171875, 0.10308837890625, 0.1450958251953125, 0.187103271484375, 0.2291107177734375, 0.2711181640625, 0.3131256103515625, 0.355133056640625, 0.3971405029296875, 0.43914794921875, 0.4811553955078125, 0.523162841796875, 0.5651702880859375, 0.607177734375, 0.6491851806640625, 0.691192626953125, 0.7332000732421875, 0.77520751953125, 0.8172149658203125, 0.859222412109375, 0.9012298583984375, 0.9432373046875, 0.9852447509765625, 1.027252197265625, 1.0692596435546875, 1.11126708984375, 1.1532745361328125, 1.195281982421875, 1.2372894287109375, 1.279296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 12.0, 17.0, 29.0, 32.0, 54.0, 69.0, 149.0, 255.0, 438.0, 790.0, 1489.0, 2915.0, 5738.0, 11979.0, 27512.0, 69335.0, 217390.0, 427108.0, 179346.0, 58820.0, 23607.0, 10763.0, 5069.0, 2495.0, 1349.0, 744.0, 407.0, 248.0, 144.0, 90.0, 45.0, 25.0, 28.0, 14.0, 10.0, 7.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.25, -5.0928955078125, -4.935791015625, -4.7786865234375, -4.62158203125, -4.4644775390625, -4.307373046875, -4.1502685546875, -3.9931640625, -3.8360595703125, -3.678955078125, -3.5218505859375, -3.36474609375, -3.2076416015625, -3.050537109375, -2.8934326171875, -2.736328125, -2.5792236328125, -2.422119140625, -2.2650146484375, -2.10791015625, -1.9508056640625, -1.793701171875, -1.6365966796875, -1.4794921875, -1.3223876953125, -1.165283203125, -1.0081787109375, -0.85107421875, -0.6939697265625, -0.536865234375, -0.3797607421875, -0.22265625, -0.0655517578125, 0.091552734375, 0.2486572265625, 0.40576171875, 0.5628662109375, 0.719970703125, 0.8770751953125, 1.0341796875, 1.1912841796875, 1.348388671875, 1.5054931640625, 1.66259765625, 1.8197021484375, 1.976806640625, 2.1339111328125, 2.291015625, 2.4481201171875, 2.605224609375, 2.7623291015625, 2.91943359375, 3.0765380859375, 3.233642578125, 3.3907470703125, 3.5478515625, 3.7049560546875, 3.862060546875, 4.0191650390625, 4.17626953125, 4.3333740234375, 4.490478515625, 4.6475830078125, 4.8046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 7.0, 3.0, 4.0, 1.0, 4.0, 9.0, 11.0, 12.0, 8.0, 15.0, 16.0, 15.0, 17.0, 22.0, 30.0, 28.0, 17.0, 26.0, 26.0, 23.0, 32.0, 33.0, 40.0, 28.0, 23.0, 33.0, 36.0, 39.0, 35.0, 39.0, 35.0, 21.0, 36.0, 34.0, 31.0, 22.0, 29.0, 22.0, 28.0, 12.0, 16.0, 13.0, 9.0, 6.0, 14.0, 9.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.48828125, -5.31353759765625, -5.1387939453125, -4.96405029296875, -4.789306640625, -4.61456298828125, -4.4398193359375, -4.26507568359375, -4.09033203125, -3.91558837890625, -3.7408447265625, -3.56610107421875, -3.391357421875, -3.21661376953125, -3.0418701171875, -2.86712646484375, -2.6923828125, -2.51763916015625, -2.3428955078125, -2.16815185546875, -1.993408203125, -1.81866455078125, -1.6439208984375, -1.46917724609375, -1.29443359375, -1.11968994140625, -0.9449462890625, -0.77020263671875, -0.595458984375, -0.42071533203125, -0.2459716796875, -0.07122802734375, 0.103515625, 0.27825927734375, 0.4530029296875, 0.62774658203125, 0.802490234375, 0.97723388671875, 1.1519775390625, 1.32672119140625, 1.50146484375, 1.67620849609375, 1.8509521484375, 2.02569580078125, 2.200439453125, 2.37518310546875, 2.5499267578125, 2.72467041015625, 2.8994140625, 3.07415771484375, 3.2489013671875, 3.42364501953125, 3.598388671875, 3.77313232421875, 3.9478759765625, 4.12261962890625, 4.29736328125, 4.47210693359375, 4.6468505859375, 4.82159423828125, 4.996337890625, 5.17108154296875, 5.3458251953125, 5.52056884765625, 5.6953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 13.0, 13.0, 13.0, 13.0, 24.0, 43.0, 62.0, 83.0, 130.0, 231.0, 415.0, 888.0, 2210.0, 5578.0, 20763.0, 331854.0, 641496.0, 32503.0, 7322.0, 2590.0, 1151.0, 474.0, 245.0, 128.0, 87.0, 66.0, 41.0, 22.0, 32.0, 13.0, 12.0, 15.0, 11.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.10748291015625, -4.9532470703125, -4.79901123046875, -4.644775390625, -4.49053955078125, -4.3363037109375, -4.18206787109375, -4.02783203125, -3.87359619140625, -3.7193603515625, -3.56512451171875, -3.410888671875, -3.25665283203125, -3.1024169921875, -2.94818115234375, -2.7939453125, -2.63970947265625, -2.4854736328125, -2.33123779296875, -2.177001953125, -2.02276611328125, -1.8685302734375, -1.71429443359375, -1.56005859375, -1.40582275390625, -1.2515869140625, -1.09735107421875, -0.943115234375, -0.78887939453125, -0.6346435546875, -0.48040771484375, -0.326171875, -0.17193603515625, -0.0177001953125, 0.13653564453125, 0.290771484375, 0.44500732421875, 0.5992431640625, 0.75347900390625, 0.90771484375, 1.06195068359375, 1.2161865234375, 1.37042236328125, 1.524658203125, 1.67889404296875, 1.8331298828125, 1.98736572265625, 2.1416015625, 2.29583740234375, 2.4500732421875, 2.60430908203125, 2.758544921875, 2.91278076171875, 3.0670166015625, 3.22125244140625, 3.37548828125, 3.52972412109375, 3.6839599609375, 3.83819580078125, 3.992431640625, 4.14666748046875, 4.3009033203125, 4.45513916015625, 4.609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 8.0, 19.0, 25.0, 43.0, 62.0, 91.0, 129.0, 146.0, 141.0, 109.0, 64.0, 53.0, 34.0, 16.0, 16.0, 9.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002887248992919922, -0.00027147307991981506, -0.00025422126054763794, -0.00023696944117546082, -0.0002197176218032837, -0.00020246580243110657, -0.00018521398305892944, -0.00016796216368675232, -0.0001507103443145752, -0.00013345852494239807, -0.00011620670557022095, -9.895488619804382e-05, -8.17030668258667e-05, -6.445124745368958e-05, -4.719942808151245e-05, -2.9947608709335327e-05, -1.2695789337158203e-05, 4.556030035018921e-06, 2.1807849407196045e-05, 3.905966877937317e-05, 5.631148815155029e-05, 7.356330752372742e-05, 9.081512689590454e-05, 0.00010806694626808167, 0.0001253187656402588, 0.0001425705850124359, 0.00015982240438461304, 0.00017707422375679016, 0.00019432604312896729, 0.0002115778625011444, 0.00022882968187332153, 0.00024608150124549866, 0.0002633333206176758, 0.0002805851399898529, 0.00029783695936203003, 0.00031508877873420715, 0.0003323405981063843, 0.0003495924174785614, 0.0003668442368507385, 0.00038409605622291565, 0.0004013478755950928, 0.0004185996949672699, 0.000435851514339447, 0.00045310333371162415, 0.00047035515308380127, 0.0004876069724559784, 0.0005048587918281555, 0.0005221106112003326, 0.0005393624305725098, 0.0005566142499446869, 0.000573866069316864, 0.0005911178886890411, 0.0006083697080612183, 0.0006256215274333954, 0.0006428733468055725, 0.0006601251661777496, 0.0006773769855499268, 0.0006946288049221039, 0.000711880624294281, 0.0007291324436664581, 0.0007463842630386353, 0.0007636360824108124, 0.0007808879017829895, 0.0007981397211551666, 0.0008153915405273438]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 12.0, 13.0, 26.0, 43.0, 69.0, 96.0, 163.0, 248.0, 514.0, 1047.0, 2647.0, 8925.0, 49735.0, 571826.0, 369546.0, 32806.0, 6723.0, 2091.0, 904.0, 459.0, 241.0, 152.0, 91.0, 58.0, 31.0, 36.0, 21.0, 10.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5234375, -4.404083251953125, -4.28472900390625, -4.165374755859375, -4.0460205078125, -3.926666259765625, -3.80731201171875, -3.687957763671875, -3.568603515625, -3.449249267578125, -3.32989501953125, -3.210540771484375, -3.0911865234375, -2.971832275390625, -2.85247802734375, -2.733123779296875, -2.61376953125, -2.494415283203125, -2.37506103515625, -2.255706787109375, -2.1363525390625, -2.016998291015625, -1.89764404296875, -1.778289794921875, -1.658935546875, -1.539581298828125, -1.42022705078125, -1.300872802734375, -1.1815185546875, -1.062164306640625, -0.94281005859375, -0.823455810546875, -0.7041015625, -0.584747314453125, -0.46539306640625, -0.346038818359375, -0.2266845703125, -0.107330322265625, 0.01202392578125, 0.131378173828125, 0.250732421875, 0.370086669921875, 0.48944091796875, 0.608795166015625, 0.7281494140625, 0.847503662109375, 0.96685791015625, 1.086212158203125, 1.20556640625, 1.324920654296875, 1.44427490234375, 1.563629150390625, 1.6829833984375, 1.802337646484375, 1.92169189453125, 2.041046142578125, 2.160400390625, 2.279754638671875, 2.39910888671875, 2.518463134765625, 2.6378173828125, 2.757171630859375, 2.87652587890625, 2.995880126953125, 3.115234375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 3.0, 6.0, 9.0, 18.0, 22.0, 41.0, 59.0, 83.0, 125.0, 164.0, 138.0, 107.0, 74.0, 45.0, 40.0, 19.0, 19.0, 7.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33984375, -4.18292236328125, -4.0260009765625, -3.86907958984375, -3.712158203125, -3.55523681640625, -3.3983154296875, -3.24139404296875, -3.08447265625, -2.92755126953125, -2.7706298828125, -2.61370849609375, -2.456787109375, -2.29986572265625, -2.1429443359375, -1.98602294921875, -1.8291015625, -1.67218017578125, -1.5152587890625, -1.35833740234375, -1.201416015625, -1.04449462890625, -0.8875732421875, -0.73065185546875, -0.57373046875, -0.41680908203125, -0.2598876953125, -0.10296630859375, 0.053955078125, 0.21087646484375, 0.3677978515625, 0.52471923828125, 0.681640625, 0.83856201171875, 0.9954833984375, 1.15240478515625, 1.309326171875, 1.46624755859375, 1.6231689453125, 1.78009033203125, 1.93701171875, 2.09393310546875, 2.2508544921875, 2.40777587890625, 2.564697265625, 2.72161865234375, 2.8785400390625, 3.03546142578125, 3.1923828125, 3.34930419921875, 3.5062255859375, 3.66314697265625, 3.820068359375, 3.97698974609375, 4.1339111328125, 4.29083251953125, 4.44775390625, 4.60467529296875, 4.7615966796875, 4.91851806640625, 5.075439453125, 5.23236083984375, 5.3892822265625, 5.54620361328125, 5.703125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 14.0, 18.0, 34.0, 51.0, 124.0, 186.0, 194.0, 163.0, 116.0, 48.0, 30.0, 15.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.27366638183594, -106.86898040771484, -104.46428680419922, -102.05960083007812, -99.6549072265625, -97.2502212524414, -94.84553527832031, -92.44084167480469, -90.0361557006836, -87.6314697265625, -85.22677612304688, -82.82209014892578, -80.41740417480469, -78.01271057128906, -75.60802459716797, -73.20333862304688, -70.79864501953125, -68.39395904541016, -65.98926544189453, -63.58457946777344, -61.17988967895508, -58.77519989013672, -56.370513916015625, -53.965824127197266, -51.561134338378906, -49.15644454956055, -46.75175476074219, -44.347068786621094, -41.942378997802734, -39.537689208984375, -37.13300323486328, -34.72831344604492, -32.32361602783203, -29.918926239013672, -27.514238357543945, -25.10955047607422, -22.70486068725586, -20.3001708984375, -17.895483016967773, -15.490795135498047, -13.086105346679688, -10.681416511535645, -8.276727676391602, -5.872038841247559, -3.4673500061035156, -1.0626611709594727, 1.3420276641845703, 3.746715545654297, 6.151405334472656, 8.5560941696167, 10.960783004760742, 13.365471839904785, 15.770160675048828, 18.174850463867188, 20.579538345336914, 22.98422622680664, 25.388916015625, 27.79360580444336, 30.198293685913086, 32.60298156738281, 35.00767135620117, 37.41236114501953, 39.817047119140625, 42.221736907958984, 44.626426696777344]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 10.0, 6.0, 7.0, 6.0, 12.0, 15.0, 19.0, 18.0, 18.0, 21.0, 34.0, 32.0, 41.0, 42.0, 41.0, 43.0, 49.0, 51.0, 55.0, 35.0, 34.0, 50.0, 45.0, 42.0, 36.0, 23.0, 38.0, 27.0, 29.0, 24.0, 22.0, 21.0, 18.0, 8.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.57080078125, -34.32867431640625, -33.0865478515625, -31.84442138671875, -30.602294921875, -29.36016845703125, -28.118040084838867, -26.875913619995117, -25.633787155151367, -24.391660690307617, -23.149534225463867, -21.907407760620117, -20.665279388427734, -19.423152923583984, -18.181026458740234, -16.938899993896484, -15.696773529052734, -14.454647064208984, -13.212520599365234, -11.970393180847168, -10.728266716003418, -9.486140251159668, -8.244012832641602, -7.001886367797852, -5.759759902954102, -4.517633438110352, -3.2755064964294434, -2.0333797931671143, -0.7912530899047852, 0.45087337493896484, 1.693000316619873, 2.9351272583007812, 4.177253723144531, 5.419380187988281, 6.6615071296691895, 7.903634071350098, 9.145760536193848, 10.387887001037598, 11.630014419555664, 12.872140884399414, 14.114267349243164, 15.356393814086914, 16.598520278930664, 17.840646743774414, 19.082775115966797, 20.324901580810547, 21.567028045654297, 22.809154510498047, 24.051280975341797, 25.293407440185547, 26.535533905029297, 27.777660369873047, 29.019786834716797, 30.261913299560547, 31.50404167175293, 32.74617004394531, 33.98829650878906, 35.23042297363281, 36.47254943847656, 37.71467590332031, 38.95680236816406, 40.19892883300781, 41.44105529785156, 42.68318176269531, 43.92530822753906]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 18.0, 28.0, 24.0, 51.0, 73.0, 119.0, 210.0, 428.0, 1135.0, 4110.0, 27267.0, 4121060.0, 32772.0, 4646.0, 1286.0, 458.0, 208.0, 115.0, 76.0, 49.0, 39.0, 17.0, 27.0, 14.0, 9.0, 9.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.4725341796875, -10.077880859375, -9.6832275390625, -9.28857421875, -8.8939208984375, -8.499267578125, -8.1046142578125, -7.7099609375, -7.3153076171875, -6.920654296875, -6.5260009765625, -6.13134765625, -5.7366943359375, -5.342041015625, -4.9473876953125, -4.552734375, -4.1580810546875, -3.763427734375, -3.3687744140625, -2.97412109375, -2.5794677734375, -2.184814453125, -1.7901611328125, -1.3955078125, -1.0008544921875, -0.606201171875, -0.2115478515625, 0.18310546875, 0.5777587890625, 0.972412109375, 1.3670654296875, 1.76171875, 2.1563720703125, 2.551025390625, 2.9456787109375, 3.34033203125, 3.7349853515625, 4.129638671875, 4.5242919921875, 4.9189453125, 5.3135986328125, 5.708251953125, 6.1029052734375, 6.49755859375, 6.8922119140625, 7.286865234375, 7.6815185546875, 8.076171875, 8.4708251953125, 8.865478515625, 9.2601318359375, 9.65478515625, 10.0494384765625, 10.444091796875, 10.8387451171875, 11.2333984375, 11.6280517578125, 12.022705078125, 12.4173583984375, 12.81201171875, 13.2066650390625, 13.601318359375, 13.9959716796875, 14.390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 8.0, 7.0, 11.0, 12.0, 27.0, 23.0, 25.0, 35.0, 42.0, 48.0, 55.0, 55.0, 71.0, 81.0, 82.0, 60.0, 72.0, 52.0, 44.0, 36.0, 35.0, 31.0, 27.0, 12.0, 12.0, 13.0, 11.0, 7.0, 2.0, 0.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.65625, -1.5924072265625, -1.528564453125, -1.4647216796875, -1.40087890625, -1.3370361328125, -1.273193359375, -1.2093505859375, -1.1455078125, -1.0816650390625, -1.017822265625, -0.9539794921875, -0.89013671875, -0.8262939453125, -0.762451171875, -0.6986083984375, -0.634765625, -0.5709228515625, -0.507080078125, -0.4432373046875, -0.37939453125, -0.3155517578125, -0.251708984375, -0.1878662109375, -0.1240234375, -0.0601806640625, 0.003662109375, 0.0675048828125, 0.13134765625, 0.1951904296875, 0.259033203125, 0.3228759765625, 0.38671875, 0.4505615234375, 0.514404296875, 0.5782470703125, 0.64208984375, 0.7059326171875, 0.769775390625, 0.8336181640625, 0.8974609375, 0.9613037109375, 1.025146484375, 1.0889892578125, 1.15283203125, 1.2166748046875, 1.280517578125, 1.3443603515625, 1.408203125, 1.4720458984375, 1.535888671875, 1.5997314453125, 1.66357421875, 1.7274169921875, 1.791259765625, 1.8551025390625, 1.9189453125, 1.9827880859375, 2.046630859375, 2.1104736328125, 2.17431640625, 2.2381591796875, 2.302001953125, 2.3658447265625, 2.4296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 12.0, 8.0, 7.0, 18.0, 12.0, 21.0, 26.0, 37.0, 47.0, 71.0, 83.0, 116.0, 189.0, 339.0, 514.0, 973.0, 1932.0, 4086.0, 9923.0, 36767.0, 4029092.0, 84321.0, 14509.0, 5525.0, 2557.0, 1253.0, 661.0, 411.0, 257.0, 153.0, 78.0, 67.0, 40.0, 42.0, 29.0, 32.0, 20.0, 9.0, 10.0, 7.0, 7.0, 2.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.3203125, -9.0164794921875, -8.712646484375, -8.4088134765625, -8.10498046875, -7.8011474609375, -7.497314453125, -7.1934814453125, -6.8896484375, -6.5858154296875, -6.281982421875, -5.9781494140625, -5.67431640625, -5.3704833984375, -5.066650390625, -4.7628173828125, -4.458984375, -4.1551513671875, -3.851318359375, -3.5474853515625, -3.24365234375, -2.9398193359375, -2.635986328125, -2.3321533203125, -2.0283203125, -1.7244873046875, -1.420654296875, -1.1168212890625, -0.81298828125, -0.5091552734375, -0.205322265625, 0.0985107421875, 0.40234375, 0.7061767578125, 1.010009765625, 1.3138427734375, 1.61767578125, 1.9215087890625, 2.225341796875, 2.5291748046875, 2.8330078125, 3.1368408203125, 3.440673828125, 3.7445068359375, 4.04833984375, 4.3521728515625, 4.656005859375, 4.9598388671875, 5.263671875, 5.5675048828125, 5.871337890625, 6.1751708984375, 6.47900390625, 6.7828369140625, 7.086669921875, 7.3905029296875, 7.6943359375, 7.9981689453125, 8.302001953125, 8.6058349609375, 8.90966796875, 9.2135009765625, 9.517333984375, 9.8211669921875, 10.125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 11.0, 18.0, 55.0, 244.0, 3573.0, 79.0, 28.0, 11.0, 5.0, 9.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -3.0235595703125, -2.937744140625, -2.8519287109375, -2.76611328125, -2.6802978515625, -2.594482421875, -2.5086669921875, -2.4228515625, -2.3370361328125, -2.251220703125, -2.1654052734375, -2.07958984375, -1.9937744140625, -1.907958984375, -1.8221435546875, -1.736328125, -1.6505126953125, -1.564697265625, -1.4788818359375, -1.39306640625, -1.3072509765625, -1.221435546875, -1.1356201171875, -1.0498046875, -0.9639892578125, -0.878173828125, -0.7923583984375, -0.70654296875, -0.6207275390625, -0.534912109375, -0.4490966796875, -0.36328125, -0.2774658203125, -0.191650390625, -0.1058349609375, -0.02001953125, 0.0657958984375, 0.151611328125, 0.2374267578125, 0.3232421875, 0.4090576171875, 0.494873046875, 0.5806884765625, 0.66650390625, 0.7523193359375, 0.838134765625, 0.9239501953125, 1.009765625, 1.0955810546875, 1.181396484375, 1.2672119140625, 1.35302734375, 1.4388427734375, 1.524658203125, 1.6104736328125, 1.6962890625, 1.7821044921875, 1.867919921875, 1.9537353515625, 2.03955078125, 2.1253662109375, 2.211181640625, 2.2969970703125, 2.3828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 16.0, 13.0, 25.0, 58.0, 93.0, 142.0, 178.0, 184.0, 105.0, 73.0, 48.0, 29.0, 17.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.679746627807617, -6.394729137420654, -6.109711647033691, -5.824694633483887, -5.539677143096924, -5.254659652709961, -4.969642639160156, -4.684625148773193, -4.3996076583862305, -4.114590167999268, -3.829572916030884, -3.5445556640625, -3.259538173675537, -2.974520683288574, -2.6895034313201904, -2.4044861793518066, -2.1194686889648438, -1.8344513177871704, -1.549433946609497, -1.2644165754318237, -0.9793992042541504, -0.694381833076477, -0.4093644618988037, -0.12434709072113037, 0.16067028045654297, 0.4456876516342163, 0.7307050228118896, 1.015722393989563, 1.3007397651672363, 1.5857571363449097, 1.870774507522583, 2.155791759490967, 2.4408092498779297, 2.7258267402648926, 3.0108439922332764, 3.29586124420166, 3.580878734588623, 3.865896224975586, 4.150913238525391, 4.4359307289123535, 4.720948219299316, 5.005965709686279, 5.290983200073242, 5.576000213623047, 5.86101770401001, 6.146035194396973, 6.431052207946777, 6.71606969833374, 7.001087188720703, 7.286104679107666, 7.571122169494629, 7.856139183044434, 8.141157150268555, 8.42617416381836, 8.711191177368164, 8.996209144592285, 9.28122615814209, 9.566243171691895, 9.851261138916016, 10.13627815246582, 10.421295166015625, 10.706313133239746, 10.99133014678955, 11.276348114013672, 11.561365127563477]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 14.0, 11.0, 18.0, 16.0, 14.0, 17.0, 22.0, 22.0, 35.0, 40.0, 39.0, 41.0, 42.0, 41.0, 48.0, 49.0, 44.0, 36.0, 55.0, 39.0, 34.0, 36.0, 39.0, 44.0, 28.0, 25.0, 33.0, 20.0, 12.0, 13.0, 14.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9291679859161377, -3.815011978149414, -3.7008562088012695, -3.586700201034546, -3.4725444316864014, -3.3583884239196777, -3.244232654571533, -3.1300766468048096, -3.015920639038086, -2.9017646312713623, -2.7876088619232178, -2.673452854156494, -2.5592970848083496, -2.445141077041626, -2.3309850692749023, -2.216829299926758, -2.1026735305786133, -1.9885176420211792, -1.8743617534637451, -1.7602057456970215, -1.6460498571395874, -1.5318939685821533, -1.4177380800247192, -1.3035821914672852, -1.1894261837005615, -1.0752702951431274, -0.9611143469810486, -0.8469584584236145, -0.7328025102615356, -0.6186466217041016, -0.5044907331466675, -0.3903347849845886, -0.27617883682250977, -0.1620229184627533, -0.04786701500415802, 0.06628888845443726, 0.18044480681419373, 0.2946007251739502, 0.4087566137313843, 0.5229125618934631, 0.6370684504508972, 0.7512243390083313, 0.8653802871704102, 0.9795361757278442, 1.0936920642852783, 1.207848072052002, 1.3220038414001465, 1.4361598491668701, 1.5503157377243042, 1.6644716262817383, 1.7786275148391724, 1.8927834033966064, 2.00693941116333, 2.1210951805114746, 2.2352511882781982, 2.349407196044922, 2.4635629653930664, 2.57771897315979, 2.6918747425079346, 2.806030750274658, 2.9201865196228027, 3.0343425273895264, 3.14849853515625, 3.2626543045043945, 3.376810312271118]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 10.0, 12.0, 14.0, 15.0, 17.0, 34.0, 34.0, 62.0, 96.0, 128.0, 233.0, 378.0, 650.0, 1186.0, 2300.0, 4967.0, 11641.0, 32929.0, 109572.0, 378928.0, 353937.0, 100261.0, 30325.0, 11107.0, 4716.0, 2224.0, 1102.0, 635.0, 393.0, 248.0, 142.0, 84.0, 47.0, 48.0, 23.0, 14.0, 15.0, 12.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.62274169921875, -6.4017333984375, -6.18072509765625, -5.959716796875, -5.73870849609375, -5.5177001953125, -5.29669189453125, -5.07568359375, -4.85467529296875, -4.6336669921875, -4.41265869140625, -4.191650390625, -3.97064208984375, -3.7496337890625, -3.52862548828125, -3.3076171875, -3.08660888671875, -2.8656005859375, -2.64459228515625, -2.423583984375, -2.20257568359375, -1.9815673828125, -1.76055908203125, -1.53955078125, -1.31854248046875, -1.0975341796875, -0.87652587890625, -0.655517578125, -0.43450927734375, -0.2135009765625, 0.00750732421875, 0.228515625, 0.44952392578125, 0.6705322265625, 0.89154052734375, 1.112548828125, 1.33355712890625, 1.5545654296875, 1.77557373046875, 1.99658203125, 2.21759033203125, 2.4385986328125, 2.65960693359375, 2.880615234375, 3.10162353515625, 3.3226318359375, 3.54364013671875, 3.7646484375, 3.98565673828125, 4.2066650390625, 4.42767333984375, 4.648681640625, 4.86968994140625, 5.0906982421875, 5.31170654296875, 5.53271484375, 5.75372314453125, 5.9747314453125, 6.19573974609375, 6.416748046875, 6.63775634765625, 6.8587646484375, 7.07977294921875, 7.30078125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 11.0, 20.0, 16.0, 25.0, 28.0, 29.0, 35.0, 42.0, 55.0, 39.0, 69.0, 64.0, 62.0, 57.0, 62.0, 63.0, 52.0, 52.0, 33.0, 32.0, 28.0, 16.0, 26.0, 21.0, 15.0, 10.0, 3.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6806640625, -1.6200408935546875, -1.559417724609375, -1.4987945556640625, -1.43817138671875, -1.3775482177734375, -1.316925048828125, -1.2563018798828125, -1.1956787109375, -1.1350555419921875, -1.074432373046875, -1.0138092041015625, -0.95318603515625, -0.8925628662109375, -0.831939697265625, -0.7713165283203125, -0.710693359375, -0.6500701904296875, -0.589447021484375, -0.5288238525390625, -0.46820068359375, -0.4075775146484375, -0.346954345703125, -0.2863311767578125, -0.2257080078125, -0.1650848388671875, -0.104461669921875, -0.0438385009765625, 0.01678466796875, 0.0774078369140625, 0.138031005859375, 0.1986541748046875, 0.25927734375, 0.3199005126953125, 0.380523681640625, 0.4411468505859375, 0.50177001953125, 0.5623931884765625, 0.623016357421875, 0.6836395263671875, 0.7442626953125, 0.8048858642578125, 0.865509033203125, 0.9261322021484375, 0.98675537109375, 1.0473785400390625, 1.108001708984375, 1.1686248779296875, 1.229248046875, 1.2898712158203125, 1.350494384765625, 1.4111175537109375, 1.47174072265625, 1.5323638916015625, 1.592987060546875, 1.6536102294921875, 1.7142333984375, 1.7748565673828125, 1.835479736328125, 1.8961029052734375, 1.95672607421875, 2.0173492431640625, 2.077972412109375, 2.1385955810546875, 2.19921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 7.0, 10.0, 15.0, 20.0, 36.0, 32.0, 74.0, 122.0, 201.0, 335.0, 621.0, 1256.0, 2636.0, 6998.0, 23272.0, 113216.0, 567484.0, 265546.0, 46725.0, 12095.0, 4176.0, 1751.0, 819.0, 421.0, 241.0, 143.0, 89.0, 61.0, 46.0, 29.0, 19.0, 14.0, 6.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.66015625, -7.38397216796875, -7.1077880859375, -6.83160400390625, -6.555419921875, -6.27923583984375, -6.0030517578125, -5.72686767578125, -5.45068359375, -5.17449951171875, -4.8983154296875, -4.62213134765625, -4.345947265625, -4.06976318359375, -3.7935791015625, -3.51739501953125, -3.2412109375, -2.96502685546875, -2.6888427734375, -2.41265869140625, -2.136474609375, -1.86029052734375, -1.5841064453125, -1.30792236328125, -1.03173828125, -0.75555419921875, -0.4793701171875, -0.20318603515625, 0.072998046875, 0.34918212890625, 0.6253662109375, 0.90155029296875, 1.177734375, 1.45391845703125, 1.7301025390625, 2.00628662109375, 2.282470703125, 2.55865478515625, 2.8348388671875, 3.11102294921875, 3.38720703125, 3.66339111328125, 3.9395751953125, 4.21575927734375, 4.491943359375, 4.76812744140625, 5.0443115234375, 5.32049560546875, 5.5966796875, 5.87286376953125, 6.1490478515625, 6.42523193359375, 6.701416015625, 6.97760009765625, 7.2537841796875, 7.52996826171875, 7.80615234375, 8.08233642578125, 8.3585205078125, 8.63470458984375, 8.910888671875, 9.18707275390625, 9.4632568359375, 9.73944091796875, 10.015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 14.0, 8.0, 16.0, 17.0, 19.0, 15.0, 17.0, 26.0, 25.0, 47.0, 35.0, 42.0, 53.0, 42.0, 62.0, 43.0, 69.0, 38.0, 44.0, 44.0, 33.0, 37.0, 32.0, 35.0, 28.0, 33.0, 22.0, 19.0, 13.0, 10.0, 6.0, 8.0, 8.0, 8.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.7734375, -10.467041015625, -10.16064453125, -9.854248046875, -9.5478515625, -9.241455078125, -8.93505859375, -8.628662109375, -8.322265625, -8.015869140625, -7.70947265625, -7.403076171875, -7.0966796875, -6.790283203125, -6.48388671875, -6.177490234375, -5.87109375, -5.564697265625, -5.25830078125, -4.951904296875, -4.6455078125, -4.339111328125, -4.03271484375, -3.726318359375, -3.419921875, -3.113525390625, -2.80712890625, -2.500732421875, -2.1943359375, -1.887939453125, -1.58154296875, -1.275146484375, -0.96875, -0.662353515625, -0.35595703125, -0.049560546875, 0.2568359375, 0.563232421875, 0.86962890625, 1.176025390625, 1.482421875, 1.788818359375, 2.09521484375, 2.401611328125, 2.7080078125, 3.014404296875, 3.32080078125, 3.627197265625, 3.93359375, 4.239990234375, 4.54638671875, 4.852783203125, 5.1591796875, 5.465576171875, 5.77197265625, 6.078369140625, 6.384765625, 6.691162109375, 6.99755859375, 7.303955078125, 7.6103515625, 7.916748046875, 8.22314453125, 8.529541015625, 8.8359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 13.0, 16.0, 17.0, 18.0, 26.0, 46.0, 68.0, 91.0, 141.0, 263.0, 411.0, 897.0, 2363.0, 8208.0, 68047.0, 908824.0, 48209.0, 7041.0, 1992.0, 803.0, 382.0, 232.0, 148.0, 76.0, 64.0, 31.0, 23.0, 27.0, 18.0, 12.0, 8.0, 6.0, 8.0, 5.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1796875, -8.85693359375, -8.5341796875, -8.21142578125, -7.888671875, -7.56591796875, -7.2431640625, -6.92041015625, -6.59765625, -6.27490234375, -5.9521484375, -5.62939453125, -5.306640625, -4.98388671875, -4.6611328125, -4.33837890625, -4.015625, -3.69287109375, -3.3701171875, -3.04736328125, -2.724609375, -2.40185546875, -2.0791015625, -1.75634765625, -1.43359375, -1.11083984375, -0.7880859375, -0.46533203125, -0.142578125, 0.18017578125, 0.5029296875, 0.82568359375, 1.1484375, 1.47119140625, 1.7939453125, 2.11669921875, 2.439453125, 2.76220703125, 3.0849609375, 3.40771484375, 3.73046875, 4.05322265625, 4.3759765625, 4.69873046875, 5.021484375, 5.34423828125, 5.6669921875, 5.98974609375, 6.3125, 6.63525390625, 6.9580078125, 7.28076171875, 7.603515625, 7.92626953125, 8.2490234375, 8.57177734375, 8.89453125, 9.21728515625, 9.5400390625, 9.86279296875, 10.185546875, 10.50830078125, 10.8310546875, 11.15380859375, 11.4765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 9.0, 19.0, 16.0, 19.0, 37.0, 54.0, 116.0, 166.0, 143.0, 153.0, 98.0, 49.0, 36.0, 30.0, 12.0, 9.0, 11.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008754730224609375, -0.0008492767810821533, -0.0008230805397033691, -0.000796884298324585, -0.0007706880569458008, -0.0007444918155670166, -0.0007182955741882324, -0.0006920993328094482, -0.0006659030914306641, -0.0006397068500518799, -0.0006135106086730957, -0.0005873143672943115, -0.0005611181259155273, -0.0005349218845367432, -0.000508725643157959, -0.0004825294017791748, -0.0004563331604003906, -0.00043013691902160645, -0.00040394067764282227, -0.0003777444362640381, -0.0003515481948852539, -0.0003253519535064697, -0.00029915571212768555, -0.00027295947074890137, -0.0002467632293701172, -0.000220566987991333, -0.00019437074661254883, -0.00016817450523376465, -0.00014197826385498047, -0.00011578202247619629, -8.958578109741211e-05, -6.338953971862793e-05, -3.719329833984375e-05, -1.099705696105957e-05, 1.519918441772461e-05, 4.139542579650879e-05, 6.759166717529297e-05, 9.378790855407715e-05, 0.00011998414993286133, 0.0001461803913116455, 0.0001723766326904297, 0.00019857287406921387, 0.00022476911544799805, 0.0002509653568267822, 0.0002771615982055664, 0.0003033578395843506, 0.00032955408096313477, 0.00035575032234191895, 0.0003819465637207031, 0.0004081428050994873, 0.0004343390464782715, 0.00046053528785705566, 0.00048673152923583984, 0.000512927770614624, 0.0005391240119934082, 0.0005653202533721924, 0.0005915164947509766, 0.0006177127361297607, 0.0006439089775085449, 0.0006701052188873291, 0.0006963014602661133, 0.0007224977016448975, 0.0007486939430236816, 0.0007748901844024658, 0.00080108642578125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 16.0, 13.0, 27.0, 43.0, 74.0, 166.0, 380.0, 1150.0, 4852.0, 37598.0, 906897.0, 87126.0, 7718.0, 1580.0, 499.0, 171.0, 88.0, 47.0, 29.0, 14.0, 20.0, 11.0, 12.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.4375, -11.133544921875, -10.82958984375, -10.525634765625, -10.2216796875, -9.917724609375, -9.61376953125, -9.309814453125, -9.005859375, -8.701904296875, -8.39794921875, -8.093994140625, -7.7900390625, -7.486083984375, -7.18212890625, -6.878173828125, -6.57421875, -6.270263671875, -5.96630859375, -5.662353515625, -5.3583984375, -5.054443359375, -4.75048828125, -4.446533203125, -4.142578125, -3.838623046875, -3.53466796875, -3.230712890625, -2.9267578125, -2.622802734375, -2.31884765625, -2.014892578125, -1.7109375, -1.406982421875, -1.10302734375, -0.799072265625, -0.4951171875, -0.191162109375, 0.11279296875, 0.416748046875, 0.720703125, 1.024658203125, 1.32861328125, 1.632568359375, 1.9365234375, 2.240478515625, 2.54443359375, 2.848388671875, 3.15234375, 3.456298828125, 3.76025390625, 4.064208984375, 4.3681640625, 4.672119140625, 4.97607421875, 5.280029296875, 5.583984375, 5.887939453125, 6.19189453125, 6.495849609375, 6.7998046875, 7.103759765625, 7.40771484375, 7.711669921875, 8.015625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 7.0, 2.0, 9.0, 10.0, 10.0, 9.0, 16.0, 38.0, 57.0, 83.0, 128.0, 187.0, 167.0, 92.0, 61.0, 38.0, 22.0, 19.0, 12.0, 8.0, 5.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.734375, -7.4820556640625, -7.229736328125, -6.9774169921875, -6.72509765625, -6.4727783203125, -6.220458984375, -5.9681396484375, -5.7158203125, -5.4635009765625, -5.211181640625, -4.9588623046875, -4.70654296875, -4.4542236328125, -4.201904296875, -3.9495849609375, -3.697265625, -3.4449462890625, -3.192626953125, -2.9403076171875, -2.68798828125, -2.4356689453125, -2.183349609375, -1.9310302734375, -1.6787109375, -1.4263916015625, -1.174072265625, -0.9217529296875, -0.66943359375, -0.4171142578125, -0.164794921875, 0.0875244140625, 0.33984375, 0.5921630859375, 0.844482421875, 1.0968017578125, 1.34912109375, 1.6014404296875, 1.853759765625, 2.1060791015625, 2.3583984375, 2.6107177734375, 2.863037109375, 3.1153564453125, 3.36767578125, 3.6199951171875, 3.872314453125, 4.1246337890625, 4.376953125, 4.6292724609375, 4.881591796875, 5.1339111328125, 5.38623046875, 5.6385498046875, 5.890869140625, 6.1431884765625, 6.3955078125, 6.6478271484375, 6.900146484375, 7.1524658203125, 7.40478515625, 7.6571044921875, 7.909423828125, 8.1617431640625, 8.4140625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 7.0, 13.0, 22.0, 53.0, 77.0, 128.0, 191.0, 190.0, 149.0, 74.0, 54.0, 27.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-175.62242126464844, -171.98858642578125, -168.35476684570312, -164.720947265625, -161.0871124267578, -157.45327758789062, -153.8194580078125, -150.18563842773438, -146.5518035888672, -142.91796875, -139.28414916992188, -135.65032958984375, -132.01649475097656, -128.38265991210938, -124.74884033203125, -121.1150131225586, -117.48118591308594, -113.84735870361328, -110.21353149414062, -106.57970428466797, -102.94587707519531, -99.31204986572266, -95.67822265625, -92.04439544677734, -88.41056823730469, -84.77674102783203, -81.14291381835938, -77.50908660888672, -73.87525939941406, -70.2414321899414, -66.60760498046875, -62.973777770996094, -59.33995819091797, -55.70613098144531, -52.072303771972656, -48.4384765625, -44.804649353027344, -41.17082214355469, -37.53699493408203, -33.903167724609375, -30.26934051513672, -26.635513305664062, -23.001686096191406, -19.36785888671875, -15.734031677246094, -12.100204467773438, -8.466377258300781, -4.832550048828125, -1.1987228393554688, 2.4351043701171875, 6.068931579589844, 9.7027587890625, 13.336585998535156, 16.970413208007812, 20.60424041748047, 24.238067626953125, 27.87189483642578, 31.505722045898438, 35.139549255371094, 38.77337646484375, 42.407203674316406, 46.04103088378906, 49.67485809326172, 53.308685302734375, 56.94251251220703]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 9.0, 17.0, 17.0, 9.0, 17.0, 20.0, 31.0, 29.0, 44.0, 50.0, 31.0, 39.0, 41.0, 37.0, 48.0, 54.0, 55.0, 49.0, 50.0, 50.0, 36.0, 47.0, 29.0, 26.0, 21.0, 19.0, 18.0, 15.0, 21.0, 14.0, 12.0, 8.0, 4.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-55.95832061767578, -54.347618103027344, -52.73691177368164, -51.1262092590332, -49.515506744384766, -47.90480041503906, -46.294097900390625, -44.68339538574219, -43.07269287109375, -41.46199035644531, -39.85128402709961, -38.24058151245117, -36.629878997802734, -35.01917266845703, -33.408470153808594, -31.797767639160156, -30.187061309814453, -28.576356887817383, -26.965654373168945, -25.354949951171875, -23.744247436523438, -22.133543014526367, -20.522838592529297, -18.91213607788086, -17.30143165588379, -15.690728187561035, -14.080024719238281, -12.469320297241211, -10.858616828918457, -9.247913360595703, -7.637208938598633, -6.026505470275879, -4.415802001953125, -2.805098295211792, -1.194394588470459, 0.4163093566894531, 2.027012825012207, 3.637716293334961, 5.248420715332031, 6.859124183654785, 8.469827651977539, 10.080531120300293, 11.691234588623047, 13.301939010620117, 14.912642478942871, 16.523345947265625, 18.134050369262695, 19.744754791259766, 21.355457305908203, 22.966161727905273, 24.57686424255371, 26.18756866455078, 27.79827117919922, 29.40897560119629, 31.01968002319336, 32.6303825378418, 34.2410888671875, 35.85179138183594, 37.46249771118164, 39.07320022583008, 40.683902740478516, 42.29460906982422, 43.905311584472656, 45.516014099121094, 47.12671661376953]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 12.0, 24.0, 37.0, 50.0, 65.0, 129.0, 273.0, 649.0, 1698.0, 7217.0, 106455.0, 4058249.0, 14860.0, 2726.0, 936.0, 386.0, 199.0, 114.0, 56.0, 43.0, 19.0, 24.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -22.042724609375, -21.39794921875, -20.753173828125, -20.1083984375, -19.463623046875, -18.81884765625, -18.174072265625, -17.529296875, -16.884521484375, -16.23974609375, -15.594970703125, -14.9501953125, -14.305419921875, -13.66064453125, -13.015869140625, -12.37109375, -11.726318359375, -11.08154296875, -10.436767578125, -9.7919921875, -9.147216796875, -8.50244140625, -7.857666015625, -7.212890625, -6.568115234375, -5.92333984375, -5.278564453125, -4.6337890625, -3.989013671875, -3.34423828125, -2.699462890625, -2.0546875, -1.409912109375, -0.76513671875, -0.120361328125, 0.5244140625, 1.169189453125, 1.81396484375, 2.458740234375, 3.103515625, 3.748291015625, 4.39306640625, 5.037841796875, 5.6826171875, 6.327392578125, 6.97216796875, 7.616943359375, 8.26171875, 8.906494140625, 9.55126953125, 10.196044921875, 10.8408203125, 11.485595703125, 12.13037109375, 12.775146484375, 13.419921875, 14.064697265625, 14.70947265625, 15.354248046875, 15.9990234375, 16.643798828125, 17.28857421875, 17.933349609375, 18.578125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 5.0, 8.0, 26.0, 19.0, 39.0, 38.0, 57.0, 44.0, 55.0, 63.0, 77.0, 68.0, 69.0, 84.0, 73.0, 46.0, 44.0, 30.0, 37.0, 25.0, 21.0, 12.0, 13.0, 15.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.22491455078125, -2.1470947265625, -2.06927490234375, -1.991455078125, -1.91363525390625, -1.8358154296875, -1.75799560546875, -1.68017578125, -1.60235595703125, -1.5245361328125, -1.44671630859375, -1.368896484375, -1.29107666015625, -1.2132568359375, -1.13543701171875, -1.0576171875, -0.97979736328125, -0.9019775390625, -0.82415771484375, -0.746337890625, -0.66851806640625, -0.5906982421875, -0.51287841796875, -0.43505859375, -0.35723876953125, -0.2794189453125, -0.20159912109375, -0.123779296875, -0.04595947265625, 0.0318603515625, 0.10968017578125, 0.1875, 0.26531982421875, 0.3431396484375, 0.42095947265625, 0.498779296875, 0.57659912109375, 0.6544189453125, 0.73223876953125, 0.81005859375, 0.88787841796875, 0.9656982421875, 1.04351806640625, 1.121337890625, 1.19915771484375, 1.2769775390625, 1.35479736328125, 1.4326171875, 1.51043701171875, 1.5882568359375, 1.66607666015625, 1.743896484375, 1.82171630859375, 1.8995361328125, 1.97735595703125, 2.05517578125, 2.13299560546875, 2.2108154296875, 2.28863525390625, 2.366455078125, 2.44427490234375, 2.5220947265625, 2.59991455078125, 2.677734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 3.0, 7.0, 8.0, 13.0, 13.0, 24.0, 28.0, 34.0, 67.0, 98.0, 139.0, 211.0, 326.0, 479.0, 760.0, 1184.0, 1891.0, 3239.0, 5968.0, 13242.0, 44685.0, 3766883.0, 300570.0, 30892.0, 10735.0, 5134.0, 2713.0, 1709.0, 1077.0, 721.0, 502.0, 309.0, 201.0, 138.0, 82.0, 56.0, 43.0, 26.0, 19.0, 20.0, 11.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.4375, -15.9375, -15.4375, -14.9375, -14.4375, -13.9375, -13.4375, -12.9375, -12.4375, -11.9375, -11.4375, -10.9375, -10.4375, -9.9375, -9.4375, -8.9375, -8.4375, -7.9375, -7.4375, -6.9375, -6.4375, -5.9375, -5.4375, -4.9375, -4.4375, -3.9375, -3.4375, -2.9375, -2.4375, -1.9375, -1.4375, -0.9375, -0.4375, 0.0625, 0.5625, 1.0625, 1.5625, 2.0625, 2.5625, 3.0625, 3.5625, 4.0625, 4.5625, 5.0625, 5.5625, 6.0625, 6.5625, 7.0625, 7.5625, 8.0625, 8.5625, 9.0625, 9.5625, 10.0625, 10.5625, 11.0625, 11.5625, 12.0625, 12.5625, 13.0625, 13.5625, 14.0625, 14.5625, 15.0625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 15.0, 7.0, 22.0, 25.0, 51.0, 102.0, 1674.0, 1973.0, 85.0, 39.0, 19.0, 21.0, 7.0, 5.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.9306640625, -4.748046875, -4.5654296875, -4.3828125, -4.2001953125, -4.017578125, -3.8349609375, -3.65234375, -3.4697265625, -3.287109375, -3.1044921875, -2.921875, -2.7392578125, -2.556640625, -2.3740234375, -2.19140625, -2.0087890625, -1.826171875, -1.6435546875, -1.4609375, -1.2783203125, -1.095703125, -0.9130859375, -0.73046875, -0.5478515625, -0.365234375, -0.1826171875, 0.0, 0.1826171875, 0.365234375, 0.5478515625, 0.73046875, 0.9130859375, 1.095703125, 1.2783203125, 1.4609375, 1.6435546875, 1.826171875, 2.0087890625, 2.19140625, 2.3740234375, 2.556640625, 2.7392578125, 2.921875, 3.1044921875, 3.287109375, 3.4697265625, 3.65234375, 3.8349609375, 4.017578125, 4.2001953125, 4.3828125, 4.5654296875, 4.748046875, 4.9306640625, 5.11328125, 5.2958984375, 5.478515625, 5.6611328125, 5.84375, 6.0263671875, 6.208984375, 6.3916015625, 6.57421875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 6.0, 25.0, 53.0, 107.0, 206.0, 306.0, 173.0, 77.0, 20.0, 16.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.01553344726562, -72.3567123413086, -70.69789123535156, -69.0390625, -67.38024139404297, -65.72142028808594, -64.0625991821289, -62.403778076171875, -60.74495315551758, -59.08613204956055, -57.42730712890625, -55.76848602294922, -54.10966491699219, -52.45083999633789, -50.79201889038086, -49.13319396972656, -47.47437286376953, -45.8155517578125, -44.1567268371582, -42.49790573120117, -40.83908462524414, -39.180259704589844, -37.52143859863281, -35.86261749267578, -34.20379638671875, -32.54497528076172, -30.886152267456055, -29.22732925415039, -27.568506240844727, -25.909683227539062, -24.25086212158203, -22.592039108276367, -20.933216094970703, -19.27439308166504, -17.615571975708008, -15.956748962402344, -14.29792594909668, -12.639103889465332, -10.980281829833984, -9.32145881652832, -7.662636756896973, -6.003814220428467, -4.344991683959961, -2.6861696243286133, -1.0273470878601074, 0.6314754486083984, 2.290297508239746, 3.94912052154541, 5.607942581176758, 7.266765117645264, 8.92558765411377, 10.584409713745117, 12.243232727050781, 13.902054786682129, 15.560876846313477, 17.21969985961914, 18.878520965576172, 20.537343978881836, 22.196165084838867, 23.85498809814453, 25.513811111450195, 27.17263412475586, 28.83145523071289, 30.490278244018555, 32.14910125732422]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 7.0, 9.0, 14.0, 18.0, 21.0, 31.0, 32.0, 41.0, 52.0, 42.0, 64.0, 53.0, 36.0, 54.0, 50.0, 59.0, 52.0, 44.0, 52.0, 26.0, 40.0, 39.0, 37.0, 26.0, 25.0, 11.0, 19.0, 9.0, 7.0, 6.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.444921493530273, -16.809663772583008, -16.174406051635742, -15.539148330688477, -14.903889656066895, -14.268631935119629, -13.633374214172363, -12.998115539550781, -12.362857818603516, -11.72760009765625, -11.092342376708984, -10.457084655761719, -9.821825981140137, -9.186568260192871, -8.551310539245605, -7.916052341461182, -7.280795097351074, -6.645537376403809, -6.010279178619385, -5.375021457672119, -4.739763259887695, -4.10450553894043, -3.469247817993164, -2.8339896202087402, -2.1987318992614746, -1.5634739398956299, -0.9282160997390747, -0.29295825958251953, 0.3422996997833252, 0.9775576591491699, 1.6128153800964355, 2.2480735778808594, 2.883331298828125, 3.5185892581939697, 4.1538472175598145, 4.78910493850708, 5.424363136291504, 6.0596208572387695, 6.694878578186035, 7.330136775970459, 7.965394496917725, 8.600652694702148, 9.235910415649414, 9.87116813659668, 10.506425857543945, 11.141683578491211, 11.776941299438477, 12.412199974060059, 13.047457695007324, 13.68271541595459, 14.317973136901855, 14.953231811523438, 15.588489532470703, 16.22374725341797, 16.859004974365234, 17.4942626953125, 18.129520416259766, 18.76477813720703, 19.400035858154297, 20.035293579101562, 20.670551300048828, 21.305809020996094, 21.94106674194336, 22.576326370239258, 23.211584091186523]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 14.0, 10.0, 29.0, 26.0, 35.0, 56.0, 69.0, 95.0, 170.0, 249.0, 409.0, 565.0, 869.0, 1502.0, 2400.0, 4006.0, 7086.0, 12947.0, 24169.0, 49184.0, 107130.0, 232988.0, 298263.0, 159839.0, 71606.0, 34430.0, 17405.0, 9425.0, 5404.0, 3075.0, 1842.0, 1136.0, 707.0, 472.0, 290.0, 200.0, 135.0, 104.0, 69.0, 35.0, 29.0, 21.0, 15.0, 15.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.02734375, -4.866455078125, -4.70556640625, -4.544677734375, -4.3837890625, -4.222900390625, -4.06201171875, -3.901123046875, -3.740234375, -3.579345703125, -3.41845703125, -3.257568359375, -3.0966796875, -2.935791015625, -2.77490234375, -2.614013671875, -2.453125, -2.292236328125, -2.13134765625, -1.970458984375, -1.8095703125, -1.648681640625, -1.48779296875, -1.326904296875, -1.166015625, -1.005126953125, -0.84423828125, -0.683349609375, -0.5224609375, -0.361572265625, -0.20068359375, -0.039794921875, 0.12109375, 0.281982421875, 0.44287109375, 0.603759765625, 0.7646484375, 0.925537109375, 1.08642578125, 1.247314453125, 1.408203125, 1.569091796875, 1.72998046875, 1.890869140625, 2.0517578125, 2.212646484375, 2.37353515625, 2.534423828125, 2.6953125, 2.856201171875, 3.01708984375, 3.177978515625, 3.3388671875, 3.499755859375, 3.66064453125, 3.821533203125, 3.982421875, 4.143310546875, 4.30419921875, 4.465087890625, 4.6259765625, 4.786865234375, 4.94775390625, 5.108642578125, 5.26953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 7.0, 6.0, 9.0, 12.0, 10.0, 14.0, 19.0, 16.0, 26.0, 24.0, 22.0, 23.0, 32.0, 31.0, 39.0, 38.0, 44.0, 44.0, 51.0, 41.0, 54.0, 45.0, 36.0, 45.0, 34.0, 35.0, 33.0, 30.0, 29.0, 25.0, 22.0, 14.0, 16.0, 15.0, 12.0, 10.0, 7.0, 5.0, 0.0, 6.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.291015625, -2.21319580078125, -2.1353759765625, -2.05755615234375, -1.979736328125, -1.90191650390625, -1.8240966796875, -1.74627685546875, -1.66845703125, -1.59063720703125, -1.5128173828125, -1.43499755859375, -1.357177734375, -1.27935791015625, -1.2015380859375, -1.12371826171875, -1.0458984375, -0.96807861328125, -0.8902587890625, -0.81243896484375, -0.734619140625, -0.65679931640625, -0.5789794921875, -0.50115966796875, -0.42333984375, -0.34552001953125, -0.2677001953125, -0.18988037109375, -0.112060546875, -0.03424072265625, 0.0435791015625, 0.12139892578125, 0.19921875, 0.27703857421875, 0.3548583984375, 0.43267822265625, 0.510498046875, 0.58831787109375, 0.6661376953125, 0.74395751953125, 0.82177734375, 0.89959716796875, 0.9774169921875, 1.05523681640625, 1.133056640625, 1.21087646484375, 1.2886962890625, 1.36651611328125, 1.4443359375, 1.52215576171875, 1.5999755859375, 1.67779541015625, 1.755615234375, 1.83343505859375, 1.9112548828125, 1.98907470703125, 2.06689453125, 2.14471435546875, 2.2225341796875, 2.30035400390625, 2.378173828125, 2.45599365234375, 2.5338134765625, 2.61163330078125, 2.689453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 7.0, 10.0, 19.0, 21.0, 40.0, 53.0, 106.0, 204.0, 388.0, 879.0, 2148.0, 7459.0, 46552.0, 699920.0, 262439.0, 20997.0, 4538.0, 1462.0, 636.0, 279.0, 177.0, 84.0, 44.0, 34.0, 19.0, 16.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.36376953125, -16.6025390625, -15.84130859375, -15.080078125, -14.31884765625, -13.5576171875, -12.79638671875, -12.03515625, -11.27392578125, -10.5126953125, -9.75146484375, -8.990234375, -8.22900390625, -7.4677734375, -6.70654296875, -5.9453125, -5.18408203125, -4.4228515625, -3.66162109375, -2.900390625, -2.13916015625, -1.3779296875, -0.61669921875, 0.14453125, 0.90576171875, 1.6669921875, 2.42822265625, 3.189453125, 3.95068359375, 4.7119140625, 5.47314453125, 6.234375, 6.99560546875, 7.7568359375, 8.51806640625, 9.279296875, 10.04052734375, 10.8017578125, 11.56298828125, 12.32421875, 13.08544921875, 13.8466796875, 14.60791015625, 15.369140625, 16.13037109375, 16.8916015625, 17.65283203125, 18.4140625, 19.17529296875, 19.9365234375, 20.69775390625, 21.458984375, 22.22021484375, 22.9814453125, 23.74267578125, 24.50390625, 25.26513671875, 26.0263671875, 26.78759765625, 27.548828125, 28.31005859375, 29.0712890625, 29.83251953125, 30.59375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 2.0, 4.0, 8.0, 5.0, 12.0, 14.0, 20.0, 28.0, 35.0, 32.0, 38.0, 66.0, 65.0, 74.0, 72.0, 69.0, 78.0, 59.0, 53.0, 51.0, 44.0, 33.0, 27.0, 23.0, 22.0, 19.0, 12.0, 11.0, 4.0, 1.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.6875, -20.850830078125, -20.01416015625, -19.177490234375, -18.3408203125, -17.504150390625, -16.66748046875, -15.830810546875, -14.994140625, -14.157470703125, -13.32080078125, -12.484130859375, -11.6474609375, -10.810791015625, -9.97412109375, -9.137451171875, -8.30078125, -7.464111328125, -6.62744140625, -5.790771484375, -4.9541015625, -4.117431640625, -3.28076171875, -2.444091796875, -1.607421875, -0.770751953125, 0.06591796875, 0.902587890625, 1.7392578125, 2.575927734375, 3.41259765625, 4.249267578125, 5.0859375, 5.922607421875, 6.75927734375, 7.595947265625, 8.4326171875, 9.269287109375, 10.10595703125, 10.942626953125, 11.779296875, 12.615966796875, 13.45263671875, 14.289306640625, 15.1259765625, 15.962646484375, 16.79931640625, 17.635986328125, 18.47265625, 19.309326171875, 20.14599609375, 20.982666015625, 21.8193359375, 22.656005859375, 23.49267578125, 24.329345703125, 25.166015625, 26.002685546875, 26.83935546875, 27.676025390625, 28.5126953125, 29.349365234375, 30.18603515625, 31.022705078125, 31.859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 10.0, 8.0, 12.0, 8.0, 11.0, 21.0, 32.0, 37.0, 50.0, 72.0, 114.0, 288.0, 805.0, 3226.0, 27854.0, 991921.0, 20026.0, 2764.0, 695.0, 250.0, 100.0, 72.0, 40.0, 27.0, 29.0, 12.0, 11.0, 17.0, 11.0, 12.0, 5.0, 2.0, 7.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.671875, -29.7548828125, -28.837890625, -27.9208984375, -27.00390625, -26.0869140625, -25.169921875, -24.2529296875, -23.3359375, -22.4189453125, -21.501953125, -20.5849609375, -19.66796875, -18.7509765625, -17.833984375, -16.9169921875, -16.0, -15.0830078125, -14.166015625, -13.2490234375, -12.33203125, -11.4150390625, -10.498046875, -9.5810546875, -8.6640625, -7.7470703125, -6.830078125, -5.9130859375, -4.99609375, -4.0791015625, -3.162109375, -2.2451171875, -1.328125, -0.4111328125, 0.505859375, 1.4228515625, 2.33984375, 3.2568359375, 4.173828125, 5.0908203125, 6.0078125, 6.9248046875, 7.841796875, 8.7587890625, 9.67578125, 10.5927734375, 11.509765625, 12.4267578125, 13.34375, 14.2607421875, 15.177734375, 16.0947265625, 17.01171875, 17.9287109375, 18.845703125, 19.7626953125, 20.6796875, 21.5966796875, 22.513671875, 23.4306640625, 24.34765625, 25.2646484375, 26.181640625, 27.0986328125, 28.015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 20.0, 46.0, 124.0, 255.0, 289.0, 150.0, 58.0, 31.0, 11.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022640228271484375, -0.0021701157093048096, -0.0020762085914611816, -0.0019823014736175537, -0.0018883943557739258, -0.0017944872379302979, -0.00170058012008667, -0.001606673002243042, -0.001512765884399414, -0.0014188587665557861, -0.0013249516487121582, -0.0012310445308685303, -0.0011371374130249023, -0.0010432302951812744, -0.0009493231773376465, -0.0008554160594940186, -0.0007615089416503906, -0.0006676018238067627, -0.0005736947059631348, -0.00047978758811950684, -0.0003858804702758789, -0.000291973352432251, -0.00019806623458862305, -0.00010415911674499512, -1.0251998901367188e-05, 8.365511894226074e-05, 0.00017756223678588867, 0.0002714693546295166, 0.00036537647247314453, 0.00045928359031677246, 0.0005531907081604004, 0.0006470978260040283, 0.0007410049438476562, 0.0008349120616912842, 0.0009288191795349121, 0.00102272629737854, 0.001116633415222168, 0.001210540533065796, 0.0013044476509094238, 0.0013983547687530518, 0.0014922618865966797, 0.0015861690044403076, 0.0016800761222839355, 0.0017739832401275635, 0.0018678903579711914, 0.0019617974758148193, 0.0020557045936584473, 0.002149611711502075, 0.002243518829345703, 0.002337425947189331, 0.002431333065032959, 0.002525240182876587, 0.002619147300720215, 0.0027130544185638428, 0.0028069615364074707, 0.0029008686542510986, 0.0029947757720947266, 0.0030886828899383545, 0.0031825900077819824, 0.0032764971256256104, 0.0033704042434692383, 0.003464311361312866, 0.003558218479156494, 0.003652125597000122, 0.00374603271484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 9.0, 14.0, 18.0, 70.0, 135.0, 237.0, 539.0, 1279.0, 3402.0, 14659.0, 388488.0, 615455.0, 17829.0, 3965.0, 1396.0, 557.0, 258.0, 109.0, 44.0, 27.0, 17.0, 10.0, 5.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.9609375, -14.4459228515625, -13.930908203125, -13.4158935546875, -12.90087890625, -12.3858642578125, -11.870849609375, -11.3558349609375, -10.8408203125, -10.3258056640625, -9.810791015625, -9.2957763671875, -8.78076171875, -8.2657470703125, -7.750732421875, -7.2357177734375, -6.720703125, -6.2056884765625, -5.690673828125, -5.1756591796875, -4.66064453125, -4.1456298828125, -3.630615234375, -3.1156005859375, -2.6005859375, -2.0855712890625, -1.570556640625, -1.0555419921875, -0.54052734375, -0.0255126953125, 0.489501953125, 1.0045166015625, 1.51953125, 2.0345458984375, 2.549560546875, 3.0645751953125, 3.57958984375, 4.0946044921875, 4.609619140625, 5.1246337890625, 5.6396484375, 6.1546630859375, 6.669677734375, 7.1846923828125, 7.69970703125, 8.2147216796875, 8.729736328125, 9.2447509765625, 9.759765625, 10.2747802734375, 10.789794921875, 11.3048095703125, 11.81982421875, 12.3348388671875, 12.849853515625, 13.3648681640625, 13.8798828125, 14.3948974609375, 14.909912109375, 15.4249267578125, 15.93994140625, 16.4549560546875, 16.969970703125, 17.4849853515625, 18.0]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 2.0, 7.0, 11.0, 10.0, 24.0, 43.0, 53.0, 99.0, 139.0, 229.0, 155.0, 84.0, 48.0, 29.0, 18.0, 5.0, 11.0, 7.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.09375, -16.568359375, -16.04296875, -15.517578125, -14.9921875, -14.466796875, -13.94140625, -13.416015625, -12.890625, -12.365234375, -11.83984375, -11.314453125, -10.7890625, -10.263671875, -9.73828125, -9.212890625, -8.6875, -8.162109375, -7.63671875, -7.111328125, -6.5859375, -6.060546875, -5.53515625, -5.009765625, -4.484375, -3.958984375, -3.43359375, -2.908203125, -2.3828125, -1.857421875, -1.33203125, -0.806640625, -0.28125, 0.244140625, 0.76953125, 1.294921875, 1.8203125, 2.345703125, 2.87109375, 3.396484375, 3.921875, 4.447265625, 4.97265625, 5.498046875, 6.0234375, 6.548828125, 7.07421875, 7.599609375, 8.125, 8.650390625, 9.17578125, 9.701171875, 10.2265625, 10.751953125, 11.27734375, 11.802734375, 12.328125, 12.853515625, 13.37890625, 13.904296875, 14.4296875, 14.955078125, 15.48046875, 16.005859375, 16.53125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 11.0, 74.0, 318.0, 442.0, 129.0, 29.0, 5.0, 1.0, 1.0], "bins": [-972.9915161132812, -956.272705078125, -939.553955078125, -922.8351440429688, -906.1163940429688, -889.3975830078125, -872.6788330078125, -855.9600219726562, -839.2412109375, -822.5223999023438, -805.8036499023438, -789.0848388671875, -772.3660888671875, -755.6472778320312, -738.928466796875, -722.209716796875, -705.490966796875, -688.7721557617188, -672.0534057617188, -655.3345947265625, -638.6158447265625, -621.8970336914062, -605.17822265625, -588.45947265625, -571.7406616210938, -555.0218505859375, -538.3031005859375, -521.5842895507812, -504.8655090332031, -488.146728515625, -471.4279479980469, -454.70916748046875, -437.99029541015625, -421.2715148925781, -404.552734375, -387.83392333984375, -371.1151428222656, -354.3963623046875, -337.6775817871094, -320.95880126953125, -304.2400207519531, -287.521240234375, -270.8024597167969, -254.0836639404297, -237.3648681640625, -220.64608764648438, -203.92730712890625, -187.20852661132812, -170.48971557617188, -153.77093505859375, -137.05213928222656, -120.33335876464844, -103.61457061767578, -86.89578247070312, -70.177001953125, -53.458213806152344, -36.73943328857422, -20.020647048950195, -3.301860809326172, 13.416923522949219, 30.135711669921875, 46.85449981689453, 63.573280334472656, 80.29206848144531, 97.01085662841797]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 11.0, 9.0, 11.0, 12.0, 15.0, 16.0, 20.0, 29.0, 44.0, 38.0, 36.0, 56.0, 58.0, 60.0, 63.0, 72.0, 68.0, 52.0, 52.0, 39.0, 39.0, 39.0, 27.0, 27.0, 16.0, 15.0, 17.0, 10.0, 7.0, 11.0, 5.0, 4.0, 6.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-112.86322021484375, -109.10414123535156, -105.3450698852539, -101.58599090576172, -97.82691955566406, -94.06784057617188, -90.30876159667969, -86.54969024658203, -82.79061889648438, -79.03153991699219, -75.27246856689453, -71.51338958740234, -67.75431823730469, -63.9952392578125, -60.23616409301758, -56.477088928222656, -52.71800994873047, -48.95893478393555, -45.199859619140625, -41.44078063964844, -37.68170928955078, -33.922630310058594, -30.163555145263672, -26.40447998046875, -22.645404815673828, -18.886329650878906, -15.127253532409668, -11.36817741394043, -7.609102249145508, -3.850027084350586, -0.09095001220703125, 3.6681251525878906, 7.4272003173828125, 11.186275482177734, 14.945351600646973, 18.70442771911621, 22.463502883911133, 26.222578048706055, 29.98165512084961, 33.74073028564453, 37.49980545043945, 41.258880615234375, 45.0179557800293, 48.77703094482422, 52.536109924316406, 56.29518127441406, 60.05426025390625, 63.81333541870117, 67.5724105834961, 71.33148956298828, 75.09056091308594, 78.84963989257812, 82.60871124267578, 86.36779022216797, 90.12686157226562, 93.88594055175781, 97.64501953125, 101.40409851074219, 105.16316986083984, 108.92224884033203, 112.68132019042969, 116.44039916992188, 120.19947814941406, 123.95854949951172, 127.71762084960938]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 6.0, 6.0, 5.0, 13.0, 16.0, 42.0, 74.0, 159.0, 607.0, 15412.0, 4176166.0, 1294.0, 277.0, 91.0, 52.0, 23.0, 16.0, 10.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-111.5, -108.654296875, -105.80859375, -102.962890625, -100.1171875, -97.271484375, -94.42578125, -91.580078125, -88.734375, -85.888671875, -83.04296875, -80.197265625, -77.3515625, -74.505859375, -71.66015625, -68.814453125, -65.96875, -63.123046875, -60.27734375, -57.431640625, -54.5859375, -51.740234375, -48.89453125, -46.048828125, -43.203125, -40.357421875, -37.51171875, -34.666015625, -31.8203125, -28.974609375, -26.12890625, -23.283203125, -20.4375, -17.591796875, -14.74609375, -11.900390625, -9.0546875, -6.208984375, -3.36328125, -0.517578125, 2.328125, 5.173828125, 8.01953125, 10.865234375, 13.7109375, 16.556640625, 19.40234375, 22.248046875, 25.09375, 27.939453125, 30.78515625, 33.630859375, 36.4765625, 39.322265625, 42.16796875, 45.013671875, 47.859375, 50.705078125, 53.55078125, 56.396484375, 59.2421875, 62.087890625, 64.93359375, 67.779296875, 70.625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 13.0, 8.0, 13.0, 22.0, 31.0, 37.0, 43.0, 60.0, 66.0, 86.0, 83.0, 103.0, 84.0, 92.0, 60.0, 45.0, 41.0, 31.0, 19.0, 16.0, 11.0, 8.0, 7.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.6021728515625, -5.423095703125, -5.2440185546875, -5.06494140625, -4.8858642578125, -4.706787109375, -4.5277099609375, -4.3486328125, -4.1695556640625, -3.990478515625, -3.8114013671875, -3.63232421875, -3.4532470703125, -3.274169921875, -3.0950927734375, -2.916015625, -2.7369384765625, -2.557861328125, -2.3787841796875, -2.19970703125, -2.0206298828125, -1.841552734375, -1.6624755859375, -1.4833984375, -1.3043212890625, -1.125244140625, -0.9461669921875, -0.76708984375, -0.5880126953125, -0.408935546875, -0.2298583984375, -0.05078125, 0.1282958984375, 0.307373046875, 0.4864501953125, 0.66552734375, 0.8446044921875, 1.023681640625, 1.2027587890625, 1.3818359375, 1.5609130859375, 1.739990234375, 1.9190673828125, 2.09814453125, 2.2772216796875, 2.456298828125, 2.6353759765625, 2.814453125, 2.9935302734375, 3.172607421875, 3.3516845703125, 3.53076171875, 3.7098388671875, 3.888916015625, 4.0679931640625, 4.2470703125, 4.4261474609375, 4.605224609375, 4.7843017578125, 4.96337890625, 5.1424560546875, 5.321533203125, 5.5006103515625, 5.6796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 4.0, 2.0, 8.0, 12.0, 20.0, 18.0, 28.0, 30.0, 50.0, 54.0, 68.0, 94.0, 113.0, 169.0, 261.0, 354.0, 603.0, 879.0, 1742.0, 3710.0, 10956.0, 339792.0, 3815371.0, 11541.0, 3810.0, 1817.0, 883.0, 537.0, 383.0, 265.0, 180.0, 138.0, 99.0, 51.0, 62.0, 38.0, 43.0, 28.0, 21.0, 9.0, 5.0, 7.0, 4.0, 7.0, 4.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.609375, -28.622802734375, -27.63623046875, -26.649658203125, -25.6630859375, -24.676513671875, -23.68994140625, -22.703369140625, -21.716796875, -20.730224609375, -19.74365234375, -18.757080078125, -17.7705078125, -16.783935546875, -15.79736328125, -14.810791015625, -13.82421875, -12.837646484375, -11.85107421875, -10.864501953125, -9.8779296875, -8.891357421875, -7.90478515625, -6.918212890625, -5.931640625, -4.945068359375, -3.95849609375, -2.971923828125, -1.9853515625, -0.998779296875, -0.01220703125, 0.974365234375, 1.9609375, 2.947509765625, 3.93408203125, 4.920654296875, 5.9072265625, 6.893798828125, 7.88037109375, 8.866943359375, 9.853515625, 10.840087890625, 11.82666015625, 12.813232421875, 13.7998046875, 14.786376953125, 15.77294921875, 16.759521484375, 17.74609375, 18.732666015625, 19.71923828125, 20.705810546875, 21.6923828125, 22.678955078125, 23.66552734375, 24.652099609375, 25.638671875, 26.625244140625, 27.61181640625, 28.598388671875, 29.5849609375, 30.571533203125, 31.55810546875, 32.544677734375, 33.53125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 8.0, 5.0, 22.0, 32.0, 3711.0, 204.0, 44.0, 17.0, 5.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7418212890625, -8.475830078125, -8.2098388671875, -7.94384765625, -7.6778564453125, -7.411865234375, -7.1458740234375, -6.8798828125, -6.6138916015625, -6.347900390625, -6.0819091796875, -5.81591796875, -5.5499267578125, -5.283935546875, -5.0179443359375, -4.751953125, -4.4859619140625, -4.219970703125, -3.9539794921875, -3.68798828125, -3.4219970703125, -3.156005859375, -2.8900146484375, -2.6240234375, -2.3580322265625, -2.092041015625, -1.8260498046875, -1.56005859375, -1.2940673828125, -1.028076171875, -0.7620849609375, -0.49609375, -0.2301025390625, 0.035888671875, 0.3018798828125, 0.56787109375, 0.8338623046875, 1.099853515625, 1.3658447265625, 1.6318359375, 1.8978271484375, 2.163818359375, 2.4298095703125, 2.69580078125, 2.9617919921875, 3.227783203125, 3.4937744140625, 3.759765625, 4.0257568359375, 4.291748046875, 4.5577392578125, 4.82373046875, 5.0897216796875, 5.355712890625, 5.6217041015625, 5.8876953125, 6.1536865234375, 6.419677734375, 6.6856689453125, 6.95166015625, 7.2176513671875, 7.483642578125, 7.7496337890625, 8.015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 4.0, 15.0, 18.0, 35.0, 40.0, 67.0, 85.0, 112.0, 102.0, 103.0, 82.0, 104.0, 49.0, 49.0, 39.0, 21.0, 15.0, 13.0, 14.0, 6.0, 1.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.559917449951172, -22.930341720581055, -22.300765991210938, -21.671188354492188, -21.04161262512207, -20.412036895751953, -19.782459259033203, -19.152883529663086, -18.52330780029297, -17.89373207092285, -17.264156341552734, -16.634578704833984, -16.005002975463867, -15.37542724609375, -14.745850563049316, -14.116273880004883, -13.486698150634766, -12.857122421264648, -12.227545738220215, -11.597969055175781, -10.968393325805664, -10.338817596435547, -9.709240913391113, -9.07966423034668, -8.450088500976562, -7.820512294769287, -7.190936088562012, -6.561359882354736, -5.931783676147461, -5.3022074699401855, -4.67263126373291, -4.043055057525635, -3.4134788513183594, -2.783902645111084, -2.1543264389038086, -1.5247502326965332, -0.8951740264892578, -0.2655978202819824, 0.36397838592529297, 0.9935545921325684, 1.6231307983398438, 2.252707004547119, 2.8822832107543945, 3.51185941696167, 4.141435623168945, 4.771011829376221, 5.400588035583496, 6.0301642417907715, 6.659740447998047, 7.289316654205322, 7.918892860412598, 8.548469543457031, 9.178045272827148, 9.807621002197266, 10.4371976852417, 11.066774368286133, 11.69635009765625, 12.325925827026367, 12.9555025100708, 13.585079193115234, 14.214654922485352, 14.844230651855469, 15.473807334899902, 16.103384017944336, 16.732959747314453]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 6.0, 14.0, 5.0, 3.0, 7.0, 17.0, 13.0, 19.0, 22.0, 33.0, 24.0, 25.0, 24.0, 33.0, 41.0, 41.0, 40.0, 48.0, 37.0, 38.0, 39.0, 45.0, 48.0, 36.0, 30.0, 31.0, 27.0, 33.0, 28.0, 29.0, 19.0, 25.0, 15.0, 11.0, 13.0, 11.0, 12.0, 10.0, 12.0, 5.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.374119758605957, -11.031984329223633, -10.689848899841309, -10.347713470458984, -10.005577087402344, -9.66344165802002, -9.321306228637695, -8.979170799255371, -8.637035369873047, -8.294899940490723, -7.952764511108398, -7.610628604888916, -7.268493175506592, -6.926357746124268, -6.584221839904785, -6.242086410522461, -5.899950981140137, -5.5578155517578125, -5.215680122375488, -4.873544216156006, -4.531408786773682, -4.189273357391357, -3.847137689590454, -3.505002021789551, -3.1628665924072266, -2.8207311630249023, -2.478595495223999, -2.1364598274230957, -1.7943243980407715, -1.4521888494491577, -1.110053300857544, -0.7679176330566406, -0.4257831573486328, -0.08364760875701904, 0.2584879398345947, 0.6006234884262085, 0.9427590370178223, 1.284894585609436, 1.6270301342010498, 1.9691658020019531, 2.3113012313842773, 2.6534366607666016, 2.995572328567505, 3.337707996368408, 3.6798434257507324, 4.021978855133057, 4.364114761352539, 4.706250190734863, 5.0483856201171875, 5.390521049499512, 5.732656478881836, 6.074792385101318, 6.416927814483643, 6.759063243865967, 7.101199150085449, 7.443334579467773, 7.785470008850098, 8.127605438232422, 8.469740867614746, 8.81187629699707, 9.154012680053711, 9.496148109436035, 9.83828353881836, 10.180418968200684, 10.522554397583008]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 3.0, 14.0, 16.0, 14.0, 26.0, 34.0, 47.0, 96.0, 160.0, 251.0, 488.0, 1011.0, 2343.0, 6628.0, 26415.0, 183329.0, 675983.0, 122525.0, 19828.0, 5421.0, 1952.0, 874.0, 463.0, 225.0, 117.0, 87.0, 69.0, 37.0, 27.0, 11.0, 13.0, 11.0, 10.0, 7.0, 2.0, 3.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.484375, -19.9217529296875, -19.359130859375, -18.7965087890625, -18.23388671875, -17.6712646484375, -17.108642578125, -16.5460205078125, -15.9833984375, -15.4207763671875, -14.858154296875, -14.2955322265625, -13.73291015625, -13.1702880859375, -12.607666015625, -12.0450439453125, -11.482421875, -10.9197998046875, -10.357177734375, -9.7945556640625, -9.23193359375, -8.6693115234375, -8.106689453125, -7.5440673828125, -6.9814453125, -6.4188232421875, -5.856201171875, -5.2935791015625, -4.73095703125, -4.1683349609375, -3.605712890625, -3.0430908203125, -2.48046875, -1.9178466796875, -1.355224609375, -0.7926025390625, -0.22998046875, 0.3326416015625, 0.895263671875, 1.4578857421875, 2.0205078125, 2.5831298828125, 3.145751953125, 3.7083740234375, 4.27099609375, 4.8336181640625, 5.396240234375, 5.9588623046875, 6.521484375, 7.0841064453125, 7.646728515625, 8.2093505859375, 8.77197265625, 9.3345947265625, 9.897216796875, 10.4598388671875, 11.0224609375, 11.5850830078125, 12.147705078125, 12.7103271484375, 13.27294921875, 13.8355712890625, 14.398193359375, 14.9608154296875, 15.5234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 10.0, 7.0, 13.0, 15.0, 20.0, 28.0, 28.0, 30.0, 46.0, 45.0, 57.0, 62.0, 67.0, 74.0, 79.0, 64.0, 71.0, 53.0, 48.0, 48.0, 25.0, 16.0, 26.0, 12.0, 11.0, 13.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.9296875, -5.7677001953125, -5.605712890625, -5.4437255859375, -5.28173828125, -5.1197509765625, -4.957763671875, -4.7957763671875, -4.6337890625, -4.4718017578125, -4.309814453125, -4.1478271484375, -3.98583984375, -3.8238525390625, -3.661865234375, -3.4998779296875, -3.337890625, -3.1759033203125, -3.013916015625, -2.8519287109375, -2.68994140625, -2.5279541015625, -2.365966796875, -2.2039794921875, -2.0419921875, -1.8800048828125, -1.718017578125, -1.5560302734375, -1.39404296875, -1.2320556640625, -1.070068359375, -0.9080810546875, -0.74609375, -0.5841064453125, -0.422119140625, -0.2601318359375, -0.09814453125, 0.0638427734375, 0.225830078125, 0.3878173828125, 0.5498046875, 0.7117919921875, 0.873779296875, 1.0357666015625, 1.19775390625, 1.3597412109375, 1.521728515625, 1.6837158203125, 1.845703125, 2.0076904296875, 2.169677734375, 2.3316650390625, 2.49365234375, 2.6556396484375, 2.817626953125, 2.9796142578125, 3.1416015625, 3.3035888671875, 3.465576171875, 3.6275634765625, 3.78955078125, 3.9515380859375, 4.113525390625, 4.2755126953125, 4.4375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 10.0, 8.0, 12.0, 15.0, 37.0, 47.0, 63.0, 109.0, 186.0, 368.0, 678.0, 1540.0, 4364.0, 18529.0, 136945.0, 729288.0, 130862.0, 18225.0, 4334.0, 1441.0, 619.0, 356.0, 150.0, 112.0, 78.0, 49.0, 29.0, 31.0, 21.0, 12.0, 14.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.875, -20.269775390625, -19.66455078125, -19.059326171875, -18.4541015625, -17.848876953125, -17.24365234375, -16.638427734375, -16.033203125, -15.427978515625, -14.82275390625, -14.217529296875, -13.6123046875, -13.007080078125, -12.40185546875, -11.796630859375, -11.19140625, -10.586181640625, -9.98095703125, -9.375732421875, -8.7705078125, -8.165283203125, -7.56005859375, -6.954833984375, -6.349609375, -5.744384765625, -5.13916015625, -4.533935546875, -3.9287109375, -3.323486328125, -2.71826171875, -2.113037109375, -1.5078125, -0.902587890625, -0.29736328125, 0.307861328125, 0.9130859375, 1.518310546875, 2.12353515625, 2.728759765625, 3.333984375, 3.939208984375, 4.54443359375, 5.149658203125, 5.7548828125, 6.360107421875, 6.96533203125, 7.570556640625, 8.17578125, 8.781005859375, 9.38623046875, 9.991455078125, 10.5966796875, 11.201904296875, 11.80712890625, 12.412353515625, 13.017578125, 13.622802734375, 14.22802734375, 14.833251953125, 15.4384765625, 16.043701171875, 16.64892578125, 17.254150390625, 17.859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 0.0, 2.0, 5.0, 11.0, 13.0, 10.0, 16.0, 15.0, 32.0, 34.0, 32.0, 33.0, 43.0, 53.0, 49.0, 49.0, 50.0, 44.0, 61.0, 52.0, 44.0, 38.0, 42.0, 41.0, 27.0, 26.0, 37.0, 17.0, 24.0, 23.0, 17.0, 8.0, 11.0, 9.0, 6.0, 11.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.046875, -19.40625, -18.765625, -18.125, -17.484375, -16.84375, -16.203125, -15.5625, -14.921875, -14.28125, -13.640625, -13.0, -12.359375, -11.71875, -11.078125, -10.4375, -9.796875, -9.15625, -8.515625, -7.875, -7.234375, -6.59375, -5.953125, -5.3125, -4.671875, -4.03125, -3.390625, -2.75, -2.109375, -1.46875, -0.828125, -0.1875, 0.453125, 1.09375, 1.734375, 2.375, 3.015625, 3.65625, 4.296875, 4.9375, 5.578125, 6.21875, 6.859375, 7.5, 8.140625, 8.78125, 9.421875, 10.0625, 10.703125, 11.34375, 11.984375, 12.625, 13.265625, 13.90625, 14.546875, 15.1875, 15.828125, 16.46875, 17.109375, 17.75, 18.390625, 19.03125, 19.671875, 20.3125, 20.953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 9.0, 4.0, 6.0, 16.0, 15.0, 11.0, 20.0, 36.0, 48.0, 106.0, 150.0, 417.0, 1923.0, 38642.0, 986248.0, 18875.0, 1335.0, 306.0, 139.0, 87.0, 45.0, 34.0, 24.0, 16.0, 15.0, 10.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.8125, -21.8779296875, -20.943359375, -20.0087890625, -19.07421875, -18.1396484375, -17.205078125, -16.2705078125, -15.3359375, -14.4013671875, -13.466796875, -12.5322265625, -11.59765625, -10.6630859375, -9.728515625, -8.7939453125, -7.859375, -6.9248046875, -5.990234375, -5.0556640625, -4.12109375, -3.1865234375, -2.251953125, -1.3173828125, -0.3828125, 0.5517578125, 1.486328125, 2.4208984375, 3.35546875, 4.2900390625, 5.224609375, 6.1591796875, 7.09375, 8.0283203125, 8.962890625, 9.8974609375, 10.83203125, 11.7666015625, 12.701171875, 13.6357421875, 14.5703125, 15.5048828125, 16.439453125, 17.3740234375, 18.30859375, 19.2431640625, 20.177734375, 21.1123046875, 22.046875, 22.9814453125, 23.916015625, 24.8505859375, 25.78515625, 26.7197265625, 27.654296875, 28.5888671875, 29.5234375, 30.4580078125, 31.392578125, 32.3271484375, 33.26171875, 34.1962890625, 35.130859375, 36.0654296875, 37.0]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 9.0, 10.0, 20.0, 28.0, 44.0, 52.0, 78.0, 152.0, 168.0, 130.0, 100.0, 66.0, 33.0, 28.0, 24.0, 15.0, 11.0, 7.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012950897216796875, -0.0012351572513580322, -0.001175224781036377, -0.0011152923107147217, -0.0010553598403930664, -0.0009954273700714111, -0.0009354948997497559, -0.0008755624294281006, -0.0008156299591064453, -0.00075569748878479, -0.0006957650184631348, -0.0006358325481414795, -0.0005759000778198242, -0.0005159676074981689, -0.00045603513717651367, -0.0003961026668548584, -0.0003361701965332031, -0.00027623772621154785, -0.00021630525588989258, -0.0001563727855682373, -9.644031524658203e-05, -3.650784492492676e-05, 2.3424625396728516e-05, 8.335709571838379e-05, 0.00014328956604003906, 0.00020322203636169434, 0.0002631545066833496, 0.0003230869770050049, 0.00038301944732666016, 0.00044295191764831543, 0.0005028843879699707, 0.000562816858291626, 0.0006227493286132812, 0.0006826817989349365, 0.0007426142692565918, 0.0008025467395782471, 0.0008624792098999023, 0.0009224116802215576, 0.0009823441505432129, 0.0010422766208648682, 0.0011022090911865234, 0.0011621415615081787, 0.001222074031829834, 0.0012820065021514893, 0.0013419389724731445, 0.0014018714427947998, 0.001461803913116455, 0.0015217363834381104, 0.0015816688537597656, 0.001641601324081421, 0.0017015337944030762, 0.0017614662647247314, 0.0018213987350463867, 0.001881331205368042, 0.0019412636756896973, 0.0020011961460113525, 0.002061128616333008, 0.002121061086654663, 0.0021809935569763184, 0.0022409260272979736, 0.002300858497619629, 0.002360790967941284, 0.0024207234382629395, 0.0024806559085845947, 0.00254058837890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 18.0, 35.0, 41.0, 88.0, 146.0, 325.0, 708.0, 2155.0, 9913.0, 124047.0, 853798.0, 48930.0, 5697.0, 1493.0, 599.0, 250.0, 129.0, 58.0, 37.0, 22.0, 12.0, 15.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.140625, -18.6541748046875, -18.167724609375, -17.6812744140625, -17.19482421875, -16.7083740234375, -16.221923828125, -15.7354736328125, -15.2490234375, -14.7625732421875, -14.276123046875, -13.7896728515625, -13.30322265625, -12.8167724609375, -12.330322265625, -11.8438720703125, -11.357421875, -10.8709716796875, -10.384521484375, -9.8980712890625, -9.41162109375, -8.9251708984375, -8.438720703125, -7.9522705078125, -7.4658203125, -6.9793701171875, -6.492919921875, -6.0064697265625, -5.52001953125, -5.0335693359375, -4.547119140625, -4.0606689453125, -3.57421875, -3.0877685546875, -2.601318359375, -2.1148681640625, -1.62841796875, -1.1419677734375, -0.655517578125, -0.1690673828125, 0.3173828125, 0.8038330078125, 1.290283203125, 1.7767333984375, 2.26318359375, 2.7496337890625, 3.236083984375, 3.7225341796875, 4.208984375, 4.6954345703125, 5.181884765625, 5.6683349609375, 6.15478515625, 6.6412353515625, 7.127685546875, 7.6141357421875, 8.1005859375, 8.5870361328125, 9.073486328125, 9.5599365234375, 10.04638671875, 10.5328369140625, 11.019287109375, 11.5057373046875, 11.9921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 9.0, 15.0, 19.0, 22.0, 37.0, 55.0, 52.0, 97.0, 158.0, 108.0, 103.0, 80.0, 66.0, 38.0, 40.0, 26.0, 26.0, 9.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.234375, -11.9078369140625, -11.581298828125, -11.2547607421875, -10.92822265625, -10.6016845703125, -10.275146484375, -9.9486083984375, -9.6220703125, -9.2955322265625, -8.968994140625, -8.6424560546875, -8.31591796875, -7.9893798828125, -7.662841796875, -7.3363037109375, -7.009765625, -6.6832275390625, -6.356689453125, -6.0301513671875, -5.70361328125, -5.3770751953125, -5.050537109375, -4.7239990234375, -4.3974609375, -4.0709228515625, -3.744384765625, -3.4178466796875, -3.09130859375, -2.7647705078125, -2.438232421875, -2.1116943359375, -1.78515625, -1.4586181640625, -1.132080078125, -0.8055419921875, -0.47900390625, -0.1524658203125, 0.174072265625, 0.5006103515625, 0.8271484375, 1.1536865234375, 1.480224609375, 1.8067626953125, 2.13330078125, 2.4598388671875, 2.786376953125, 3.1129150390625, 3.439453125, 3.7659912109375, 4.092529296875, 4.4190673828125, 4.74560546875, 5.0721435546875, 5.398681640625, 5.7252197265625, 6.0517578125, 6.3782958984375, 6.704833984375, 7.0313720703125, 7.35791015625, 7.6844482421875, 8.010986328125, 8.3375244140625, 8.6640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 9.0, 30.0, 216.0, 453.0, 239.0, 44.0, 11.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-874.15185546875, -857.1844482421875, -840.217041015625, -823.2496948242188, -806.2822875976562, -789.3148803710938, -772.3475341796875, -755.380126953125, -738.4127197265625, -721.4453125, -704.4779052734375, -687.5105590820312, -670.5431518554688, -653.5757446289062, -636.6083984375, -619.6409912109375, -602.673583984375, -585.7061767578125, -568.73876953125, -551.7714233398438, -534.8040161132812, -517.8366088867188, -500.8692321777344, -483.90185546875, -466.9344482421875, -449.967041015625, -432.9996643066406, -416.03228759765625, -399.06488037109375, -382.09747314453125, -365.1300964355469, -348.1627197265625, -331.1952819824219, -314.2279052734375, -297.260498046875, -280.2930908203125, -263.3257141113281, -246.3583221435547, -229.39093017578125, -212.4235382080078, -195.45614624023438, -178.48875427246094, -161.5213623046875, -144.55397033691406, -127.58657836914062, -110.61918640136719, -93.65179443359375, -76.68440246582031, -59.717010498046875, -42.74961853027344, -25.7822265625, -8.814834594726562, 8.152557373046875, 25.119949340820312, 42.08734130859375, 59.05473327636719, 76.02212524414062, 92.98951721191406, 109.9569091796875, 126.92430114746094, 143.89169311523438, 160.8590850830078, 177.82647705078125, 194.7938690185547, 211.76126098632812]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 12.0, 13.0, 13.0, 20.0, 23.0, 24.0, 27.0, 25.0, 39.0, 41.0, 35.0, 42.0, 49.0, 51.0, 47.0, 55.0, 49.0, 50.0, 50.0, 50.0, 43.0, 33.0, 37.0, 35.0, 29.0, 25.0, 11.0, 5.0, 9.0, 11.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-99.05447387695312, -96.16991424560547, -93.28535461425781, -90.40079498291016, -87.5162353515625, -84.63166809082031, -81.74711608886719, -78.862548828125, -75.97798919677734, -73.09342956542969, -70.20886993408203, -67.32431030273438, -64.43975067138672, -61.5551872253418, -58.67062759399414, -55.78606414794922, -52.90150833129883, -50.01694869995117, -47.132389068603516, -44.247825622558594, -41.36326599121094, -38.47870635986328, -35.594146728515625, -32.70958709716797, -29.82502555847168, -26.940465927124023, -24.055904388427734, -21.171344757080078, -18.286785125732422, -15.402223587036133, -12.517663955688477, -9.633102416992188, -6.748542785644531, -3.8639824390411377, -0.9794220924377441, 1.9051380157470703, 4.789698600769043, 7.674259185791016, 10.558818817138672, 13.443380355834961, 16.327939987182617, 19.212499618530273, 22.097061157226562, 24.98162078857422, 27.866180419921875, 30.750741958618164, 33.63529968261719, 36.51986312866211, 39.404422760009766, 42.28898239135742, 45.17354202270508, 48.05810546875, 50.942665100097656, 53.82722473144531, 56.71178436279297, 59.596343994140625, 62.48090362548828, 65.36546325683594, 68.2500228881836, 71.13458251953125, 74.0191421508789, 76.90370178222656, 79.78826904296875, 82.6728286743164, 85.55738830566406]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 8.0, 18.0, 15.0, 25.0, 29.0, 43.0, 70.0, 129.0, 238.0, 466.0, 929.0, 2614.0, 11770.0, 4015564.0, 150716.0, 7939.0, 2048.0, 833.0, 375.0, 183.0, 99.0, 59.0, 32.0, 22.0, 19.0, 10.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-43.59375, -42.34423828125, -41.0947265625, -39.84521484375, -38.595703125, -37.34619140625, -36.0966796875, -34.84716796875, -33.59765625, -32.34814453125, -31.0986328125, -29.84912109375, -28.599609375, -27.35009765625, -26.1005859375, -24.85107421875, -23.6015625, -22.35205078125, -21.1025390625, -19.85302734375, -18.603515625, -17.35400390625, -16.1044921875, -14.85498046875, -13.60546875, -12.35595703125, -11.1064453125, -9.85693359375, -8.607421875, -7.35791015625, -6.1083984375, -4.85888671875, -3.609375, -2.35986328125, -1.1103515625, 0.13916015625, 1.388671875, 2.63818359375, 3.8876953125, 5.13720703125, 6.38671875, 7.63623046875, 8.8857421875, 10.13525390625, 11.384765625, 12.63427734375, 13.8837890625, 15.13330078125, 16.3828125, 17.63232421875, 18.8818359375, 20.13134765625, 21.380859375, 22.63037109375, 23.8798828125, 25.12939453125, 26.37890625, 27.62841796875, 28.8779296875, 30.12744140625, 31.376953125, 32.62646484375, 33.8759765625, 35.12548828125, 36.375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 11.0, 7.0, 5.0, 16.0, 34.0, 35.0, 44.0, 63.0, 76.0, 81.0, 105.0, 99.0, 109.0, 73.0, 69.0, 55.0, 44.0, 32.0, 10.0, 13.0, 8.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.401611328125, -8.18603515625, -7.970458984375, -7.7548828125, -7.539306640625, -7.32373046875, -7.108154296875, -6.892578125, -6.677001953125, -6.46142578125, -6.245849609375, -6.0302734375, -5.814697265625, -5.59912109375, -5.383544921875, -5.16796875, -4.952392578125, -4.73681640625, -4.521240234375, -4.3056640625, -4.090087890625, -3.87451171875, -3.658935546875, -3.443359375, -3.227783203125, -3.01220703125, -2.796630859375, -2.5810546875, -2.365478515625, -2.14990234375, -1.934326171875, -1.71875, -1.503173828125, -1.28759765625, -1.072021484375, -0.8564453125, -0.640869140625, -0.42529296875, -0.209716796875, 0.005859375, 0.221435546875, 0.43701171875, 0.652587890625, 0.8681640625, 1.083740234375, 1.29931640625, 1.514892578125, 1.73046875, 1.946044921875, 2.16162109375, 2.377197265625, 2.5927734375, 2.808349609375, 3.02392578125, 3.239501953125, 3.455078125, 3.670654296875, 3.88623046875, 4.101806640625, 4.3173828125, 4.532958984375, 4.74853515625, 4.964111328125, 5.1796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 3.0, 7.0, 9.0, 12.0, 12.0, 19.0, 40.0, 43.0, 68.0, 102.0, 185.0, 320.0, 541.0, 935.0, 1852.0, 4274.0, 10786.0, 37301.0, 3698945.0, 392672.0, 29427.0, 9153.0, 3792.0, 1732.0, 824.0, 487.0, 283.0, 163.0, 91.0, 72.0, 42.0, 25.0, 28.0, 12.0, 10.0, 4.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-34.875, -33.955322265625, -33.03564453125, -32.115966796875, -31.1962890625, -30.276611328125, -29.35693359375, -28.437255859375, -27.517578125, -26.597900390625, -25.67822265625, -24.758544921875, -23.8388671875, -22.919189453125, -21.99951171875, -21.079833984375, -20.16015625, -19.240478515625, -18.32080078125, -17.401123046875, -16.4814453125, -15.561767578125, -14.64208984375, -13.722412109375, -12.802734375, -11.883056640625, -10.96337890625, -10.043701171875, -9.1240234375, -8.204345703125, -7.28466796875, -6.364990234375, -5.4453125, -4.525634765625, -3.60595703125, -2.686279296875, -1.7666015625, -0.846923828125, 0.07275390625, 0.992431640625, 1.912109375, 2.831787109375, 3.75146484375, 4.671142578125, 5.5908203125, 6.510498046875, 7.43017578125, 8.349853515625, 9.26953125, 10.189208984375, 11.10888671875, 12.028564453125, 12.9482421875, 13.867919921875, 14.78759765625, 15.707275390625, 16.626953125, 17.546630859375, 18.46630859375, 19.385986328125, 20.3056640625, 21.225341796875, 22.14501953125, 23.064697265625, 23.984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 9.0, 4.0, 15.0, 20.0, 28.0, 37.0, 89.0, 220.0, 3214.0, 228.0, 73.0, 38.0, 19.0, 14.0, 12.0, 9.0, 5.0, 6.0, 2.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.6484375, -15.252197265625, -14.85595703125, -14.459716796875, -14.0634765625, -13.667236328125, -13.27099609375, -12.874755859375, -12.478515625, -12.082275390625, -11.68603515625, -11.289794921875, -10.8935546875, -10.497314453125, -10.10107421875, -9.704833984375, -9.30859375, -8.912353515625, -8.51611328125, -8.119873046875, -7.7236328125, -7.327392578125, -6.93115234375, -6.534912109375, -6.138671875, -5.742431640625, -5.34619140625, -4.949951171875, -4.5537109375, -4.157470703125, -3.76123046875, -3.364990234375, -2.96875, -2.572509765625, -2.17626953125, -1.780029296875, -1.3837890625, -0.987548828125, -0.59130859375, -0.195068359375, 0.201171875, 0.597412109375, 0.99365234375, 1.389892578125, 1.7861328125, 2.182373046875, 2.57861328125, 2.974853515625, 3.37109375, 3.767333984375, 4.16357421875, 4.559814453125, 4.9560546875, 5.352294921875, 5.74853515625, 6.144775390625, 6.541015625, 6.937255859375, 7.33349609375, 7.729736328125, 8.1259765625, 8.522216796875, 8.91845703125, 9.314697265625, 9.7109375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 7.0, 9.0, 12.0, 14.0, 23.0, 47.0, 66.0, 108.0, 106.0, 136.0, 105.0, 87.0, 84.0, 63.0, 38.0, 19.0, 19.0, 16.0, 7.0, 12.0, 8.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.619911193847656, -51.10145568847656, -49.58300018310547, -48.064544677734375, -46.54608917236328, -45.02763366699219, -43.509178161621094, -41.99072265625, -40.472267150878906, -38.95381164550781, -37.43535614013672, -35.916900634765625, -34.39844512939453, -32.87998962402344, -31.36153221130371, -29.843076705932617, -28.32461929321289, -26.806163787841797, -25.287708282470703, -23.76925277709961, -22.250797271728516, -20.732341766357422, -19.213884353637695, -17.6954288482666, -16.176973342895508, -14.658517837524414, -13.14006233215332, -11.62160587310791, -10.103150367736816, -8.584694862365723, -7.0662384033203125, -5.547782897949219, -4.029331207275391, -2.5108754634857178, -0.9924197196960449, 0.526036262512207, 2.044491767883301, 3.5629472732543945, 5.081403732299805, 6.599859237670898, 8.118314743041992, 9.636770248413086, 11.15522575378418, 12.67368221282959, 14.192137718200684, 15.710593223571777, 17.229049682617188, 18.74750518798828, 20.265960693359375, 21.78441619873047, 23.302871704101562, 24.821327209472656, 26.33978271484375, 27.858238220214844, 29.37669563293457, 30.895151138305664, 32.413604736328125, 33.93206024169922, 35.45051574707031, 36.968971252441406, 38.4874267578125, 40.005882263183594, 41.52433776855469, 43.04279327392578, 44.56125259399414]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 9.0, 5.0, 11.0, 7.0, 14.0, 8.0, 29.0, 28.0, 20.0, 26.0, 26.0, 23.0, 24.0, 41.0, 26.0, 45.0, 39.0, 39.0, 48.0, 44.0, 47.0, 50.0, 49.0, 40.0, 40.0, 37.0, 34.0, 22.0, 21.0, 26.0, 14.0, 15.0, 26.0, 8.0, 13.0, 12.0, 4.0, 10.0, 6.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.727922439575195, -25.821088790893555, -24.914257049560547, -24.007423400878906, -23.100589752197266, -22.193756103515625, -21.286924362182617, -20.380090713500977, -19.47325897216797, -18.566425323486328, -17.65959358215332, -16.75275993347168, -15.845926284790039, -14.939093589782715, -14.03226089477539, -13.12542724609375, -12.21859359741211, -11.311760902404785, -10.404927253723145, -9.49809455871582, -8.59126091003418, -7.6844282150268555, -6.777595520019531, -5.870762348175049, -4.963929176330566, -4.057096004486084, -3.1502630710601807, -2.2434301376342773, -1.336596965789795, -0.4297637939453125, 0.4770689010620117, 1.3839020729064941, 2.2907333374023438, 3.197566509246826, 4.104399681091309, 5.011232376098633, 5.918065547943115, 6.824898719787598, 7.731731414794922, 8.638565063476562, 9.545397758483887, 10.452230453491211, 11.359064102172852, 12.265896797180176, 13.1727294921875, 14.07956314086914, 14.986395835876465, 15.893228530883789, 16.80006217956543, 17.70689582824707, 18.613727569580078, 19.52056121826172, 20.42739486694336, 21.334228515625, 22.241060256958008, 23.14789390563965, 24.054725646972656, 24.961559295654297, 25.868391036987305, 26.775224685668945, 27.682058334350586, 28.588890075683594, 29.495723724365234, 30.402557373046875, 31.309391021728516]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 6.0, 7.0, 10.0, 28.0, 34.0, 63.0, 94.0, 171.0, 344.0, 759.0, 1933.0, 5661.0, 20512.0, 93076.0, 497123.0, 344902.0, 62294.0, 14539.0, 4223.0, 1533.0, 622.0, 287.0, 133.0, 76.0, 56.0, 25.0, 9.0, 8.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.40625, -11.839111328125, -11.27197265625, -10.704833984375, -10.1376953125, -9.570556640625, -9.00341796875, -8.436279296875, -7.869140625, -7.302001953125, -6.73486328125, -6.167724609375, -5.6005859375, -5.033447265625, -4.46630859375, -3.899169921875, -3.33203125, -2.764892578125, -2.19775390625, -1.630615234375, -1.0634765625, -0.496337890625, 0.07080078125, 0.637939453125, 1.205078125, 1.772216796875, 2.33935546875, 2.906494140625, 3.4736328125, 4.040771484375, 4.60791015625, 5.175048828125, 5.7421875, 6.309326171875, 6.87646484375, 7.443603515625, 8.0107421875, 8.577880859375, 9.14501953125, 9.712158203125, 10.279296875, 10.846435546875, 11.41357421875, 11.980712890625, 12.5478515625, 13.114990234375, 13.68212890625, 14.249267578125, 14.81640625, 15.383544921875, 15.95068359375, 16.517822265625, 17.0849609375, 17.652099609375, 18.21923828125, 18.786376953125, 19.353515625, 19.920654296875, 20.48779296875, 21.054931640625, 21.6220703125, 22.189208984375, 22.75634765625, 23.323486328125, 23.890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 1.0, 0.0, 8.0, 11.0, 12.0, 14.0, 20.0, 31.0, 31.0, 34.0, 53.0, 40.0, 61.0, 73.0, 74.0, 80.0, 87.0, 76.0, 63.0, 50.0, 47.0, 36.0, 29.0, 21.0, 17.0, 7.0, 9.0, 5.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.421875, -7.21685791015625, -7.0118408203125, -6.80682373046875, -6.601806640625, -6.39678955078125, -6.1917724609375, -5.98675537109375, -5.78173828125, -5.57672119140625, -5.3717041015625, -5.16668701171875, -4.961669921875, -4.75665283203125, -4.5516357421875, -4.34661865234375, -4.1416015625, -3.93658447265625, -3.7315673828125, -3.52655029296875, -3.321533203125, -3.11651611328125, -2.9114990234375, -2.70648193359375, -2.50146484375, -2.29644775390625, -2.0914306640625, -1.88641357421875, -1.681396484375, -1.47637939453125, -1.2713623046875, -1.06634521484375, -0.861328125, -0.65631103515625, -0.4512939453125, -0.24627685546875, -0.041259765625, 0.16375732421875, 0.3687744140625, 0.57379150390625, 0.77880859375, 0.98382568359375, 1.1888427734375, 1.39385986328125, 1.598876953125, 1.80389404296875, 2.0089111328125, 2.21392822265625, 2.4189453125, 2.62396240234375, 2.8289794921875, 3.03399658203125, 3.239013671875, 3.44403076171875, 3.6490478515625, 3.85406494140625, 4.05908203125, 4.26409912109375, 4.4691162109375, 4.67413330078125, 4.879150390625, 5.08416748046875, 5.2891845703125, 5.49420166015625, 5.69921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 7.0, 9.0, 15.0, 18.0, 25.0, 24.0, 30.0, 39.0, 65.0, 78.0, 123.0, 199.0, 319.0, 504.0, 1029.0, 2354.0, 6711.0, 25343.0, 133265.0, 615474.0, 211270.0, 36613.0, 9106.0, 3080.0, 1201.0, 594.0, 361.0, 210.0, 143.0, 100.0, 78.0, 41.0, 28.0, 26.0, 15.0, 19.0, 10.0, 8.0, 6.0, 0.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6796875, -14.1282958984375, -13.576904296875, -13.0255126953125, -12.47412109375, -11.9227294921875, -11.371337890625, -10.8199462890625, -10.2685546875, -9.7171630859375, -9.165771484375, -8.6143798828125, -8.06298828125, -7.5115966796875, -6.960205078125, -6.4088134765625, -5.857421875, -5.3060302734375, -4.754638671875, -4.2032470703125, -3.65185546875, -3.1004638671875, -2.549072265625, -1.9976806640625, -1.4462890625, -0.8948974609375, -0.343505859375, 0.2078857421875, 0.75927734375, 1.3106689453125, 1.862060546875, 2.4134521484375, 2.96484375, 3.5162353515625, 4.067626953125, 4.6190185546875, 5.17041015625, 5.7218017578125, 6.273193359375, 6.8245849609375, 7.3759765625, 7.9273681640625, 8.478759765625, 9.0301513671875, 9.58154296875, 10.1329345703125, 10.684326171875, 11.2357177734375, 11.787109375, 12.3385009765625, 12.889892578125, 13.4412841796875, 13.99267578125, 14.5440673828125, 15.095458984375, 15.6468505859375, 16.1982421875, 16.7496337890625, 17.301025390625, 17.8524169921875, 18.40380859375, 18.9552001953125, 19.506591796875, 20.0579833984375, 20.609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 12.0, 4.0, 9.0, 6.0, 10.0, 22.0, 16.0, 23.0, 18.0, 26.0, 31.0, 32.0, 26.0, 44.0, 51.0, 42.0, 40.0, 44.0, 46.0, 43.0, 45.0, 45.0, 39.0, 57.0, 36.0, 31.0, 32.0, 36.0, 21.0, 24.0, 13.0, 16.0, 7.0, 13.0, 11.0, 3.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.09375, -19.442626953125, -18.79150390625, -18.140380859375, -17.4892578125, -16.838134765625, -16.18701171875, -15.535888671875, -14.884765625, -14.233642578125, -13.58251953125, -12.931396484375, -12.2802734375, -11.629150390625, -10.97802734375, -10.326904296875, -9.67578125, -9.024658203125, -8.37353515625, -7.722412109375, -7.0712890625, -6.420166015625, -5.76904296875, -5.117919921875, -4.466796875, -3.815673828125, -3.16455078125, -2.513427734375, -1.8623046875, -1.211181640625, -0.56005859375, 0.091064453125, 0.7421875, 1.393310546875, 2.04443359375, 2.695556640625, 3.3466796875, 3.997802734375, 4.64892578125, 5.300048828125, 5.951171875, 6.602294921875, 7.25341796875, 7.904541015625, 8.5556640625, 9.206787109375, 9.85791015625, 10.509033203125, 11.16015625, 11.811279296875, 12.46240234375, 13.113525390625, 13.7646484375, 14.415771484375, 15.06689453125, 15.718017578125, 16.369140625, 17.020263671875, 17.67138671875, 18.322509765625, 18.9736328125, 19.624755859375, 20.27587890625, 20.927001953125, 21.578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 8.0, 18.0, 30.0, 39.0, 57.0, 139.0, 255.0, 625.0, 1905.0, 10040.0, 186240.0, 805012.0, 38080.0, 4178.0, 1100.0, 411.0, 176.0, 97.0, 46.0, 29.0, 23.0, 11.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.15673828125, -7.8681640625, -7.57958984375, -7.291015625, -7.00244140625, -6.7138671875, -6.42529296875, -6.13671875, -5.84814453125, -5.5595703125, -5.27099609375, -4.982421875, -4.69384765625, -4.4052734375, -4.11669921875, -3.828125, -3.53955078125, -3.2509765625, -2.96240234375, -2.673828125, -2.38525390625, -2.0966796875, -1.80810546875, -1.51953125, -1.23095703125, -0.9423828125, -0.65380859375, -0.365234375, -0.07666015625, 0.2119140625, 0.50048828125, 0.7890625, 1.07763671875, 1.3662109375, 1.65478515625, 1.943359375, 2.23193359375, 2.5205078125, 2.80908203125, 3.09765625, 3.38623046875, 3.6748046875, 3.96337890625, 4.251953125, 4.54052734375, 4.8291015625, 5.11767578125, 5.40625, 5.69482421875, 5.9833984375, 6.27197265625, 6.560546875, 6.84912109375, 7.1376953125, 7.42626953125, 7.71484375, 8.00341796875, 8.2919921875, 8.58056640625, 8.869140625, 9.15771484375, 9.4462890625, 9.73486328125, 10.0234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 9.0, 7.0, 11.0, 22.0, 35.0, 38.0, 61.0, 90.0, 112.0, 133.0, 125.0, 114.0, 70.0, 54.0, 34.0, 18.0, 19.0, 14.0, 12.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00115966796875, -0.0011193007230758667, -0.0010789334774017334, -0.0010385662317276, -0.0009981989860534668, -0.0009578317403793335, -0.0009174644947052002, -0.0008770972490310669, -0.0008367300033569336, -0.0007963627576828003, -0.000755995512008667, -0.0007156282663345337, -0.0006752610206604004, -0.0006348937749862671, -0.0005945265293121338, -0.0005541592836380005, -0.0005137920379638672, -0.0004734247922897339, -0.0004330575466156006, -0.0003926903009414673, -0.000352323055267334, -0.0003119558095932007, -0.0002715885639190674, -0.00023122131824493408, -0.00019085407257080078, -0.00015048682689666748, -0.00011011958122253418, -6.975233554840088e-05, -2.9385089874267578e-05, 1.0982155799865723e-05, 5.1349401473999023e-05, 9.171664714813232e-05, 0.00013208389282226562, 0.00017245113849639893, 0.00021281838417053223, 0.00025318562984466553, 0.00029355287551879883, 0.00033392012119293213, 0.00037428736686706543, 0.00041465461254119873, 0.00045502185821533203, 0.0004953891038894653, 0.0005357563495635986, 0.0005761235952377319, 0.0006164908409118652, 0.0006568580865859985, 0.0006972253322601318, 0.0007375925779342651, 0.0007779598236083984, 0.0008183270692825317, 0.000858694314956665, 0.0008990615606307983, 0.0009394288063049316, 0.000979796051979065, 0.0010201632976531982, 0.0010605305433273315, 0.0011008977890014648, 0.0011412650346755981, 0.0011816322803497314, 0.0012219995260238647, 0.001262366771697998, 0.0013027340173721313, 0.0013431012630462646, 0.001383468508720398, 0.0014238357543945312]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 1.0, 9.0, 20.0, 51.0, 68.0, 127.0, 322.0, 846.0, 3593.0, 37488.0, 857882.0, 138915.0, 7000.0, 1358.0, 469.0, 212.0, 90.0, 38.0, 25.0, 13.0, 5.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6171875, -13.282470703125, -12.94775390625, -12.613037109375, -12.2783203125, -11.943603515625, -11.60888671875, -11.274169921875, -10.939453125, -10.604736328125, -10.27001953125, -9.935302734375, -9.6005859375, -9.265869140625, -8.93115234375, -8.596435546875, -8.26171875, -7.927001953125, -7.59228515625, -7.257568359375, -6.9228515625, -6.588134765625, -6.25341796875, -5.918701171875, -5.583984375, -5.249267578125, -4.91455078125, -4.579833984375, -4.2451171875, -3.910400390625, -3.57568359375, -3.240966796875, -2.90625, -2.571533203125, -2.23681640625, -1.902099609375, -1.5673828125, -1.232666015625, -0.89794921875, -0.563232421875, -0.228515625, 0.106201171875, 0.44091796875, 0.775634765625, 1.1103515625, 1.445068359375, 1.77978515625, 2.114501953125, 2.44921875, 2.783935546875, 3.11865234375, 3.453369140625, 3.7880859375, 4.122802734375, 4.45751953125, 4.792236328125, 5.126953125, 5.461669921875, 5.79638671875, 6.131103515625, 6.4658203125, 6.800537109375, 7.13525390625, 7.469970703125, 7.8046875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 11.0, 8.0, 12.0, 13.0, 19.0, 31.0, 46.0, 58.0, 69.0, 119.0, 96.0, 92.0, 91.0, 84.0, 57.0, 50.0, 42.0, 30.0, 19.0, 23.0, 10.0, 4.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.2734375, -8.038330078125, -7.80322265625, -7.568115234375, -7.3330078125, -7.097900390625, -6.86279296875, -6.627685546875, -6.392578125, -6.157470703125, -5.92236328125, -5.687255859375, -5.4521484375, -5.217041015625, -4.98193359375, -4.746826171875, -4.51171875, -4.276611328125, -4.04150390625, -3.806396484375, -3.5712890625, -3.336181640625, -3.10107421875, -2.865966796875, -2.630859375, -2.395751953125, -2.16064453125, -1.925537109375, -1.6904296875, -1.455322265625, -1.22021484375, -0.985107421875, -0.75, -0.514892578125, -0.27978515625, -0.044677734375, 0.1904296875, 0.425537109375, 0.66064453125, 0.895751953125, 1.130859375, 1.365966796875, 1.60107421875, 1.836181640625, 2.0712890625, 2.306396484375, 2.54150390625, 2.776611328125, 3.01171875, 3.246826171875, 3.48193359375, 3.717041015625, 3.9521484375, 4.187255859375, 4.42236328125, 4.657470703125, 4.892578125, 5.127685546875, 5.36279296875, 5.597900390625, 5.8330078125, 6.068115234375, 6.30322265625, 6.538330078125, 6.7734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 9.0, 20.0, 54.0, 106.0, 163.0, 226.0, 186.0, 117.0, 65.0, 26.0, 14.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-304.8187255859375, -297.9580078125, -291.0973205566406, -284.2366027832031, -277.3758850097656, -270.51519775390625, -263.65447998046875, -256.79376220703125, -249.93307495117188, -243.07237243652344, -236.21165466308594, -229.3509521484375, -222.49024963378906, -215.62954711914062, -208.76882934570312, -201.9081268310547, -195.0474090576172, -188.18670654296875, -181.32598876953125, -174.4652862548828, -167.60458374023438, -160.74386596679688, -153.88316345214844, -147.0224609375, -140.1617431640625, -133.30104064941406, -126.4403305053711, -119.57962036132812, -112.71891784667969, -105.85820770263672, -98.99749755859375, -92.13679504394531, -85.27609252929688, -78.4153823852539, -71.55467987060547, -64.6939697265625, -57.8332633972168, -50.972557067871094, -44.111846923828125, -37.25114059448242, -30.39043426513672, -23.529727935791016, -16.66901969909668, -9.808311462402344, -2.9476051330566406, 3.9131011962890625, 10.773811340332031, 17.634517669677734, 24.495223999023438, 31.35593032836914, 38.216636657714844, 45.07734680175781, 51.938053131103516, 58.79875946044922, 65.65946960449219, 72.52017211914062, 79.3808822631836, 86.24159240722656, 93.102294921875, 99.96300506591797, 106.82371520996094, 113.68441772460938, 120.54512786865234, 127.40583801269531, 134.26654052734375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 5.0, 9.0, 13.0, 17.0, 16.0, 17.0, 24.0, 23.0, 33.0, 31.0, 43.0, 45.0, 49.0, 40.0, 54.0, 55.0, 70.0, 59.0, 42.0, 46.0, 29.0, 45.0, 37.0, 29.0, 34.0, 21.0, 20.0, 16.0, 17.0, 12.0, 10.0, 7.0, 9.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.0716552734375, -102.79878234863281, -99.52590942382812, -96.2530288696289, -92.98015594482422, -89.70728302001953, -86.43440246582031, -83.16152954101562, -79.88865661621094, -76.61578369140625, -73.34291076660156, -70.07003021240234, -66.79715728759766, -63.52428436279297, -60.251407623291016, -56.97853088378906, -53.705657958984375, -50.43278503417969, -47.159908294677734, -43.88703155517578, -40.614158630371094, -37.341285705566406, -34.06840896606445, -30.795534133911133, -27.522659301757812, -24.249784469604492, -20.976909637451172, -17.70403480529785, -14.431159973144531, -11.158285140991211, -7.885410308837891, -4.61253547668457, -1.33966064453125, 1.9332141876220703, 5.206089019775391, 8.478963851928711, 11.751838684082031, 15.024713516235352, 18.297588348388672, 21.570463180541992, 24.843338012695312, 28.116212844848633, 31.389087677001953, 34.661964416503906, 37.934837341308594, 41.20771026611328, 44.480587005615234, 47.75346374511719, 51.026336669921875, 54.29920959472656, 57.572086334228516, 60.84496307373047, 64.11783599853516, 67.39070892333984, 70.66358947753906, 73.93646240234375, 77.20933532714844, 80.48220825195312, 83.75508117675781, 87.02796173095703, 90.30083465576172, 93.5737075805664, 96.84658813476562, 100.11946105957031, 103.392333984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 6.0, 5.0, 11.0, 12.0, 25.0, 32.0, 51.0, 73.0, 92.0, 167.0, 314.0, 525.0, 1057.0, 2560.0, 6244.0, 18467.0, 84768.0, 2935680.0, 1060714.0, 59462.0, 15024.0, 5173.0, 2007.0, 918.0, 400.0, 225.0, 119.0, 65.0, 29.0, 24.0, 13.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.15625, -16.7467041015625, -16.337158203125, -15.9276123046875, -15.51806640625, -15.1085205078125, -14.698974609375, -14.2894287109375, -13.8798828125, -13.4703369140625, -13.060791015625, -12.6512451171875, -12.24169921875, -11.8321533203125, -11.422607421875, -11.0130615234375, -10.603515625, -10.1939697265625, -9.784423828125, -9.3748779296875, -8.96533203125, -8.5557861328125, -8.146240234375, -7.7366943359375, -7.3271484375, -6.9176025390625, -6.508056640625, -6.0985107421875, -5.68896484375, -5.2794189453125, -4.869873046875, -4.4603271484375, -4.05078125, -3.6412353515625, -3.231689453125, -2.8221435546875, -2.41259765625, -2.0030517578125, -1.593505859375, -1.1839599609375, -0.7744140625, -0.3648681640625, 0.044677734375, 0.4542236328125, 0.86376953125, 1.2733154296875, 1.682861328125, 2.0924072265625, 2.501953125, 2.9114990234375, 3.321044921875, 3.7305908203125, 4.14013671875, 4.5496826171875, 4.959228515625, 5.3687744140625, 5.7783203125, 6.1878662109375, 6.597412109375, 7.0069580078125, 7.41650390625, 7.8260498046875, 8.235595703125, 8.6451416015625, 9.0546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 12.0, 12.0, 18.0, 16.0, 39.0, 42.0, 65.0, 73.0, 62.0, 80.0, 95.0, 100.0, 95.0, 79.0, 46.0, 48.0, 41.0, 32.0, 11.0, 17.0, 3.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.53125, -9.30157470703125, -9.0718994140625, -8.84222412109375, -8.612548828125, -8.38287353515625, -8.1531982421875, -7.92352294921875, -7.69384765625, -7.46417236328125, -7.2344970703125, -7.00482177734375, -6.775146484375, -6.54547119140625, -6.3157958984375, -6.08612060546875, -5.8564453125, -5.62677001953125, -5.3970947265625, -5.16741943359375, -4.937744140625, -4.70806884765625, -4.4783935546875, -4.24871826171875, -4.01904296875, -3.78936767578125, -3.5596923828125, -3.33001708984375, -3.100341796875, -2.87066650390625, -2.6409912109375, -2.41131591796875, -2.181640625, -1.95196533203125, -1.7222900390625, -1.49261474609375, -1.262939453125, -1.03326416015625, -0.8035888671875, -0.57391357421875, -0.34423828125, -0.11456298828125, 0.1151123046875, 0.34478759765625, 0.574462890625, 0.80413818359375, 1.0338134765625, 1.26348876953125, 1.4931640625, 1.72283935546875, 1.9525146484375, 2.18218994140625, 2.411865234375, 2.64154052734375, 2.8712158203125, 3.10089111328125, 3.33056640625, 3.56024169921875, 3.7899169921875, 4.01959228515625, 4.249267578125, 4.47894287109375, 4.7086181640625, 4.93829345703125, 5.16796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 11.0, 7.0, 15.0, 14.0, 33.0, 38.0, 51.0, 120.0, 158.0, 202.0, 377.0, 721.0, 1308.0, 2497.0, 5076.0, 11579.0, 29422.0, 97706.0, 800214.0, 2979866.0, 186964.0, 46554.0, 16834.0, 7218.0, 3363.0, 1757.0, 870.0, 491.0, 289.0, 188.0, 107.0, 76.0, 37.0, 29.0, 18.0, 17.0, 5.0, 5.0, 15.0, 4.0, 1.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-12.84375, -12.489013671875, -12.13427734375, -11.779541015625, -11.4248046875, -11.070068359375, -10.71533203125, -10.360595703125, -10.005859375, -9.651123046875, -9.29638671875, -8.941650390625, -8.5869140625, -8.232177734375, -7.87744140625, -7.522705078125, -7.16796875, -6.813232421875, -6.45849609375, -6.103759765625, -5.7490234375, -5.394287109375, -5.03955078125, -4.684814453125, -4.330078125, -3.975341796875, -3.62060546875, -3.265869140625, -2.9111328125, -2.556396484375, -2.20166015625, -1.846923828125, -1.4921875, -1.137451171875, -0.78271484375, -0.427978515625, -0.0732421875, 0.281494140625, 0.63623046875, 0.990966796875, 1.345703125, 1.700439453125, 2.05517578125, 2.409912109375, 2.7646484375, 3.119384765625, 3.47412109375, 3.828857421875, 4.18359375, 4.538330078125, 4.89306640625, 5.247802734375, 5.6025390625, 5.957275390625, 6.31201171875, 6.666748046875, 7.021484375, 7.376220703125, 7.73095703125, 8.085693359375, 8.4404296875, 8.795166015625, 9.14990234375, 9.504638671875, 9.859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 3.0, 7.0, 4.0, 16.0, 19.0, 17.0, 25.0, 44.0, 45.0, 77.0, 94.0, 180.0, 321.0, 781.0, 1135.0, 561.0, 247.0, 148.0, 89.0, 62.0, 39.0, 36.0, 25.0, 22.0, 22.0, 7.0, 11.0, 6.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.125, -16.639404296875, -16.15380859375, -15.668212890625, -15.1826171875, -14.697021484375, -14.21142578125, -13.725830078125, -13.240234375, -12.754638671875, -12.26904296875, -11.783447265625, -11.2978515625, -10.812255859375, -10.32666015625, -9.841064453125, -9.35546875, -8.869873046875, -8.38427734375, -7.898681640625, -7.4130859375, -6.927490234375, -6.44189453125, -5.956298828125, -5.470703125, -4.985107421875, -4.49951171875, -4.013916015625, -3.5283203125, -3.042724609375, -2.55712890625, -2.071533203125, -1.5859375, -1.100341796875, -0.61474609375, -0.129150390625, 0.3564453125, 0.842041015625, 1.32763671875, 1.813232421875, 2.298828125, 2.784423828125, 3.27001953125, 3.755615234375, 4.2412109375, 4.726806640625, 5.21240234375, 5.697998046875, 6.18359375, 6.669189453125, 7.15478515625, 7.640380859375, 8.1259765625, 8.611572265625, 9.09716796875, 9.582763671875, 10.068359375, 10.553955078125, 11.03955078125, 11.525146484375, 12.0107421875, 12.496337890625, 12.98193359375, 13.467529296875, 13.953125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 21.0, 63.0, 188.0, 375.0, 253.0, 61.0, 21.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.5716094970703, -154.7948455810547, -146.01806640625, -137.24130249023438, -128.46453857421875, -119.6877670288086, -110.91099548339844, -102.13423156738281, -93.35746002197266, -84.5806884765625, -75.80392456054688, -67.02715301513672, -58.25038528442383, -49.47361755371094, -40.69684600830078, -31.92007827758789, -23.143310546875, -14.366541862487793, -5.589773178100586, 3.1869964599609375, 11.963764190673828, 20.74053192138672, 29.517303466796875, 38.294071197509766, 47.070838928222656, 55.84760665893555, 64.62437438964844, 73.4011459350586, 82.17791748046875, 90.95468139648438, 99.73145294189453, 108.50822448730469, 117.28500366210938, 126.06177520751953, 134.8385467529297, 143.6153106689453, 152.39207458496094, 161.16885375976562, 169.94561767578125, 178.72238159179688, 187.4991455078125, 196.27590942382812, 205.0526885986328, 213.82945251464844, 222.60621643066406, 231.38299560546875, 240.15975952148438, 248.9365234375, 257.71331787109375, 266.4900817871094, 275.266845703125, 284.04364013671875, 292.8204040527344, 301.59716796875, 310.3739318847656, 319.15069580078125, 327.9274597167969, 336.7042236328125, 345.4809875488281, 354.25775146484375, 363.0345458984375, 371.8113098144531, 380.58807373046875, 389.3648376464844, 398.1416015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 2.0, 10.0, 4.0, 4.0, 8.0, 4.0, 9.0, 13.0, 17.0, 17.0, 14.0, 15.0, 11.0, 25.0, 26.0, 30.0, 36.0, 33.0, 41.0, 45.0, 39.0, 57.0, 33.0, 46.0, 44.0, 37.0, 26.0, 44.0, 28.0, 38.0, 28.0, 31.0, 28.0, 21.0, 16.0, 16.0, 15.0, 22.0, 14.0, 10.0, 12.0, 10.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0], "bins": [-58.5560302734375, -56.81324768066406, -55.07046890258789, -53.32769012451172, -51.58490753173828, -49.842124938964844, -48.09934616088867, -46.3565673828125, -44.61378479003906, -42.871002197265625, -41.12822341918945, -39.38544464111328, -37.642662048339844, -35.899879455566406, -34.157100677490234, -32.41432189941406, -30.671539306640625, -28.92875862121582, -27.185977935791016, -25.44319725036621, -23.700416564941406, -21.9576358795166, -20.214855194091797, -18.472074508666992, -16.729293823242188, -14.986513137817383, -13.243732452392578, -11.500951766967773, -9.758171081542969, -8.015390396118164, -6.272609710693359, -4.529829025268555, -2.78704833984375, -1.0442676544189453, 0.6985130310058594, 2.441293716430664, 4.184074401855469, 5.926855087280273, 7.669635772705078, 9.412416458129883, 11.155197143554688, 12.897977828979492, 14.640758514404297, 16.3835391998291, 18.126319885253906, 19.86910057067871, 21.611881256103516, 23.35466194152832, 25.097442626953125, 26.84022331237793, 28.583003997802734, 30.32578468322754, 32.068565368652344, 33.81134796142578, 35.55412673950195, 37.296905517578125, 39.03968811035156, 40.782470703125, 42.52524948120117, 44.268028259277344, 46.01081085205078, 47.75359344482422, 49.49637222290039, 51.23915100097656, 52.98193359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 6.0, 15.0, 23.0, 29.0, 35.0, 55.0, 87.0, 113.0, 165.0, 266.0, 370.0, 681.0, 1184.0, 1929.0, 3563.0, 6737.0, 13792.0, 30517.0, 72033.0, 179951.0, 362059.0, 218626.0, 86504.0, 36036.0, 16215.0, 7828.0, 4073.0, 2226.0, 1278.0, 783.0, 470.0, 305.0, 177.0, 125.0, 88.0, 66.0, 43.0, 30.0, 14.0, 16.0, 7.0, 7.0, 5.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.34375, -9.07373046875, -8.8037109375, -8.53369140625, -8.263671875, -7.99365234375, -7.7236328125, -7.45361328125, -7.18359375, -6.91357421875, -6.6435546875, -6.37353515625, -6.103515625, -5.83349609375, -5.5634765625, -5.29345703125, -5.0234375, -4.75341796875, -4.4833984375, -4.21337890625, -3.943359375, -3.67333984375, -3.4033203125, -3.13330078125, -2.86328125, -2.59326171875, -2.3232421875, -2.05322265625, -1.783203125, -1.51318359375, -1.2431640625, -0.97314453125, -0.703125, -0.43310546875, -0.1630859375, 0.10693359375, 0.376953125, 0.64697265625, 0.9169921875, 1.18701171875, 1.45703125, 1.72705078125, 1.9970703125, 2.26708984375, 2.537109375, 2.80712890625, 3.0771484375, 3.34716796875, 3.6171875, 3.88720703125, 4.1572265625, 4.42724609375, 4.697265625, 4.96728515625, 5.2373046875, 5.50732421875, 5.77734375, 6.04736328125, 6.3173828125, 6.58740234375, 6.857421875, 7.12744140625, 7.3974609375, 7.66748046875, 7.9375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 8.0, 3.0, 10.0, 11.0, 17.0, 12.0, 21.0, 29.0, 34.0, 19.0, 50.0, 44.0, 43.0, 47.0, 52.0, 66.0, 58.0, 49.0, 66.0, 42.0, 57.0, 48.0, 41.0, 40.0, 17.0, 22.0, 26.0, 16.0, 11.0, 14.0, 6.0, 7.0, 3.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2890625, -5.1397705078125, -4.990478515625, -4.8411865234375, -4.69189453125, -4.5426025390625, -4.393310546875, -4.2440185546875, -4.0947265625, -3.9454345703125, -3.796142578125, -3.6468505859375, -3.49755859375, -3.3482666015625, -3.198974609375, -3.0496826171875, -2.900390625, -2.7510986328125, -2.601806640625, -2.4525146484375, -2.30322265625, -2.1539306640625, -2.004638671875, -1.8553466796875, -1.7060546875, -1.5567626953125, -1.407470703125, -1.2581787109375, -1.10888671875, -0.9595947265625, -0.810302734375, -0.6610107421875, -0.51171875, -0.3624267578125, -0.213134765625, -0.0638427734375, 0.08544921875, 0.2347412109375, 0.384033203125, 0.5333251953125, 0.6826171875, 0.8319091796875, 0.981201171875, 1.1304931640625, 1.27978515625, 1.4290771484375, 1.578369140625, 1.7276611328125, 1.876953125, 2.0262451171875, 2.175537109375, 2.3248291015625, 2.47412109375, 2.6234130859375, 2.772705078125, 2.9219970703125, 3.0712890625, 3.2205810546875, 3.369873046875, 3.5191650390625, 3.66845703125, 3.8177490234375, 3.967041015625, 4.1163330078125, 4.265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 0.0, 4.0, 4.0, 6.0, 13.0, 15.0, 21.0, 20.0, 49.0, 57.0, 106.0, 139.0, 211.0, 321.0, 546.0, 926.0, 1848.0, 4068.0, 11115.0, 44209.0, 289898.0, 587500.0, 79562.0, 17219.0, 5370.0, 2310.0, 1149.0, 697.0, 378.0, 253.0, 175.0, 108.0, 89.0, 52.0, 39.0, 20.0, 13.0, 10.0, 8.0, 14.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-17.078125, -16.578369140625, -16.07861328125, -15.578857421875, -15.0791015625, -14.579345703125, -14.07958984375, -13.579833984375, -13.080078125, -12.580322265625, -12.08056640625, -11.580810546875, -11.0810546875, -10.581298828125, -10.08154296875, -9.581787109375, -9.08203125, -8.582275390625, -8.08251953125, -7.582763671875, -7.0830078125, -6.583251953125, -6.08349609375, -5.583740234375, -5.083984375, -4.584228515625, -4.08447265625, -3.584716796875, -3.0849609375, -2.585205078125, -2.08544921875, -1.585693359375, -1.0859375, -0.586181640625, -0.08642578125, 0.413330078125, 0.9130859375, 1.412841796875, 1.91259765625, 2.412353515625, 2.912109375, 3.411865234375, 3.91162109375, 4.411376953125, 4.9111328125, 5.410888671875, 5.91064453125, 6.410400390625, 6.91015625, 7.409912109375, 7.90966796875, 8.409423828125, 8.9091796875, 9.408935546875, 9.90869140625, 10.408447265625, 10.908203125, 11.407958984375, 11.90771484375, 12.407470703125, 12.9072265625, 13.406982421875, 13.90673828125, 14.406494140625, 14.90625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 5.0, 14.0, 13.0, 16.0, 26.0, 23.0, 23.0, 22.0, 41.0, 49.0, 49.0, 56.0, 61.0, 50.0, 62.0, 60.0, 51.0, 44.0, 49.0, 39.0, 52.0, 32.0, 30.0, 28.0, 24.0, 23.0, 15.0, 11.0, 2.0, 1.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-26.859375, -26.120361328125, -25.38134765625, -24.642333984375, -23.9033203125, -23.164306640625, -22.42529296875, -21.686279296875, -20.947265625, -20.208251953125, -19.46923828125, -18.730224609375, -17.9912109375, -17.252197265625, -16.51318359375, -15.774169921875, -15.03515625, -14.296142578125, -13.55712890625, -12.818115234375, -12.0791015625, -11.340087890625, -10.60107421875, -9.862060546875, -9.123046875, -8.384033203125, -7.64501953125, -6.906005859375, -6.1669921875, -5.427978515625, -4.68896484375, -3.949951171875, -3.2109375, -2.471923828125, -1.73291015625, -0.993896484375, -0.2548828125, 0.484130859375, 1.22314453125, 1.962158203125, 2.701171875, 3.440185546875, 4.17919921875, 4.918212890625, 5.6572265625, 6.396240234375, 7.13525390625, 7.874267578125, 8.61328125, 9.352294921875, 10.09130859375, 10.830322265625, 11.5693359375, 12.308349609375, 13.04736328125, 13.786376953125, 14.525390625, 15.264404296875, 16.00341796875, 16.742431640625, 17.4814453125, 18.220458984375, 18.95947265625, 19.698486328125, 20.4375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 6.0, 9.0, 10.0, 16.0, 28.0, 73.0, 156.0, 423.0, 1842.0, 24613.0, 968193.0, 49795.0, 2574.0, 507.0, 153.0, 86.0, 32.0, 20.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.87939453125, -13.3369140625, -12.79443359375, -12.251953125, -11.70947265625, -11.1669921875, -10.62451171875, -10.08203125, -9.53955078125, -8.9970703125, -8.45458984375, -7.912109375, -7.36962890625, -6.8271484375, -6.28466796875, -5.7421875, -5.19970703125, -4.6572265625, -4.11474609375, -3.572265625, -3.02978515625, -2.4873046875, -1.94482421875, -1.40234375, -0.85986328125, -0.3173828125, 0.22509765625, 0.767578125, 1.31005859375, 1.8525390625, 2.39501953125, 2.9375, 3.47998046875, 4.0224609375, 4.56494140625, 5.107421875, 5.64990234375, 6.1923828125, 6.73486328125, 7.27734375, 7.81982421875, 8.3623046875, 8.90478515625, 9.447265625, 9.98974609375, 10.5322265625, 11.07470703125, 11.6171875, 12.15966796875, 12.7021484375, 13.24462890625, 13.787109375, 14.32958984375, 14.8720703125, 15.41455078125, 15.95703125, 16.49951171875, 17.0419921875, 17.58447265625, 18.126953125, 18.66943359375, 19.2119140625, 19.75439453125, 20.296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 0.0, 3.0, 9.0, 9.0, 6.0, 10.0, 19.0, 16.0, 25.0, 33.0, 42.0, 50.0, 64.0, 79.0, 90.0, 102.0, 96.0, 66.0, 66.0, 51.0, 39.0, 19.0, 15.0, 16.0, 14.0, 8.0, 13.0, 5.0, 5.0, 5.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0010395050048828125, -0.0010071098804473877, -0.0009747147560119629, -0.0009423196315765381, -0.0009099245071411133, -0.0008775293827056885, -0.0008451342582702637, -0.0008127391338348389, -0.0007803440093994141, -0.0007479488849639893, -0.0007155537605285645, -0.0006831586360931396, -0.0006507635116577148, -0.00061836838722229, -0.0005859732627868652, -0.0005535781383514404, -0.0005211830139160156, -0.0004887878894805908, -0.000456392765045166, -0.0004239976406097412, -0.0003916025161743164, -0.0003592073917388916, -0.0003268122673034668, -0.000294417142868042, -0.0002620220184326172, -0.00022962689399719238, -0.00019723176956176758, -0.00016483664512634277, -0.00013244152069091797, -0.00010004639625549316, -6.765127182006836e-05, -3.5256147384643555e-05, -2.86102294921875e-06, 2.9534101486206055e-05, 6.192922592163086e-05, 9.432435035705566e-05, 0.00012671947479248047, 0.00015911459922790527, 0.00019150972366333008, 0.00022390484809875488, 0.0002562999725341797, 0.0002886950969696045, 0.0003210902214050293, 0.0003534853458404541, 0.0003858804702758789, 0.0004182755947113037, 0.0004506707191467285, 0.0004830658435821533, 0.0005154609680175781, 0.0005478560924530029, 0.0005802512168884277, 0.0006126463413238525, 0.0006450414657592773, 0.0006774365901947021, 0.000709831714630127, 0.0007422268390655518, 0.0007746219635009766, 0.0008070170879364014, 0.0008394122123718262, 0.000871807336807251, 0.0009042024612426758, 0.0009365975856781006, 0.0009689927101135254, 0.0010013878345489502, 0.001033782958984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 10.0, 7.0, 8.0, 12.0, 22.0, 28.0, 43.0, 59.0, 91.0, 134.0, 207.0, 376.0, 778.0, 1519.0, 3549.0, 11225.0, 59539.0, 569727.0, 347261.0, 39644.0, 8548.0, 2985.0, 1253.0, 601.0, 351.0, 190.0, 134.0, 84.0, 50.0, 33.0, 25.0, 17.0, 10.0, 5.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.703125, -6.50537109375, -6.3076171875, -6.10986328125, -5.912109375, -5.71435546875, -5.5166015625, -5.31884765625, -5.12109375, -4.92333984375, -4.7255859375, -4.52783203125, -4.330078125, -4.13232421875, -3.9345703125, -3.73681640625, -3.5390625, -3.34130859375, -3.1435546875, -2.94580078125, -2.748046875, -2.55029296875, -2.3525390625, -2.15478515625, -1.95703125, -1.75927734375, -1.5615234375, -1.36376953125, -1.166015625, -0.96826171875, -0.7705078125, -0.57275390625, -0.375, -0.17724609375, 0.0205078125, 0.21826171875, 0.416015625, 0.61376953125, 0.8115234375, 1.00927734375, 1.20703125, 1.40478515625, 1.6025390625, 1.80029296875, 1.998046875, 2.19580078125, 2.3935546875, 2.59130859375, 2.7890625, 2.98681640625, 3.1845703125, 3.38232421875, 3.580078125, 3.77783203125, 3.9755859375, 4.17333984375, 4.37109375, 4.56884765625, 4.7666015625, 4.96435546875, 5.162109375, 5.35986328125, 5.5576171875, 5.75537109375, 5.953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 6.0, 10.0, 10.0, 15.0, 28.0, 39.0, 37.0, 51.0, 55.0, 57.0, 74.0, 84.0, 89.0, 61.0, 77.0, 60.0, 56.0, 35.0, 41.0, 34.0, 17.0, 12.0, 9.0, 9.0, 9.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.46600341796875, -4.2562255859375, -4.04644775390625, -3.836669921875, -3.62689208984375, -3.4171142578125, -3.20733642578125, -2.99755859375, -2.78778076171875, -2.5780029296875, -2.36822509765625, -2.158447265625, -1.94866943359375, -1.7388916015625, -1.52911376953125, -1.3193359375, -1.10955810546875, -0.8997802734375, -0.69000244140625, -0.480224609375, -0.27044677734375, -0.0606689453125, 0.14910888671875, 0.35888671875, 0.56866455078125, 0.7784423828125, 0.98822021484375, 1.197998046875, 1.40777587890625, 1.6175537109375, 1.82733154296875, 2.037109375, 2.24688720703125, 2.4566650390625, 2.66644287109375, 2.876220703125, 3.08599853515625, 3.2957763671875, 3.50555419921875, 3.71533203125, 3.92510986328125, 4.1348876953125, 4.34466552734375, 4.554443359375, 4.76422119140625, 4.9739990234375, 5.18377685546875, 5.3935546875, 5.60333251953125, 5.8131103515625, 6.02288818359375, 6.232666015625, 6.44244384765625, 6.6522216796875, 6.86199951171875, 7.07177734375, 7.28155517578125, 7.4913330078125, 7.70111083984375, 7.910888671875, 8.12066650390625, 8.3304443359375, 8.54022216796875, 8.75]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 14.0, 19.0, 64.0, 136.0, 240.0, 265.0, 168.0, 50.0, 25.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.15135192871094, -208.01022338867188, -200.86911010742188, -193.72799682617188, -186.5868682861328, -179.44573974609375, -172.30462646484375, -165.16351318359375, -158.0223846435547, -150.88125610351562, -143.74014282226562, -136.59902954101562, -129.45790100097656, -122.31678009033203, -115.1756591796875, -108.03453826904297, -100.89341735839844, -93.7522964477539, -86.61117553710938, -79.47005462646484, -72.32893371582031, -65.18781280517578, -58.04669189453125, -50.90557098388672, -43.76445007324219, -36.623329162597656, -29.482208251953125, -22.341087341308594, -15.199966430664062, -8.058845520019531, -0.917724609375, 6.223396301269531, 13.364501953125, 20.50562286376953, 27.646743774414062, 34.787864685058594, 41.928985595703125, 49.070106506347656, 56.21122741699219, 63.35234832763672, 70.49346923828125, 77.63459014892578, 84.77571105957031, 91.91683197021484, 99.05795288085938, 106.1990737915039, 113.34019470214844, 120.48131561279297, 127.6224365234375, 134.7635498046875, 141.90467834472656, 149.04580688476562, 156.18692016601562, 163.32803344726562, 170.4691619873047, 177.61029052734375, 184.75140380859375, 191.89251708984375, 199.0336456298828, 206.17477416992188, 213.31588745117188, 220.45700073242188, 227.59812927246094, 234.7392578125, 241.88037109375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 3.0, 4.0, 8.0, 8.0, 6.0, 10.0, 8.0, 15.0, 23.0, 26.0, 30.0, 24.0, 36.0, 29.0, 48.0, 40.0, 46.0, 57.0, 59.0, 61.0, 61.0, 46.0, 44.0, 44.0, 28.0, 33.0, 30.0, 16.0, 17.0, 17.0, 13.0, 18.0, 11.0, 13.0, 14.0, 10.0, 6.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.922603607177734, -60.532447814941406, -58.14229202270508, -55.75213623046875, -53.361976623535156, -50.971824645996094, -48.5816650390625, -46.19150924682617, -43.801353454589844, -41.411197662353516, -39.02104187011719, -36.63088607788086, -34.24073028564453, -31.85057258605957, -29.46041488647461, -27.07025909423828, -24.680103302001953, -22.289947509765625, -19.899791717529297, -17.509634017944336, -15.119478225708008, -12.72932243347168, -10.339165687561035, -7.949008941650391, -5.5588531494140625, -3.168696880340576, -0.7785406112670898, 1.6116156578063965, 4.001771926879883, 6.391927719116211, 8.782084465026855, 11.1722412109375, 13.562400817871094, 15.952556610107422, 18.34271240234375, 20.73287010192871, 23.12302589416504, 25.513181686401367, 27.903339385986328, 30.293495178222656, 32.683650970458984, 35.07380676269531, 37.46396255493164, 39.85411834716797, 42.24427795410156, 44.634429931640625, 47.02458953857422, 49.41474533081055, 51.804901123046875, 54.1950569152832, 56.58521270751953, 58.97536849975586, 61.36552429199219, 63.75568389892578, 66.14583587646484, 68.53599548339844, 70.9261474609375, 73.3163070678711, 75.70645904541016, 78.09661865234375, 80.48677062988281, 82.8769302368164, 85.26708221435547, 87.65724182128906, 90.04740142822266]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 10.0, 8.0, 16.0, 21.0, 29.0, 54.0, 80.0, 166.0, 473.0, 2409.0, 39249.0, 4116515.0, 32155.0, 2212.0, 478.0, 174.0, 87.0, 48.0, 25.0, 19.0, 15.0, 12.0, 7.0, 5.0, 2.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.28125, -29.17919921875, -28.0771484375, -26.97509765625, -25.873046875, -24.77099609375, -23.6689453125, -22.56689453125, -21.46484375, -20.36279296875, -19.2607421875, -18.15869140625, -17.056640625, -15.95458984375, -14.8525390625, -13.75048828125, -12.6484375, -11.54638671875, -10.4443359375, -9.34228515625, -8.240234375, -7.13818359375, -6.0361328125, -4.93408203125, -3.83203125, -2.72998046875, -1.6279296875, -0.52587890625, 0.576171875, 1.67822265625, 2.7802734375, 3.88232421875, 4.984375, 6.08642578125, 7.1884765625, 8.29052734375, 9.392578125, 10.49462890625, 11.5966796875, 12.69873046875, 13.80078125, 14.90283203125, 16.0048828125, 17.10693359375, 18.208984375, 19.31103515625, 20.4130859375, 21.51513671875, 22.6171875, 23.71923828125, 24.8212890625, 25.92333984375, 27.025390625, 28.12744140625, 29.2294921875, 30.33154296875, 31.43359375, 32.53564453125, 33.6376953125, 34.73974609375, 35.841796875, 36.94384765625, 38.0458984375, 39.14794921875, 40.25]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 7.0, 4.0, 14.0, 12.0, 18.0, 19.0, 25.0, 27.0, 36.0, 39.0, 40.0, 63.0, 57.0, 51.0, 54.0, 56.0, 65.0, 64.0, 51.0, 60.0, 36.0, 37.0, 21.0, 25.0, 18.0, 19.0, 15.0, 8.0, 14.0, 8.0, 8.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.4512939453125, -3.308837890625, -3.1663818359375, -3.02392578125, -2.8814697265625, -2.739013671875, -2.5965576171875, -2.4541015625, -2.3116455078125, -2.169189453125, -2.0267333984375, -1.88427734375, -1.7418212890625, -1.599365234375, -1.4569091796875, -1.314453125, -1.1719970703125, -1.029541015625, -0.8870849609375, -0.74462890625, -0.6021728515625, -0.459716796875, -0.3172607421875, -0.1748046875, -0.0323486328125, 0.110107421875, 0.2525634765625, 0.39501953125, 0.5374755859375, 0.679931640625, 0.8223876953125, 0.96484375, 1.1072998046875, 1.249755859375, 1.3922119140625, 1.53466796875, 1.6771240234375, 1.819580078125, 1.9620361328125, 2.1044921875, 2.2469482421875, 2.389404296875, 2.5318603515625, 2.67431640625, 2.8167724609375, 2.959228515625, 3.1016845703125, 3.244140625, 3.3865966796875, 3.529052734375, 3.6715087890625, 3.81396484375, 3.9564208984375, 4.098876953125, 4.2413330078125, 4.3837890625, 4.5262451171875, 4.668701171875, 4.8111572265625, 4.95361328125, 5.0960693359375, 5.238525390625, 5.3809814453125, 5.5234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 7.0, 13.0, 17.0, 25.0, 30.0, 48.0, 90.0, 132.0, 277.0, 615.0, 1391.0, 3673.0, 11113.0, 41599.0, 286109.0, 3565961.0, 229711.0, 37667.0, 10000.0, 3215.0, 1255.0, 566.0, 301.0, 162.0, 81.0, 66.0, 56.0, 29.0, 24.0, 22.0, 10.0, 7.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.640625, -10.22265625, -9.8046875, -9.38671875, -8.96875, -8.55078125, -8.1328125, -7.71484375, -7.296875, -6.87890625, -6.4609375, -6.04296875, -5.625, -5.20703125, -4.7890625, -4.37109375, -3.953125, -3.53515625, -3.1171875, -2.69921875, -2.28125, -1.86328125, -1.4453125, -1.02734375, -0.609375, -0.19140625, 0.2265625, 0.64453125, 1.0625, 1.48046875, 1.8984375, 2.31640625, 2.734375, 3.15234375, 3.5703125, 3.98828125, 4.40625, 4.82421875, 5.2421875, 5.66015625, 6.078125, 6.49609375, 6.9140625, 7.33203125, 7.75, 8.16796875, 8.5859375, 9.00390625, 9.421875, 9.83984375, 10.2578125, 10.67578125, 11.09375, 11.51171875, 11.9296875, 12.34765625, 12.765625, 13.18359375, 13.6015625, 14.01953125, 14.4375, 14.85546875, 15.2734375, 15.69140625, 16.109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 5.0, 5.0, 5.0, 5.0, 10.0, 16.0, 18.0, 23.0, 27.0, 44.0, 87.0, 111.0, 227.0, 462.0, 1123.0, 971.0, 392.0, 185.0, 103.0, 73.0, 46.0, 33.0, 25.0, 24.0, 17.0, 16.0, 7.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.7265625, -11.3060302734375, -10.885498046875, -10.4649658203125, -10.04443359375, -9.6239013671875, -9.203369140625, -8.7828369140625, -8.3623046875, -7.9417724609375, -7.521240234375, -7.1007080078125, -6.68017578125, -6.2596435546875, -5.839111328125, -5.4185791015625, -4.998046875, -4.5775146484375, -4.156982421875, -3.7364501953125, -3.31591796875, -2.8953857421875, -2.474853515625, -2.0543212890625, -1.6337890625, -1.2132568359375, -0.792724609375, -0.3721923828125, 0.04833984375, 0.4688720703125, 0.889404296875, 1.3099365234375, 1.73046875, 2.1510009765625, 2.571533203125, 2.9920654296875, 3.41259765625, 3.8331298828125, 4.253662109375, 4.6741943359375, 5.0947265625, 5.5152587890625, 5.935791015625, 6.3563232421875, 6.77685546875, 7.1973876953125, 7.617919921875, 8.0384521484375, 8.458984375, 8.8795166015625, 9.300048828125, 9.7205810546875, 10.14111328125, 10.5616455078125, 10.982177734375, 11.4027099609375, 11.8232421875, 12.2437744140625, 12.664306640625, 13.0848388671875, 13.50537109375, 13.9259033203125, 14.346435546875, 14.7669677734375, 15.1875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 4.0, 6.0, 8.0, 7.0, 28.0, 55.0, 80.0, 169.0, 215.0, 188.0, 124.0, 52.0, 24.0, 16.0, 16.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.1895294189453, -157.32620239257812, -153.46287536621094, -149.59954833984375, -145.73622131347656, -141.87289428710938, -138.0095672607422, -134.146240234375, -130.28289794921875, -126.41957092285156, -122.55624389648438, -118.69291687011719, -114.82958984375, -110.96626281738281, -107.1029281616211, -103.2396011352539, -99.37628173828125, -95.51295471191406, -91.64962768554688, -87.78630065917969, -83.9229736328125, -80.05964660644531, -76.1963119506836, -72.3329849243164, -68.46965789794922, -64.60633087158203, -60.743003845214844, -56.87967300415039, -53.0163459777832, -49.153018951416016, -45.28968811035156, -41.426361083984375, -37.56304168701172, -33.69971466064453, -29.83638572692871, -25.97305679321289, -22.109729766845703, -18.246402740478516, -14.383073806762695, -10.519744873046875, -6.6564178466796875, -2.7930898666381836, 1.0702381134033203, 4.933566093444824, 8.796894073486328, 12.660221099853516, 16.523550033569336, 20.386878967285156, 24.250205993652344, 28.11353302001953, 31.97686195373535, 35.84019088745117, 39.70351791381836, 43.56684494018555, 47.43017578125, 51.29350280761719, 55.156829833984375, 59.02015686035156, 62.88348388671875, 66.74681091308594, 70.61013793945312, 74.47346496582031, 78.33679962158203, 82.20012664794922, 86.0634536743164]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 8.0, 10.0, 15.0, 12.0, 14.0, 20.0, 23.0, 26.0, 20.0, 31.0, 31.0, 34.0, 34.0, 40.0, 30.0, 52.0, 38.0, 40.0, 52.0, 35.0, 53.0, 48.0, 18.0, 35.0, 40.0, 29.0, 26.0, 29.0, 28.0, 24.0, 12.0, 13.0, 12.0, 7.0, 14.0, 3.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-54.968536376953125, -53.42902755737305, -51.88951873779297, -50.35000991821289, -48.81050109863281, -47.270992279052734, -45.731483459472656, -44.191978454589844, -42.6524658203125, -41.11295700073242, -39.573448181152344, -38.033939361572266, -36.49443054199219, -34.95492172241211, -33.41541290283203, -31.875905990600586, -30.33639907836914, -28.796890258789062, -27.257381439208984, -25.717872619628906, -24.178363800048828, -22.63885498046875, -21.099348068237305, -19.559839248657227, -18.02033042907715, -16.48082160949707, -14.941312789916992, -13.40180492401123, -11.862296104431152, -10.322787284851074, -8.783279418945312, -7.243770599365234, -5.704261779785156, -4.164752960205078, -2.625244617462158, -1.0857362747192383, 0.45377254486083984, 1.993281364440918, 3.5327892303466797, 5.072298049926758, 6.611806869506836, 8.151315689086914, 9.690824508666992, 11.230332374572754, 12.769841194152832, 14.30935001373291, 15.848857879638672, 17.38836669921875, 18.927875518798828, 20.467384338378906, 22.006893157958984, 23.546401977539062, 25.08591079711914, 26.62541961669922, 28.164926528930664, 29.704435348510742, 31.24394416809082, 32.783451080322266, 34.322959899902344, 35.86246871948242, 37.4019775390625, 38.94148635864258, 40.480995178222656, 42.020503997802734, 43.56001281738281]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 12.0, 18.0, 19.0, 22.0, 45.0, 79.0, 106.0, 176.0, 269.0, 407.0, 669.0, 1082.0, 1958.0, 3473.0, 6815.0, 14474.0, 33909.0, 86733.0, 247678.0, 387397.0, 159798.0, 57908.0, 23428.0, 10417.0, 5034.0, 2685.0, 1503.0, 897.0, 572.0, 332.0, 233.0, 140.0, 91.0, 58.0, 30.0, 23.0, 18.0, 11.0, 11.0, 8.0, 9.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.7926025390625, -7.507080078125, -7.2215576171875, -6.93603515625, -6.6505126953125, -6.364990234375, -6.0794677734375, -5.7939453125, -5.5084228515625, -5.222900390625, -4.9373779296875, -4.65185546875, -4.3663330078125, -4.080810546875, -3.7952880859375, -3.509765625, -3.2242431640625, -2.938720703125, -2.6531982421875, -2.36767578125, -2.0821533203125, -1.796630859375, -1.5111083984375, -1.2255859375, -0.9400634765625, -0.654541015625, -0.3690185546875, -0.08349609375, 0.2020263671875, 0.487548828125, 0.7730712890625, 1.05859375, 1.3441162109375, 1.629638671875, 1.9151611328125, 2.20068359375, 2.4862060546875, 2.771728515625, 3.0572509765625, 3.3427734375, 3.6282958984375, 3.913818359375, 4.1993408203125, 4.48486328125, 4.7703857421875, 5.055908203125, 5.3414306640625, 5.626953125, 5.9124755859375, 6.197998046875, 6.4835205078125, 6.76904296875, 7.0545654296875, 7.340087890625, 7.6256103515625, 7.9111328125, 8.1966552734375, 8.482177734375, 8.7677001953125, 9.05322265625, 9.3387451171875, 9.624267578125, 9.9097900390625, 10.1953125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 6.0, 7.0, 7.0, 8.0, 12.0, 15.0, 21.0, 23.0, 34.0, 28.0, 23.0, 47.0, 36.0, 49.0, 45.0, 53.0, 61.0, 40.0, 53.0, 49.0, 67.0, 41.0, 44.0, 31.0, 24.0, 26.0, 21.0, 30.0, 18.0, 16.0, 11.0, 11.0, 11.0, 6.0, 6.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.486480712890625, -3.34991455078125, -3.213348388671875, -3.0767822265625, -2.940216064453125, -2.80364990234375, -2.667083740234375, -2.530517578125, -2.393951416015625, -2.25738525390625, -2.120819091796875, -1.9842529296875, -1.847686767578125, -1.71112060546875, -1.574554443359375, -1.43798828125, -1.301422119140625, -1.16485595703125, -1.028289794921875, -0.8917236328125, -0.755157470703125, -0.61859130859375, -0.482025146484375, -0.345458984375, -0.208892822265625, -0.07232666015625, 0.064239501953125, 0.2008056640625, 0.337371826171875, 0.47393798828125, 0.610504150390625, 0.7470703125, 0.883636474609375, 1.02020263671875, 1.156768798828125, 1.2933349609375, 1.429901123046875, 1.56646728515625, 1.703033447265625, 1.839599609375, 1.976165771484375, 2.11273193359375, 2.249298095703125, 2.3858642578125, 2.522430419921875, 2.65899658203125, 2.795562744140625, 2.93212890625, 3.068695068359375, 3.20526123046875, 3.341827392578125, 3.4783935546875, 3.614959716796875, 3.75152587890625, 3.888092041015625, 4.024658203125, 4.161224365234375, 4.29779052734375, 4.434356689453125, 4.5709228515625, 4.707489013671875, 4.84405517578125, 4.980621337890625, 5.1171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 12.0, 8.0, 16.0, 30.0, 47.0, 57.0, 91.0, 131.0, 213.0, 415.0, 755.0, 1691.0, 4272.0, 14540.0, 75309.0, 636933.0, 263413.0, 36768.0, 8362.0, 2807.0, 1244.0, 589.0, 323.0, 172.0, 115.0, 68.0, 48.0, 36.0, 25.0, 13.0, 17.0, 5.0, 8.0, 7.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.3828125, -13.8253173828125, -13.267822265625, -12.7103271484375, -12.15283203125, -11.5953369140625, -11.037841796875, -10.4803466796875, -9.9228515625, -9.3653564453125, -8.807861328125, -8.2503662109375, -7.69287109375, -7.1353759765625, -6.577880859375, -6.0203857421875, -5.462890625, -4.9053955078125, -4.347900390625, -3.7904052734375, -3.23291015625, -2.6754150390625, -2.117919921875, -1.5604248046875, -1.0029296875, -0.4454345703125, 0.112060546875, 0.6695556640625, 1.22705078125, 1.7845458984375, 2.342041015625, 2.8995361328125, 3.45703125, 4.0145263671875, 4.572021484375, 5.1295166015625, 5.68701171875, 6.2445068359375, 6.802001953125, 7.3594970703125, 7.9169921875, 8.4744873046875, 9.031982421875, 9.5894775390625, 10.14697265625, 10.7044677734375, 11.261962890625, 11.8194580078125, 12.376953125, 12.9344482421875, 13.491943359375, 14.0494384765625, 14.60693359375, 15.1644287109375, 15.721923828125, 16.2794189453125, 16.8369140625, 17.3944091796875, 17.951904296875, 18.5093994140625, 19.06689453125, 19.6243896484375, 20.181884765625, 20.7393798828125, 21.296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 6.0, 6.0, 7.0, 14.0, 14.0, 30.0, 25.0, 38.0, 47.0, 50.0, 87.0, 62.0, 70.0, 60.0, 77.0, 62.0, 71.0, 61.0, 38.0, 37.0, 36.0, 19.0, 22.0, 12.0, 15.0, 12.0, 4.0, 6.0, 3.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.750244140625, -21.95361328125, -21.156982421875, -20.3603515625, -19.563720703125, -18.76708984375, -17.970458984375, -17.173828125, -16.377197265625, -15.58056640625, -14.783935546875, -13.9873046875, -13.190673828125, -12.39404296875, -11.597412109375, -10.80078125, -10.004150390625, -9.20751953125, -8.410888671875, -7.6142578125, -6.817626953125, -6.02099609375, -5.224365234375, -4.427734375, -3.631103515625, -2.83447265625, -2.037841796875, -1.2412109375, -0.444580078125, 0.35205078125, 1.148681640625, 1.9453125, 2.741943359375, 3.53857421875, 4.335205078125, 5.1318359375, 5.928466796875, 6.72509765625, 7.521728515625, 8.318359375, 9.114990234375, 9.91162109375, 10.708251953125, 11.5048828125, 12.301513671875, 13.09814453125, 13.894775390625, 14.69140625, 15.488037109375, 16.28466796875, 17.081298828125, 17.8779296875, 18.674560546875, 19.47119140625, 20.267822265625, 21.064453125, 21.861083984375, 22.65771484375, 23.454345703125, 24.2509765625, 25.047607421875, 25.84423828125, 26.640869140625, 27.4375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 9.0, 6.0, 14.0, 13.0, 13.0, 15.0, 26.0, 71.0, 84.0, 215.0, 430.0, 1151.0, 4628.0, 44070.0, 908497.0, 80852.0, 5951.0, 1505.0, 505.0, 212.0, 115.0, 71.0, 32.0, 19.0, 14.0, 13.0, 6.0, 2.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-12.75, -12.370361328125, -11.99072265625, -11.611083984375, -11.2314453125, -10.851806640625, -10.47216796875, -10.092529296875, -9.712890625, -9.333251953125, -8.95361328125, -8.573974609375, -8.1943359375, -7.814697265625, -7.43505859375, -7.055419921875, -6.67578125, -6.296142578125, -5.91650390625, -5.536865234375, -5.1572265625, -4.777587890625, -4.39794921875, -4.018310546875, -3.638671875, -3.259033203125, -2.87939453125, -2.499755859375, -2.1201171875, -1.740478515625, -1.36083984375, -0.981201171875, -0.6015625, -0.221923828125, 0.15771484375, 0.537353515625, 0.9169921875, 1.296630859375, 1.67626953125, 2.055908203125, 2.435546875, 2.815185546875, 3.19482421875, 3.574462890625, 3.9541015625, 4.333740234375, 4.71337890625, 5.093017578125, 5.47265625, 5.852294921875, 6.23193359375, 6.611572265625, 6.9912109375, 7.370849609375, 7.75048828125, 8.130126953125, 8.509765625, 8.889404296875, 9.26904296875, 9.648681640625, 10.0283203125, 10.407958984375, 10.78759765625, 11.167236328125, 11.546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 10.0, 9.0, 14.0, 17.0, 20.0, 21.0, 55.0, 58.0, 90.0, 92.0, 113.0, 96.0, 94.0, 64.0, 72.0, 48.0, 37.0, 16.0, 13.0, 9.0, 10.0, 7.0, 4.0, 5.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012416839599609375, -0.0012016892433166504, -0.0011616945266723633, -0.0011216998100280762, -0.001081705093383789, -0.001041710376739502, -0.0010017156600952148, -0.0009617209434509277, -0.0009217262268066406, -0.0008817315101623535, -0.0008417367935180664, -0.0008017420768737793, -0.0007617473602294922, -0.0007217526435852051, -0.000681757926940918, -0.0006417632102966309, -0.0006017684936523438, -0.0005617737770080566, -0.0005217790603637695, -0.0004817843437194824, -0.0004417896270751953, -0.0004017949104309082, -0.0003618001937866211, -0.000321805477142334, -0.0002818107604980469, -0.00024181604385375977, -0.00020182132720947266, -0.00016182661056518555, -0.00012183189392089844, -8.183717727661133e-05, -4.184246063232422e-05, -1.8477439880371094e-06, 3.814697265625e-05, 7.814168930053711e-05, 0.00011813640594482422, 0.00015813112258911133, 0.00019812583923339844, 0.00023812055587768555, 0.00027811527252197266, 0.00031810998916625977, 0.0003581047058105469, 0.000398099422454834, 0.0004380941390991211, 0.0004780888557434082, 0.0005180835723876953, 0.0005580782890319824, 0.0005980730056762695, 0.0006380677223205566, 0.0006780624389648438, 0.0007180571556091309, 0.000758051872253418, 0.0007980465888977051, 0.0008380413055419922, 0.0008780360221862793, 0.0009180307388305664, 0.0009580254554748535, 0.0009980201721191406, 0.0010380148887634277, 0.0010780096054077148, 0.001118004322052002, 0.001157999038696289, 0.0011979937553405762, 0.0012379884719848633, 0.0012779831886291504, 0.0013179779052734375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 3.0, 6.0, 6.0, 9.0, 13.0, 24.0, 37.0, 68.0, 141.0, 262.0, 554.0, 1847.0, 8759.0, 194142.0, 817727.0, 20282.0, 3019.0, 914.0, 358.0, 171.0, 76.0, 45.0, 26.0, 20.0, 14.0, 8.0, 11.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.375, -13.977783203125, -13.58056640625, -13.183349609375, -12.7861328125, -12.388916015625, -11.99169921875, -11.594482421875, -11.197265625, -10.800048828125, -10.40283203125, -10.005615234375, -9.6083984375, -9.211181640625, -8.81396484375, -8.416748046875, -8.01953125, -7.622314453125, -7.22509765625, -6.827880859375, -6.4306640625, -6.033447265625, -5.63623046875, -5.239013671875, -4.841796875, -4.444580078125, -4.04736328125, -3.650146484375, -3.2529296875, -2.855712890625, -2.45849609375, -2.061279296875, -1.6640625, -1.266845703125, -0.86962890625, -0.472412109375, -0.0751953125, 0.322021484375, 0.71923828125, 1.116455078125, 1.513671875, 1.910888671875, 2.30810546875, 2.705322265625, 3.1025390625, 3.499755859375, 3.89697265625, 4.294189453125, 4.69140625, 5.088623046875, 5.48583984375, 5.883056640625, 6.2802734375, 6.677490234375, 7.07470703125, 7.471923828125, 7.869140625, 8.266357421875, 8.66357421875, 9.060791015625, 9.4580078125, 9.855224609375, 10.25244140625, 10.649658203125, 11.046875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 9.0, 14.0, 14.0, 18.0, 37.0, 34.0, 59.0, 51.0, 70.0, 89.0, 77.0, 108.0, 98.0, 70.0, 63.0, 50.0, 28.0, 25.0, 27.0, 10.0, 9.0, 8.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4765625, -6.27899169921875, -6.0814208984375, -5.88385009765625, -5.686279296875, -5.48870849609375, -5.2911376953125, -5.09356689453125, -4.89599609375, -4.69842529296875, -4.5008544921875, -4.30328369140625, -4.105712890625, -3.90814208984375, -3.7105712890625, -3.51300048828125, -3.3154296875, -3.11785888671875, -2.9202880859375, -2.72271728515625, -2.525146484375, -2.32757568359375, -2.1300048828125, -1.93243408203125, -1.73486328125, -1.53729248046875, -1.3397216796875, -1.14215087890625, -0.944580078125, -0.74700927734375, -0.5494384765625, -0.35186767578125, -0.154296875, 0.04327392578125, 0.2408447265625, 0.43841552734375, 0.635986328125, 0.83355712890625, 1.0311279296875, 1.22869873046875, 1.42626953125, 1.62384033203125, 1.8214111328125, 2.01898193359375, 2.216552734375, 2.41412353515625, 2.6116943359375, 2.80926513671875, 3.0068359375, 3.20440673828125, 3.4019775390625, 3.59954833984375, 3.797119140625, 3.99468994140625, 4.1922607421875, 4.38983154296875, 4.58740234375, 4.78497314453125, 4.9825439453125, 5.18011474609375, 5.377685546875, 5.57525634765625, 5.7728271484375, 5.97039794921875, 6.16796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 9.0, 23.0, 69.0, 148.0, 302.0, 277.0, 117.0, 38.0, 13.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-232.25192260742188, -225.405517578125, -218.55911254882812, -211.71270751953125, -204.86630249023438, -198.0198974609375, -191.17349243164062, -184.32708740234375, -177.48068237304688, -170.63427734375, -163.78787231445312, -156.94146728515625, -150.09506225585938, -143.2486572265625, -136.40225219726562, -129.55584716796875, -122.70942687988281, -115.86302185058594, -109.01661682128906, -102.17021179199219, -95.32380676269531, -88.47740173339844, -81.63098907470703, -74.78458404541016, -67.93817901611328, -61.091773986816406, -54.24536895751953, -47.39896011352539, -40.552555084228516, -33.70615005493164, -26.8597412109375, -20.013336181640625, -13.16693115234375, -6.320525169372559, 0.5258808135986328, 7.372287750244141, 14.218692779541016, 21.06509780883789, 27.91150665283203, 34.757911682128906, 41.60431671142578, 48.450721740722656, 55.29712677001953, 62.14353561401367, 68.98994445800781, 75.83634948730469, 82.68275451660156, 89.52915954589844, 96.37556457519531, 103.22196960449219, 110.06837463378906, 116.91477966308594, 123.76118469238281, 130.6075897216797, 137.45401000976562, 144.3004150390625, 151.14682006835938, 157.99322509765625, 164.83963012695312, 171.68603515625, 178.53244018554688, 185.37884521484375, 192.22525024414062, 199.0716552734375, 205.91806030273438]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 10.0, 10.0, 14.0, 17.0, 24.0, 20.0, 35.0, 45.0, 43.0, 58.0, 66.0, 69.0, 74.0, 83.0, 68.0, 73.0, 53.0, 43.0, 47.0, 28.0, 30.0, 23.0, 19.0, 11.0, 10.0, 3.0, 6.0, 9.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-134.73545837402344, -131.5338592529297, -128.332275390625, -125.13067626953125, -121.9290771484375, -118.72747802734375, -115.52588653564453, -112.32429504394531, -109.12269592285156, -105.92109680175781, -102.7195053100586, -99.51791381835938, -96.31631469726562, -93.11471557617188, -89.91312408447266, -86.71153259277344, -83.50993347167969, -80.30833435058594, -77.10674285888672, -73.9051513671875, -70.70355224609375, -67.501953125, -64.30036163330078, -61.0987663269043, -57.89717102050781, -54.69557571411133, -51.493980407714844, -48.29238510131836, -45.090789794921875, -41.88919448852539, -38.687599182128906, -35.48600387573242, -32.28441619873047, -29.082820892333984, -25.8812255859375, -22.679630279541016, -19.47803497314453, -16.276439666748047, -13.074844360351562, -9.873249053955078, -6.671653747558594, -3.4700584411621094, -0.268463134765625, 2.9331321716308594, 6.134727478027344, 9.336322784423828, 12.537918090820312, 15.739513397216797, 18.94110870361328, 22.142704010009766, 25.34429931640625, 28.545894622802734, 31.74748992919922, 34.9490852355957, 38.15068054199219, 41.35227584838867, 44.553871154785156, 47.75546646118164, 50.957061767578125, 54.15865707397461, 57.360252380371094, 60.56184768676758, 63.76344299316406, 66.96504211425781, 70.16663360595703]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 28.0, 34.0, 42.0, 79.0, 125.0, 241.0, 473.0, 898.0, 2119.0, 5005.0, 13577.0, 44691.0, 213656.0, 1983772.0, 1685998.0, 183156.0, 39602.0, 12278.0, 4707.0, 1958.0, 882.0, 444.0, 208.0, 114.0, 68.0, 32.0, 32.0, 15.0, 9.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.77734375, -6.57171630859375, -6.3660888671875, -6.16046142578125, -5.954833984375, -5.74920654296875, -5.5435791015625, -5.33795166015625, -5.13232421875, -4.92669677734375, -4.7210693359375, -4.51544189453125, -4.309814453125, -4.10418701171875, -3.8985595703125, -3.69293212890625, -3.4873046875, -3.28167724609375, -3.0760498046875, -2.87042236328125, -2.664794921875, -2.45916748046875, -2.2535400390625, -2.04791259765625, -1.84228515625, -1.63665771484375, -1.4310302734375, -1.22540283203125, -1.019775390625, -0.81414794921875, -0.6085205078125, -0.40289306640625, -0.197265625, 0.00836181640625, 0.2139892578125, 0.41961669921875, 0.625244140625, 0.83087158203125, 1.0364990234375, 1.24212646484375, 1.44775390625, 1.65338134765625, 1.8590087890625, 2.06463623046875, 2.270263671875, 2.47589111328125, 2.6815185546875, 2.88714599609375, 3.0927734375, 3.29840087890625, 3.5040283203125, 3.70965576171875, 3.915283203125, 4.12091064453125, 4.3265380859375, 4.53216552734375, 4.73779296875, 4.94342041015625, 5.1490478515625, 5.35467529296875, 5.560302734375, 5.76593017578125, 5.9715576171875, 6.17718505859375, 6.3828125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 8.0, 15.0, 29.0, 28.0, 37.0, 67.0, 65.0, 67.0, 60.0, 92.0, 91.0, 81.0, 81.0, 74.0, 47.0, 52.0, 33.0, 28.0, 12.0, 9.0, 13.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9609375, -8.7430419921875, -8.525146484375, -8.3072509765625, -8.08935546875, -7.8714599609375, -7.653564453125, -7.4356689453125, -7.2177734375, -6.9998779296875, -6.781982421875, -6.5640869140625, -6.34619140625, -6.1282958984375, -5.910400390625, -5.6925048828125, -5.474609375, -5.2567138671875, -5.038818359375, -4.8209228515625, -4.60302734375, -4.3851318359375, -4.167236328125, -3.9493408203125, -3.7314453125, -3.5135498046875, -3.295654296875, -3.0777587890625, -2.85986328125, -2.6419677734375, -2.424072265625, -2.2061767578125, -1.98828125, -1.7703857421875, -1.552490234375, -1.3345947265625, -1.11669921875, -0.8988037109375, -0.680908203125, -0.4630126953125, -0.2451171875, -0.0272216796875, 0.190673828125, 0.4085693359375, 0.62646484375, 0.8443603515625, 1.062255859375, 1.2801513671875, 1.498046875, 1.7159423828125, 1.933837890625, 2.1517333984375, 2.36962890625, 2.5875244140625, 2.805419921875, 3.0233154296875, 3.2412109375, 3.4591064453125, 3.677001953125, 3.8948974609375, 4.11279296875, 4.3306884765625, 4.548583984375, 4.7664794921875, 4.984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 10.0, 9.0, 9.0, 17.0, 24.0, 30.0, 40.0, 69.0, 115.0, 189.0, 357.0, 727.0, 1596.0, 4215.0, 12935.0, 53957.0, 392717.0, 3298953.0, 359055.0, 50514.0, 11892.0, 3720.0, 1487.0, 712.0, 362.0, 231.0, 114.0, 83.0, 51.0, 31.0, 16.0, 13.0, 9.0, 7.0, 3.0, 6.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.90625, -10.559814453125, -10.21337890625, -9.866943359375, -9.5205078125, -9.174072265625, -8.82763671875, -8.481201171875, -8.134765625, -7.788330078125, -7.44189453125, -7.095458984375, -6.7490234375, -6.402587890625, -6.05615234375, -5.709716796875, -5.36328125, -5.016845703125, -4.67041015625, -4.323974609375, -3.9775390625, -3.631103515625, -3.28466796875, -2.938232421875, -2.591796875, -2.245361328125, -1.89892578125, -1.552490234375, -1.2060546875, -0.859619140625, -0.51318359375, -0.166748046875, 0.1796875, 0.526123046875, 0.87255859375, 1.218994140625, 1.5654296875, 1.911865234375, 2.25830078125, 2.604736328125, 2.951171875, 3.297607421875, 3.64404296875, 3.990478515625, 4.3369140625, 4.683349609375, 5.02978515625, 5.376220703125, 5.72265625, 6.069091796875, 6.41552734375, 6.761962890625, 7.1083984375, 7.454833984375, 7.80126953125, 8.147705078125, 8.494140625, 8.840576171875, 9.18701171875, 9.533447265625, 9.8798828125, 10.226318359375, 10.57275390625, 10.919189453125, 11.265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 1.0, 6.0, 5.0, 10.0, 9.0, 11.0, 18.0, 12.0, 33.0, 45.0, 60.0, 85.0, 121.0, 211.0, 324.0, 572.0, 814.0, 660.0, 406.0, 212.0, 130.0, 91.0, 63.0, 61.0, 26.0, 31.0, 22.0, 12.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.504150390625, -10.09423828125, -9.684326171875, -9.2744140625, -8.864501953125, -8.45458984375, -8.044677734375, -7.634765625, -7.224853515625, -6.81494140625, -6.405029296875, -5.9951171875, -5.585205078125, -5.17529296875, -4.765380859375, -4.35546875, -3.945556640625, -3.53564453125, -3.125732421875, -2.7158203125, -2.305908203125, -1.89599609375, -1.486083984375, -1.076171875, -0.666259765625, -0.25634765625, 0.153564453125, 0.5634765625, 0.973388671875, 1.38330078125, 1.793212890625, 2.203125, 2.613037109375, 3.02294921875, 3.432861328125, 3.8427734375, 4.252685546875, 4.66259765625, 5.072509765625, 5.482421875, 5.892333984375, 6.30224609375, 6.712158203125, 7.1220703125, 7.531982421875, 7.94189453125, 8.351806640625, 8.76171875, 9.171630859375, 9.58154296875, 9.991455078125, 10.4013671875, 10.811279296875, 11.22119140625, 11.631103515625, 12.041015625, 12.450927734375, 12.86083984375, 13.270751953125, 13.6806640625, 14.090576171875, 14.50048828125, 14.910400390625, 15.3203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 10.0, 28.0, 62.0, 159.0, 321.0, 247.0, 101.0, 29.0, 17.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.401123046875, -199.29710388183594, -193.19309997558594, -187.08908081054688, -180.98507690429688, -174.8810577392578, -168.77703857421875, -162.67303466796875, -156.56903076171875, -150.4650115966797, -144.3610076904297, -138.25698852539062, -132.15298461914062, -126.04896545410156, -119.94495391845703, -113.8409423828125, -107.73692321777344, -101.6329116821289, -95.52890014648438, -89.42488098144531, -83.32087707519531, -77.21685791015625, -71.11284637451172, -65.00883483886719, -58.904823303222656, -52.800811767578125, -46.696800231933594, -40.5927848815918, -34.488773345947266, -28.384761810302734, -22.280746459960938, -16.176734924316406, -10.072738647460938, -3.96872615814209, 2.135286331176758, 8.239299774169922, 14.343311309814453, 20.447322845458984, 26.55133819580078, 32.65534973144531, 38.759361267089844, 44.863372802734375, 50.967384338378906, 57.0713996887207, 63.175411224365234, 69.2794189453125, 75.38343811035156, 81.4874496459961, 87.59146118164062, 93.69547271728516, 99.79948425292969, 105.90350341796875, 112.00750732421875, 118.11152648925781, 124.21553802490234, 130.31954956054688, 136.42355346679688, 142.52757263183594, 148.63157653808594, 154.735595703125, 160.839599609375, 166.94361877441406, 173.04763793945312, 179.15164184570312, 185.2556610107422]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 10.0, 13.0, 16.0, 20.0, 24.0, 25.0, 25.0, 30.0, 27.0, 35.0, 47.0, 51.0, 37.0, 51.0, 46.0, 54.0, 66.0, 50.0, 64.0, 37.0, 44.0, 29.0, 26.0, 34.0, 24.0, 20.0, 21.0, 17.0, 14.0, 7.0, 8.0, 6.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-74.07620239257812, -72.036376953125, -69.99654388427734, -67.95671844482422, -65.91688537597656, -63.87705993652344, -61.83723068237305, -59.797401428222656, -57.75757598876953, -55.71774673461914, -53.67791748046875, -51.638092041015625, -49.598262786865234, -47.558433532714844, -45.51860427856445, -43.47877502441406, -41.43894577026367, -39.39911651611328, -37.35928726196289, -35.3194580078125, -33.279632568359375, -31.239803314208984, -29.199974060058594, -27.160144805908203, -25.120317459106445, -23.080488204956055, -21.040660858154297, -19.000831604003906, -16.961002349853516, -14.921175003051758, -12.881345748901367, -10.841517448425293, -8.801689147949219, -6.7618608474731445, -4.722032070159912, -2.6822032928466797, -0.6423749923706055, 1.3974533081054688, 3.4372825622558594, 5.477110862731934, 7.516939163208008, 9.556767463684082, 11.596595764160156, 13.636425018310547, 15.676253318786621, 17.716081619262695, 19.755910873413086, 21.795738220214844, 23.835567474365234, 25.875396728515625, 27.915224075317383, 29.955053329467773, 31.99488067626953, 34.03470993041992, 36.07453918457031, 38.1143684387207, 40.154197692871094, 42.194026947021484, 44.233856201171875, 46.273681640625, 48.31351089477539, 50.35334014892578, 52.39316940307617, 54.43299865722656, 56.47282409667969]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 4.0, 6.0, 8.0, 21.0, 13.0, 25.0, 33.0, 40.0, 56.0, 103.0, 136.0, 215.0, 346.0, 542.0, 843.0, 1525.0, 2638.0, 5082.0, 9656.0, 19202.0, 38868.0, 79229.0, 162595.0, 292990.0, 220266.0, 107316.0, 52659.0, 26001.0, 13026.0, 6688.0, 3469.0, 1935.0, 1139.0, 689.0, 406.0, 246.0, 162.0, 106.0, 92.0, 35.0, 35.0, 32.0, 19.0, 15.0, 8.0, 9.0, 8.0, 5.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0], "bins": [-6.68359375, -6.4853515625, -6.287109375, -6.0888671875, -5.890625, -5.6923828125, -5.494140625, -5.2958984375, -5.09765625, -4.8994140625, -4.701171875, -4.5029296875, -4.3046875, -4.1064453125, -3.908203125, -3.7099609375, -3.51171875, -3.3134765625, -3.115234375, -2.9169921875, -2.71875, -2.5205078125, -2.322265625, -2.1240234375, -1.92578125, -1.7275390625, -1.529296875, -1.3310546875, -1.1328125, -0.9345703125, -0.736328125, -0.5380859375, -0.33984375, -0.1416015625, 0.056640625, 0.2548828125, 0.453125, 0.6513671875, 0.849609375, 1.0478515625, 1.24609375, 1.4443359375, 1.642578125, 1.8408203125, 2.0390625, 2.2373046875, 2.435546875, 2.6337890625, 2.83203125, 3.0302734375, 3.228515625, 3.4267578125, 3.625, 3.8232421875, 4.021484375, 4.2197265625, 4.41796875, 4.6162109375, 4.814453125, 5.0126953125, 5.2109375, 5.4091796875, 5.607421875, 5.8056640625, 6.00390625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 4.0, 7.0, 18.0, 13.0, 16.0, 16.0, 30.0, 36.0, 42.0, 51.0, 40.0, 53.0, 71.0, 72.0, 69.0, 70.0, 67.0, 60.0, 56.0, 44.0, 41.0, 29.0, 29.0, 13.0, 12.0, 13.0, 13.0, 6.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.34765625, -7.177642822265625, -7.00762939453125, -6.837615966796875, -6.6676025390625, -6.497589111328125, -6.32757568359375, -6.157562255859375, -5.987548828125, -5.817535400390625, -5.64752197265625, -5.477508544921875, -5.3074951171875, -5.137481689453125, -4.96746826171875, -4.797454833984375, -4.62744140625, -4.457427978515625, -4.28741455078125, -4.117401123046875, -3.9473876953125, -3.777374267578125, -3.60736083984375, -3.437347412109375, -3.267333984375, -3.097320556640625, -2.92730712890625, -2.757293701171875, -2.5872802734375, -2.417266845703125, -2.24725341796875, -2.077239990234375, -1.9072265625, -1.737213134765625, -1.56719970703125, -1.397186279296875, -1.2271728515625, -1.057159423828125, -0.88714599609375, -0.717132568359375, -0.547119140625, -0.377105712890625, -0.20709228515625, -0.037078857421875, 0.1329345703125, 0.302947998046875, 0.47296142578125, 0.642974853515625, 0.81298828125, 0.983001708984375, 1.15301513671875, 1.323028564453125, 1.4930419921875, 1.663055419921875, 1.83306884765625, 2.003082275390625, 2.173095703125, 2.343109130859375, 2.51312255859375, 2.683135986328125, 2.8531494140625, 3.023162841796875, 3.19317626953125, 3.363189697265625, 3.533203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 9.0, 23.0, 25.0, 31.0, 35.0, 54.0, 67.0, 104.0, 133.0, 186.0, 278.0, 364.0, 534.0, 779.0, 1314.0, 2213.0, 4562.0, 12163.0, 47834.0, 271652.0, 588167.0, 85530.0, 18777.0, 6266.0, 2796.0, 1646.0, 999.0, 591.0, 395.0, 270.0, 210.0, 158.0, 114.0, 74.0, 42.0, 33.0, 29.0, 23.0, 7.0, 11.0, 9.0, 6.0, 8.0, 3.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.421875, -11.0015869140625, -10.581298828125, -10.1610107421875, -9.74072265625, -9.3204345703125, -8.900146484375, -8.4798583984375, -8.0595703125, -7.6392822265625, -7.218994140625, -6.7987060546875, -6.37841796875, -5.9581298828125, -5.537841796875, -5.1175537109375, -4.697265625, -4.2769775390625, -3.856689453125, -3.4364013671875, -3.01611328125, -2.5958251953125, -2.175537109375, -1.7552490234375, -1.3349609375, -0.9146728515625, -0.494384765625, -0.0740966796875, 0.34619140625, 0.7664794921875, 1.186767578125, 1.6070556640625, 2.02734375, 2.4476318359375, 2.867919921875, 3.2882080078125, 3.70849609375, 4.1287841796875, 4.549072265625, 4.9693603515625, 5.3896484375, 5.8099365234375, 6.230224609375, 6.6505126953125, 7.07080078125, 7.4910888671875, 7.911376953125, 8.3316650390625, 8.751953125, 9.1722412109375, 9.592529296875, 10.0128173828125, 10.43310546875, 10.8533935546875, 11.273681640625, 11.6939697265625, 12.1142578125, 12.5345458984375, 12.954833984375, 13.3751220703125, 13.79541015625, 14.2156982421875, 14.635986328125, 15.0562744140625, 15.4765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 5.0, 3.0, 13.0, 17.0, 24.0, 22.0, 15.0, 40.0, 37.0, 53.0, 63.0, 50.0, 77.0, 65.0, 65.0, 80.0, 56.0, 55.0, 57.0, 39.0, 43.0, 36.0, 18.0, 16.0, 13.0, 11.0, 9.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.4375, -20.61376953125, -19.7900390625, -18.96630859375, -18.142578125, -17.31884765625, -16.4951171875, -15.67138671875, -14.84765625, -14.02392578125, -13.2001953125, -12.37646484375, -11.552734375, -10.72900390625, -9.9052734375, -9.08154296875, -8.2578125, -7.43408203125, -6.6103515625, -5.78662109375, -4.962890625, -4.13916015625, -3.3154296875, -2.49169921875, -1.66796875, -0.84423828125, -0.0205078125, 0.80322265625, 1.626953125, 2.45068359375, 3.2744140625, 4.09814453125, 4.921875, 5.74560546875, 6.5693359375, 7.39306640625, 8.216796875, 9.04052734375, 9.8642578125, 10.68798828125, 11.51171875, 12.33544921875, 13.1591796875, 13.98291015625, 14.806640625, 15.63037109375, 16.4541015625, 17.27783203125, 18.1015625, 18.92529296875, 19.7490234375, 20.57275390625, 21.396484375, 22.22021484375, 23.0439453125, 23.86767578125, 24.69140625, 25.51513671875, 26.3388671875, 27.16259765625, 27.986328125, 28.81005859375, 29.6337890625, 30.45751953125, 31.28125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 16.0, 30.0, 67.0, 193.0, 881.0, 9316.0, 972112.0, 63269.0, 2079.0, 369.0, 117.0, 41.0, 11.0, 12.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.7578125, -15.1451416015625, -14.532470703125, -13.9197998046875, -13.30712890625, -12.6944580078125, -12.081787109375, -11.4691162109375, -10.8564453125, -10.2437744140625, -9.631103515625, -9.0184326171875, -8.40576171875, -7.7930908203125, -7.180419921875, -6.5677490234375, -5.955078125, -5.3424072265625, -4.729736328125, -4.1170654296875, -3.50439453125, -2.8917236328125, -2.279052734375, -1.6663818359375, -1.0537109375, -0.4410400390625, 0.171630859375, 0.7843017578125, 1.39697265625, 2.0096435546875, 2.622314453125, 3.2349853515625, 3.84765625, 4.4603271484375, 5.072998046875, 5.6856689453125, 6.29833984375, 6.9110107421875, 7.523681640625, 8.1363525390625, 8.7490234375, 9.3616943359375, 9.974365234375, 10.5870361328125, 11.19970703125, 11.8123779296875, 12.425048828125, 13.0377197265625, 13.650390625, 14.2630615234375, 14.875732421875, 15.4884033203125, 16.10107421875, 16.7137451171875, 17.326416015625, 17.9390869140625, 18.5517578125, 19.1644287109375, 19.777099609375, 20.3897705078125, 21.00244140625, 21.6151123046875, 22.227783203125, 22.8404541015625, 23.453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 18.0, 17.0, 31.0, 35.0, 49.0, 46.0, 90.0, 104.0, 152.0, 109.0, 88.0, 55.0, 37.0, 41.0, 17.0, 28.0, 11.0, 5.0, 12.0, 4.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001926422119140625, -0.001872330904006958, -0.001818239688873291, -0.001764148473739624, -0.001710057258605957, -0.00165596604347229, -0.001601874828338623, -0.001547783613204956, -0.001493692398071289, -0.001439601182937622, -0.001385509967803955, -0.001331418752670288, -0.001277327537536621, -0.001223236322402954, -0.0011691451072692871, -0.0011150538921356201, -0.0010609626770019531, -0.0010068714618682861, -0.0009527802467346191, -0.0008986890316009521, -0.0008445978164672852, -0.0007905066013336182, -0.0007364153861999512, -0.0006823241710662842, -0.0006282329559326172, -0.0005741417407989502, -0.0005200505256652832, -0.0004659593105316162, -0.0004118680953979492, -0.0003577768802642822, -0.00030368566513061523, -0.00024959444999694824, -0.00019550323486328125, -0.00014141201972961426, -8.732080459594727e-05, -3.3229589462280273e-05, 2.086162567138672e-05, 7.495284080505371e-05, 0.0001290440559387207, 0.0001831352710723877, 0.0002372264862060547, 0.0002913177013397217, 0.00034540891647338867, 0.00039950013160705566, 0.00045359134674072266, 0.0005076825618743896, 0.0005617737770080566, 0.0006158649921417236, 0.0006699562072753906, 0.0007240474224090576, 0.0007781386375427246, 0.0008322298526763916, 0.0008863210678100586, 0.0009404122829437256, 0.0009945034980773926, 0.0010485947132110596, 0.0011026859283447266, 0.0011567771434783936, 0.0012108683586120605, 0.0012649595737457275, 0.0013190507888793945, 0.0013731420040130615, 0.0014272332191467285, 0.0014813244342803955, 0.0015354156494140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 11.0, 12.0, 8.0, 35.0, 57.0, 108.0, 278.0, 761.0, 3224.0, 28486.0, 950788.0, 58687.0, 4485.0, 1008.0, 350.0, 126.0, 62.0, 27.0, 15.0, 6.0, 5.0, 5.0, 8.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.1328125, -13.7569580078125, -13.381103515625, -13.0052490234375, -12.62939453125, -12.2535400390625, -11.877685546875, -11.5018310546875, -11.1259765625, -10.7501220703125, -10.374267578125, -9.9984130859375, -9.62255859375, -9.2467041015625, -8.870849609375, -8.4949951171875, -8.119140625, -7.7432861328125, -7.367431640625, -6.9915771484375, -6.61572265625, -6.2398681640625, -5.864013671875, -5.4881591796875, -5.1123046875, -4.7364501953125, -4.360595703125, -3.9847412109375, -3.60888671875, -3.2330322265625, -2.857177734375, -2.4813232421875, -2.10546875, -1.7296142578125, -1.353759765625, -0.9779052734375, -0.60205078125, -0.2261962890625, 0.149658203125, 0.5255126953125, 0.9013671875, 1.2772216796875, 1.653076171875, 2.0289306640625, 2.40478515625, 2.7806396484375, 3.156494140625, 3.5323486328125, 3.908203125, 4.2840576171875, 4.659912109375, 5.0357666015625, 5.41162109375, 5.7874755859375, 6.163330078125, 6.5391845703125, 6.9150390625, 7.2908935546875, 7.666748046875, 8.0426025390625, 8.41845703125, 8.7943115234375, 9.170166015625, 9.5460205078125, 9.921875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 15.0, 20.0, 32.0, 38.0, 60.0, 80.0, 123.0, 144.0, 138.0, 104.0, 63.0, 62.0, 36.0, 26.0, 17.0, 16.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6875, -7.3922119140625, -7.096923828125, -6.8016357421875, -6.50634765625, -6.2110595703125, -5.915771484375, -5.6204833984375, -5.3251953125, -5.0299072265625, -4.734619140625, -4.4393310546875, -4.14404296875, -3.8487548828125, -3.553466796875, -3.2581787109375, -2.962890625, -2.6676025390625, -2.372314453125, -2.0770263671875, -1.78173828125, -1.4864501953125, -1.191162109375, -0.8958740234375, -0.6005859375, -0.3052978515625, -0.010009765625, 0.2852783203125, 0.58056640625, 0.8758544921875, 1.171142578125, 1.4664306640625, 1.76171875, 2.0570068359375, 2.352294921875, 2.6475830078125, 2.94287109375, 3.2381591796875, 3.533447265625, 3.8287353515625, 4.1240234375, 4.4193115234375, 4.714599609375, 5.0098876953125, 5.30517578125, 5.6004638671875, 5.895751953125, 6.1910400390625, 6.486328125, 6.7816162109375, 7.076904296875, 7.3721923828125, 7.66748046875, 7.9627685546875, 8.258056640625, 8.5533447265625, 8.8486328125, 9.1439208984375, 9.439208984375, 9.7344970703125, 10.02978515625, 10.3250732421875, 10.620361328125, 10.9156494140625, 11.2109375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 12.0, 20.0, 36.0, 35.0, 76.0, 88.0, 169.0, 177.0, 118.0, 89.0, 56.0, 48.0, 18.0, 13.0, 9.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.28850555419922, -89.34164428710938, -86.39478302001953, -83.44792175292969, -80.50105285644531, -77.55419158935547, -74.60733032226562, -71.66046905517578, -68.71360778808594, -65.7667465209961, -62.819881439208984, -59.87302017211914, -56.92615509033203, -53.97929382324219, -51.032432556152344, -48.0855712890625, -45.138702392578125, -42.19184112548828, -39.24497604370117, -36.29811477661133, -33.35124969482422, -30.404388427734375, -27.45752716064453, -24.510663986206055, -21.563800811767578, -18.6169376373291, -15.670075416564941, -12.723213195800781, -9.776350021362305, -6.829486846923828, -3.8826255798339844, -0.9357624053955078, 2.0111007690429688, 4.957963466644287, 7.9048261642456055, 10.851688385009766, 13.798551559448242, 16.74541473388672, 19.692276000976562, 22.63913917541504, 25.586002349853516, 28.532865524291992, 31.47972869873047, 34.42658996582031, 37.373451232910156, 40.320316314697266, 43.26717758178711, 46.21404266357422, 49.16090393066406, 52.107765197753906, 55.054630279541016, 58.00149154663086, 60.94835662841797, 63.89521789550781, 66.84207916259766, 69.7889404296875, 72.73580932617188, 75.68267059326172, 78.62953186035156, 81.57640075683594, 84.52326202392578, 87.47012329101562, 90.41698455810547, 93.36384582519531, 96.31070709228516]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 8.0, 6.0, 7.0, 15.0, 10.0, 8.0, 20.0, 21.0, 24.0, 31.0, 32.0, 44.0, 40.0, 40.0, 44.0, 52.0, 90.0, 70.0, 62.0, 54.0, 36.0, 42.0, 30.0, 40.0, 19.0, 37.0, 24.0, 20.0, 17.0, 14.0, 7.0, 12.0, 1.0, 1.0, 5.0, 3.0, 7.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-84.497314453125, -82.14225006103516, -79.78717803955078, -77.43211364746094, -75.0770492553711, -72.72198486328125, -70.36691284179688, -68.01184844970703, -65.65678405761719, -63.30171585083008, -60.946651458740234, -58.591583251953125, -56.23651885986328, -53.88145065307617, -51.52638244628906, -49.17131805419922, -46.816246032714844, -44.461177825927734, -42.10611343383789, -39.75104522705078, -37.39598083496094, -35.04091262817383, -32.68584442138672, -30.330778121948242, -27.975711822509766, -25.62064552307129, -23.265579223632812, -20.910511016845703, -18.555444717407227, -16.20037841796875, -13.845311164855957, -11.490243911743164, -9.135177612304688, -6.780110836029053, -4.425044059753418, -2.069977283477783, 0.28508949279785156, 2.640155792236328, 4.995223045349121, 7.350290298461914, 9.70535659790039, 12.060422897338867, 14.41549015045166, 16.770557403564453, 19.12562370300293, 21.480690002441406, 23.835758209228516, 26.190824508666992, 28.54589080810547, 30.900957107543945, 33.25602340698242, 35.61109161376953, 37.966156005859375, 40.321224212646484, 42.676292419433594, 45.03135681152344, 47.38642501831055, 49.741493225097656, 52.0965576171875, 54.45162582397461, 56.80669403076172, 59.16175842285156, 61.51682662963867, 63.87189483642578, 66.22695922851562]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 7.0, 4.0, 9.0, 6.0, 16.0, 34.0, 40.0, 74.0, 133.0, 220.0, 451.0, 962.0, 2147.0, 5155.0, 13705.0, 42890.0, 190101.0, 1378925.0, 2160479.0, 307545.0, 60314.0, 18338.0, 6900.0, 3033.0, 1408.0, 696.0, 343.0, 156.0, 102.0, 40.0, 25.0, 9.0, 5.0, 2.0, 1.0, 1.0], "bins": [-7.62109375, -7.455902099609375, -7.29071044921875, -7.125518798828125, -6.9603271484375, -6.795135498046875, -6.62994384765625, -6.464752197265625, -6.299560546875, -6.134368896484375, -5.96917724609375, -5.803985595703125, -5.6387939453125, -5.473602294921875, -5.30841064453125, -5.143218994140625, -4.97802734375, -4.812835693359375, -4.64764404296875, -4.482452392578125, -4.3172607421875, -4.152069091796875, -3.98687744140625, -3.821685791015625, -3.656494140625, -3.491302490234375, -3.32611083984375, -3.160919189453125, -2.9957275390625, -2.830535888671875, -2.66534423828125, -2.500152587890625, -2.3349609375, -2.169769287109375, -2.00457763671875, -1.839385986328125, -1.6741943359375, -1.509002685546875, -1.34381103515625, -1.178619384765625, -1.013427734375, -0.848236083984375, -0.68304443359375, -0.517852783203125, -0.3526611328125, -0.187469482421875, -0.02227783203125, 0.142913818359375, 0.30810546875, 0.473297119140625, 0.63848876953125, 0.803680419921875, 0.9688720703125, 1.134063720703125, 1.29925537109375, 1.464447021484375, 1.629638671875, 1.794830322265625, 1.96002197265625, 2.125213623046875, 2.2904052734375, 2.455596923828125, 2.62078857421875, 2.785980224609375, 2.951171875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 14.0, 21.0, 28.0, 49.0, 56.0, 84.0, 87.0, 93.0, 98.0, 103.0, 104.0, 78.0, 53.0, 43.0, 24.0, 21.0, 16.0, 14.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.2734375, -12.020355224609375, -11.76727294921875, -11.514190673828125, -11.2611083984375, -11.008026123046875, -10.75494384765625, -10.501861572265625, -10.248779296875, -9.995697021484375, -9.74261474609375, -9.489532470703125, -9.2364501953125, -8.983367919921875, -8.73028564453125, -8.477203369140625, -8.22412109375, -7.971038818359375, -7.71795654296875, -7.464874267578125, -7.2117919921875, -6.958709716796875, -6.70562744140625, -6.452545166015625, -6.199462890625, -5.946380615234375, -5.69329833984375, -5.440216064453125, -5.1871337890625, -4.934051513671875, -4.68096923828125, -4.427886962890625, -4.1748046875, -3.921722412109375, -3.66864013671875, -3.415557861328125, -3.1624755859375, -2.909393310546875, -2.65631103515625, -2.403228759765625, -2.150146484375, -1.897064208984375, -1.64398193359375, -1.390899658203125, -1.1378173828125, -0.884735107421875, -0.63165283203125, -0.378570556640625, -0.12548828125, 0.127593994140625, 0.38067626953125, 0.633758544921875, 0.8868408203125, 1.139923095703125, 1.39300537109375, 1.646087646484375, 1.899169921875, 2.152252197265625, 2.40533447265625, 2.658416748046875, 2.9114990234375, 3.164581298828125, 3.41766357421875, 3.670745849609375, 3.923828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 4.0, 12.0, 16.0, 23.0, 39.0, 62.0, 89.0, 167.0, 368.0, 1073.0, 4627.0, 32564.0, 724281.0, 3339385.0, 79268.0, 9079.0, 1867.0, 602.0, 302.0, 156.0, 114.0, 78.0, 40.0, 20.0, 16.0, 15.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7890625, -11.2803955078125, -10.771728515625, -10.2630615234375, -9.75439453125, -9.2457275390625, -8.737060546875, -8.2283935546875, -7.7197265625, -7.2110595703125, -6.702392578125, -6.1937255859375, -5.68505859375, -5.1763916015625, -4.667724609375, -4.1590576171875, -3.650390625, -3.1417236328125, -2.633056640625, -2.1243896484375, -1.61572265625, -1.1070556640625, -0.598388671875, -0.0897216796875, 0.4189453125, 0.9276123046875, 1.436279296875, 1.9449462890625, 2.45361328125, 2.9622802734375, 3.470947265625, 3.9796142578125, 4.48828125, 4.9969482421875, 5.505615234375, 6.0142822265625, 6.52294921875, 7.0316162109375, 7.540283203125, 8.0489501953125, 8.5576171875, 9.0662841796875, 9.574951171875, 10.0836181640625, 10.59228515625, 11.1009521484375, 11.609619140625, 12.1182861328125, 12.626953125, 13.1356201171875, 13.644287109375, 14.1529541015625, 14.66162109375, 15.1702880859375, 15.678955078125, 16.1876220703125, 16.6962890625, 17.2049560546875, 17.713623046875, 18.2222900390625, 18.73095703125, 19.2396240234375, 19.748291015625, 20.2569580078125, 20.765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 2.0, 14.0, 14.0, 18.0, 24.0, 38.0, 34.0, 53.0, 81.0, 105.0, 131.0, 235.0, 370.0, 632.0, 718.0, 570.0, 346.0, 185.0, 149.0, 92.0, 51.0, 55.0, 42.0, 23.0, 16.0, 11.0, 10.0, 11.0, 8.0, 4.0, 6.0, 7.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.742431640625, -8.42236328125, -8.102294921875, -7.7822265625, -7.462158203125, -7.14208984375, -6.822021484375, -6.501953125, -6.181884765625, -5.86181640625, -5.541748046875, -5.2216796875, -4.901611328125, -4.58154296875, -4.261474609375, -3.94140625, -3.621337890625, -3.30126953125, -2.981201171875, -2.6611328125, -2.341064453125, -2.02099609375, -1.700927734375, -1.380859375, -1.060791015625, -0.74072265625, -0.420654296875, -0.1005859375, 0.219482421875, 0.53955078125, 0.859619140625, 1.1796875, 1.499755859375, 1.81982421875, 2.139892578125, 2.4599609375, 2.780029296875, 3.10009765625, 3.420166015625, 3.740234375, 4.060302734375, 4.38037109375, 4.700439453125, 5.0205078125, 5.340576171875, 5.66064453125, 5.980712890625, 6.30078125, 6.620849609375, 6.94091796875, 7.260986328125, 7.5810546875, 7.901123046875, 8.22119140625, 8.541259765625, 8.861328125, 9.181396484375, 9.50146484375, 9.821533203125, 10.1416015625, 10.461669921875, 10.78173828125, 11.101806640625, 11.421875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 20.0, 30.0, 72.0, 199.0, 292.0, 217.0, 105.0, 32.0, 9.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-173.59999084472656, -168.24278259277344, -162.8855743408203, -157.52838134765625, -152.17117309570312, -146.81396484375, -141.45675659179688, -136.09954833984375, -130.74234008789062, -125.3851318359375, -120.0279312133789, -114.67072296142578, -109.31352233886719, -103.95631408691406, -98.59910583496094, -93.24189758300781, -87.88470458984375, -82.52749633789062, -77.17029571533203, -71.8130874633789, -66.45588684082031, -61.09867858886719, -55.74147033691406, -50.3842658996582, -45.027061462402344, -39.669857025146484, -34.312652587890625, -28.9554443359375, -23.59823989868164, -18.24103546142578, -12.883827209472656, -7.526622772216797, -2.169403076171875, 3.187802314758301, 8.545007705688477, 13.902214050292969, 19.259418487548828, 24.616622924804688, 29.973831176757812, 35.33103561401367, 40.68824005126953, 46.04544448852539, 51.40264892578125, 56.759857177734375, 62.117061614990234, 67.4742660522461, 72.83147430419922, 78.18867492675781, 83.54588317871094, 88.90309143066406, 94.26029205322266, 99.61750030517578, 104.97470092773438, 110.3319091796875, 115.68911743164062, 121.04632568359375, 126.40352630615234, 131.76072692871094, 137.11793518066406, 142.4751434326172, 147.8323516845703, 153.18954467773438, 158.5467529296875, 163.90396118164062, 169.26116943359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 12.0, 15.0, 15.0, 13.0, 23.0, 21.0, 28.0, 34.0, 42.0, 52.0, 50.0, 67.0, 65.0, 66.0, 62.0, 60.0, 50.0, 54.0, 57.0, 43.0, 30.0, 34.0, 29.0, 19.0, 21.0, 9.0, 9.0, 8.0, 8.0, 0.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-79.02796936035156, -76.88227081298828, -74.736572265625, -72.59087371826172, -70.44517517089844, -68.29946899414062, -66.15377044677734, -64.00807189941406, -61.86237335205078, -59.7166748046875, -57.57097625732422, -55.42527389526367, -53.27957534790039, -51.13387680053711, -48.98817443847656, -46.84247589111328, -44.69677734375, -42.55107879638672, -40.40538024902344, -38.25967788696289, -36.11397933959961, -33.96828079223633, -31.822580337524414, -29.6768798828125, -27.53118133544922, -25.385482788085938, -23.239782333374023, -21.09408187866211, -18.948383331298828, -16.802684783935547, -14.656984329223633, -12.511284828186035, -10.365592956542969, -8.219893455505371, -6.074193954467773, -3.928494453430176, -1.7827949523925781, 0.36290454864501953, 2.508604049682617, 4.654303550720215, 6.8000030517578125, 8.94570255279541, 11.091402053833008, 13.237101554870605, 15.382801055908203, 17.528499603271484, 19.6742000579834, 21.819900512695312, 23.965599060058594, 26.111297607421875, 28.25699806213379, 30.402698516845703, 32.548397064208984, 34.694095611572266, 36.83979797363281, 38.985496520996094, 41.131195068359375, 43.276893615722656, 45.42259216308594, 47.568294525146484, 49.713993072509766, 51.85969161987305, 54.005393981933594, 56.151092529296875, 58.296791076660156]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 9.0, 20.0, 34.0, 54.0, 67.0, 101.0, 163.0, 250.0, 397.0, 683.0, 1201.0, 2059.0, 3993.0, 8459.0, 18480.0, 43100.0, 105588.0, 265691.0, 340148.0, 149893.0, 59868.0, 25470.0, 11189.0, 5196.0, 2721.0, 1506.0, 835.0, 515.0, 314.0, 193.0, 123.0, 68.0, 56.0, 32.0, 23.0, 17.0, 6.0, 12.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.2265625, -5.9793701171875, -5.732177734375, -5.4849853515625, -5.23779296875, -4.9906005859375, -4.743408203125, -4.4962158203125, -4.2490234375, -4.0018310546875, -3.754638671875, -3.5074462890625, -3.26025390625, -3.0130615234375, -2.765869140625, -2.5186767578125, -2.271484375, -2.0242919921875, -1.777099609375, -1.5299072265625, -1.28271484375, -1.0355224609375, -0.788330078125, -0.5411376953125, -0.2939453125, -0.0467529296875, 0.200439453125, 0.4476318359375, 0.69482421875, 0.9420166015625, 1.189208984375, 1.4364013671875, 1.68359375, 1.9307861328125, 2.177978515625, 2.4251708984375, 2.67236328125, 2.9195556640625, 3.166748046875, 3.4139404296875, 3.6611328125, 3.9083251953125, 4.155517578125, 4.4027099609375, 4.64990234375, 4.8970947265625, 5.144287109375, 5.3914794921875, 5.638671875, 5.8858642578125, 6.133056640625, 6.3802490234375, 6.62744140625, 6.8746337890625, 7.121826171875, 7.3690185546875, 7.6162109375, 7.8634033203125, 8.110595703125, 8.3577880859375, 8.60498046875, 8.8521728515625, 9.099365234375, 9.3465576171875, 9.59375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 10.0, 13.0, 9.0, 19.0, 21.0, 29.0, 44.0, 55.0, 65.0, 64.0, 62.0, 69.0, 78.0, 68.0, 67.0, 72.0, 47.0, 60.0, 33.0, 21.0, 24.0, 23.0, 17.0, 9.0, 8.0, 9.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.328125, -8.136993408203125, -7.94586181640625, -7.754730224609375, -7.5635986328125, -7.372467041015625, -7.18133544921875, -6.990203857421875, -6.799072265625, -6.607940673828125, -6.41680908203125, -6.225677490234375, -6.0345458984375, -5.843414306640625, -5.65228271484375, -5.461151123046875, -5.27001953125, -5.078887939453125, -4.88775634765625, -4.696624755859375, -4.5054931640625, -4.314361572265625, -4.12322998046875, -3.932098388671875, -3.740966796875, -3.549835205078125, -3.35870361328125, -3.167572021484375, -2.9764404296875, -2.785308837890625, -2.59417724609375, -2.403045654296875, -2.2119140625, -2.020782470703125, -1.82965087890625, -1.638519287109375, -1.4473876953125, -1.256256103515625, -1.06512451171875, -0.873992919921875, -0.682861328125, -0.491729736328125, -0.30059814453125, -0.109466552734375, 0.0816650390625, 0.272796630859375, 0.46392822265625, 0.655059814453125, 0.84619140625, 1.037322998046875, 1.22845458984375, 1.419586181640625, 1.6107177734375, 1.801849365234375, 1.99298095703125, 2.184112548828125, 2.375244140625, 2.566375732421875, 2.75750732421875, 2.948638916015625, 3.1397705078125, 3.330902099609375, 3.52203369140625, 3.713165283203125, 3.904296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 15.0, 18.0, 37.0, 34.0, 41.0, 61.0, 102.0, 152.0, 202.0, 383.0, 534.0, 1014.0, 2043.0, 5361.0, 21625.0, 154822.0, 743725.0, 94609.0, 15375.0, 4205.0, 1783.0, 897.0, 539.0, 330.0, 203.0, 126.0, 95.0, 62.0, 41.0, 23.0, 19.0, 17.0, 8.0, 16.0, 7.0, 2.0, 6.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.697509765625, -16.12939453125, -15.561279296875, -14.9931640625, -14.425048828125, -13.85693359375, -13.288818359375, -12.720703125, -12.152587890625, -11.58447265625, -11.016357421875, -10.4482421875, -9.880126953125, -9.31201171875, -8.743896484375, -8.17578125, -7.607666015625, -7.03955078125, -6.471435546875, -5.9033203125, -5.335205078125, -4.76708984375, -4.198974609375, -3.630859375, -3.062744140625, -2.49462890625, -1.926513671875, -1.3583984375, -0.790283203125, -0.22216796875, 0.345947265625, 0.9140625, 1.482177734375, 2.05029296875, 2.618408203125, 3.1865234375, 3.754638671875, 4.32275390625, 4.890869140625, 5.458984375, 6.027099609375, 6.59521484375, 7.163330078125, 7.7314453125, 8.299560546875, 8.86767578125, 9.435791015625, 10.00390625, 10.572021484375, 11.14013671875, 11.708251953125, 12.2763671875, 12.844482421875, 13.41259765625, 13.980712890625, 14.548828125, 15.116943359375, 15.68505859375, 16.253173828125, 16.8212890625, 17.389404296875, 17.95751953125, 18.525634765625, 19.09375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 11.0, 4.0, 17.0, 10.0, 17.0, 22.0, 28.0, 27.0, 25.0, 34.0, 39.0, 42.0, 61.0, 52.0, 53.0, 59.0, 65.0, 66.0, 49.0, 53.0, 35.0, 36.0, 36.0, 27.0, 33.0, 16.0, 19.0, 14.0, 9.0, 12.0, 5.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.03125, -20.4228515625, -19.814453125, -19.2060546875, -18.59765625, -17.9892578125, -17.380859375, -16.7724609375, -16.1640625, -15.5556640625, -14.947265625, -14.3388671875, -13.73046875, -13.1220703125, -12.513671875, -11.9052734375, -11.296875, -10.6884765625, -10.080078125, -9.4716796875, -8.86328125, -8.2548828125, -7.646484375, -7.0380859375, -6.4296875, -5.8212890625, -5.212890625, -4.6044921875, -3.99609375, -3.3876953125, -2.779296875, -2.1708984375, -1.5625, -0.9541015625, -0.345703125, 0.2626953125, 0.87109375, 1.4794921875, 2.087890625, 2.6962890625, 3.3046875, 3.9130859375, 4.521484375, 5.1298828125, 5.73828125, 6.3466796875, 6.955078125, 7.5634765625, 8.171875, 8.7802734375, 9.388671875, 9.9970703125, 10.60546875, 11.2138671875, 11.822265625, 12.4306640625, 13.0390625, 13.6474609375, 14.255859375, 14.8642578125, 15.47265625, 16.0810546875, 16.689453125, 17.2978515625, 17.90625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 15.0, 18.0, 32.0, 51.0, 82.0, 199.0, 465.0, 1177.0, 4266.0, 28874.0, 510261.0, 468008.0, 28816.0, 4180.0, 1179.0, 427.0, 211.0, 108.0, 61.0, 29.0, 20.0, 19.0, 8.0, 13.0, 8.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.19140625, -5.97027587890625, -5.7491455078125, -5.52801513671875, -5.306884765625, -5.08575439453125, -4.8646240234375, -4.64349365234375, -4.42236328125, -4.20123291015625, -3.9801025390625, -3.75897216796875, -3.537841796875, -3.31671142578125, -3.0955810546875, -2.87445068359375, -2.6533203125, -2.43218994140625, -2.2110595703125, -1.98992919921875, -1.768798828125, -1.54766845703125, -1.3265380859375, -1.10540771484375, -0.88427734375, -0.66314697265625, -0.4420166015625, -0.22088623046875, 0.000244140625, 0.22137451171875, 0.4425048828125, 0.66363525390625, 0.884765625, 1.10589599609375, 1.3270263671875, 1.54815673828125, 1.769287109375, 1.99041748046875, 2.2115478515625, 2.43267822265625, 2.65380859375, 2.87493896484375, 3.0960693359375, 3.31719970703125, 3.538330078125, 3.75946044921875, 3.9805908203125, 4.20172119140625, 4.4228515625, 4.64398193359375, 4.8651123046875, 5.08624267578125, 5.307373046875, 5.52850341796875, 5.7496337890625, 5.97076416015625, 6.19189453125, 6.41302490234375, 6.6341552734375, 6.85528564453125, 7.076416015625, 7.29754638671875, 7.5186767578125, 7.73980712890625, 7.9609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 13.0, 9.0, 16.0, 18.0, 30.0, 24.0, 36.0, 50.0, 43.0, 69.0, 87.0, 96.0, 69.0, 78.0, 67.0, 48.0, 38.0, 35.0, 24.0, 29.0, 15.0, 14.0, 12.0, 12.0, 6.0, 4.0, 4.0, 11.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012674331665039062, -0.0012329965829849243, -0.0011985599994659424, -0.0011641234159469604, -0.0011296868324279785, -0.0010952502489089966, -0.0010608136653900146, -0.0010263770818710327, -0.0009919404983520508, -0.0009575039148330688, -0.0009230673313140869, -0.000888630747795105, -0.000854194164276123, -0.0008197575807571411, -0.0007853209972381592, -0.0007508844137191772, -0.0007164478302001953, -0.0006820112466812134, -0.0006475746631622314, -0.0006131380796432495, -0.0005787014961242676, -0.0005442649126052856, -0.0005098283290863037, -0.0004753917455673218, -0.00044095516204833984, -0.0004065185785293579, -0.000372081995010376, -0.00033764541149139404, -0.0003032088279724121, -0.0002687722444534302, -0.00023433566093444824, -0.0001998990774154663, -0.00016546249389648438, -0.00013102591037750244, -9.658932685852051e-05, -6.215274333953857e-05, -2.771615982055664e-05, 6.720423698425293e-06, 4.1157007217407227e-05, 7.559359073638916e-05, 0.0001100301742553711, 0.00014446675777435303, 0.00017890334129333496, 0.0002133399248123169, 0.00024777650833129883, 0.00028221309185028076, 0.0003166496753692627, 0.00035108625888824463, 0.00038552284240722656, 0.0004199594259262085, 0.00045439600944519043, 0.0004888325929641724, 0.0005232691764831543, 0.0005577057600021362, 0.0005921423435211182, 0.0006265789270401001, 0.000661015510559082, 0.000695452094078064, 0.0007298886775970459, 0.0007643252611160278, 0.0007987618446350098, 0.0008331984281539917, 0.0008676350116729736, 0.0009020715951919556, 0.0009365081787109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 6.0, 5.0, 9.0, 9.0, 10.0, 14.0, 25.0, 28.0, 50.0, 65.0, 120.0, 171.0, 266.0, 427.0, 784.0, 1554.0, 3347.0, 9176.0, 37268.0, 227487.0, 640746.0, 97598.0, 18834.0, 5646.0, 2280.0, 1107.0, 549.0, 341.0, 193.0, 131.0, 95.0, 55.0, 36.0, 30.0, 23.0, 17.0, 13.0, 11.0, 11.0, 6.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.83050537109375, -3.7039794921875, -3.57745361328125, -3.450927734375, -3.32440185546875, -3.1978759765625, -3.07135009765625, -2.94482421875, -2.81829833984375, -2.6917724609375, -2.56524658203125, -2.438720703125, -2.31219482421875, -2.1856689453125, -2.05914306640625, -1.9326171875, -1.80609130859375, -1.6795654296875, -1.55303955078125, -1.426513671875, -1.29998779296875, -1.1734619140625, -1.04693603515625, -0.92041015625, -0.79388427734375, -0.6673583984375, -0.54083251953125, -0.414306640625, -0.28778076171875, -0.1612548828125, -0.03472900390625, 0.091796875, 0.21832275390625, 0.3448486328125, 0.47137451171875, 0.597900390625, 0.72442626953125, 0.8509521484375, 0.97747802734375, 1.10400390625, 1.23052978515625, 1.3570556640625, 1.48358154296875, 1.610107421875, 1.73663330078125, 1.8631591796875, 1.98968505859375, 2.1162109375, 2.24273681640625, 2.3692626953125, 2.49578857421875, 2.622314453125, 2.74884033203125, 2.8753662109375, 3.00189208984375, 3.12841796875, 3.25494384765625, 3.3814697265625, 3.50799560546875, 3.634521484375, 3.76104736328125, 3.8875732421875, 4.01409912109375, 4.140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 3.0, 12.0, 19.0, 17.0, 21.0, 33.0, 35.0, 42.0, 65.0, 71.0, 86.0, 102.0, 78.0, 83.0, 79.0, 65.0, 49.0, 28.0, 30.0, 19.0, 16.0, 17.0, 6.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0234375, -4.87493896484375, -4.7264404296875, -4.57794189453125, -4.429443359375, -4.28094482421875, -4.1324462890625, -3.98394775390625, -3.83544921875, -3.68695068359375, -3.5384521484375, -3.38995361328125, -3.241455078125, -3.09295654296875, -2.9444580078125, -2.79595947265625, -2.6474609375, -2.49896240234375, -2.3504638671875, -2.20196533203125, -2.053466796875, -1.90496826171875, -1.7564697265625, -1.60797119140625, -1.45947265625, -1.31097412109375, -1.1624755859375, -1.01397705078125, -0.865478515625, -0.71697998046875, -0.5684814453125, -0.41998291015625, -0.271484375, -0.12298583984375, 0.0255126953125, 0.17401123046875, 0.322509765625, 0.47100830078125, 0.6195068359375, 0.76800537109375, 0.91650390625, 1.06500244140625, 1.2135009765625, 1.36199951171875, 1.510498046875, 1.65899658203125, 1.8074951171875, 1.95599365234375, 2.1044921875, 2.25299072265625, 2.4014892578125, 2.54998779296875, 2.698486328125, 2.84698486328125, 2.9954833984375, 3.14398193359375, 3.29248046875, 3.44097900390625, 3.5894775390625, 3.73797607421875, 3.886474609375, 4.03497314453125, 4.1834716796875, 4.33197021484375, 4.48046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 13.0, 17.0, 27.0, 47.0, 68.0, 120.0, 162.0, 214.0, 105.0, 69.0, 50.0, 42.0, 16.0, 13.0, 10.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-111.75297546386719, -108.66079711914062, -105.5686264038086, -102.47644805908203, -99.38427734375, -96.29209899902344, -93.19992065429688, -90.10774993896484, -87.01557922363281, -83.92340087890625, -80.83123016357422, -77.73905181884766, -74.64688110351562, -71.55470275878906, -68.4625244140625, -65.37035369873047, -62.278175354003906, -59.18600082397461, -56.09382629394531, -53.00164794921875, -49.90947723388672, -46.817298889160156, -43.72512435913086, -40.63294982910156, -37.540775299072266, -34.44860076904297, -31.356426239013672, -28.264249801635742, -25.172075271606445, -22.07990074157715, -18.98772430419922, -15.895549774169922, -12.803375244140625, -9.711200714111328, -6.619025230407715, -3.5268497467041016, -0.4346752166748047, 2.657499313354492, 5.749675750732422, 8.841850280761719, 11.934024810791016, 15.026199340820312, 18.11837387084961, 21.21055030822754, 24.302724838256836, 27.394899368286133, 30.487075805664062, 33.57925033569336, 36.671424865722656, 39.76359939575195, 42.85577392578125, 45.94795227050781, 49.040122985839844, 52.132301330566406, 55.2244758605957, 58.316650390625, 61.4088249206543, 64.5009994506836, 67.59317779541016, 70.68534851074219, 73.77752685546875, 76.86969757080078, 79.96187591552734, 83.05404663085938, 86.14622497558594]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 7.0, 2.0, 6.0, 11.0, 9.0, 9.0, 10.0, 13.0, 26.0, 23.0, 28.0, 25.0, 33.0, 36.0, 33.0, 45.0, 69.0, 87.0, 101.0, 73.0, 60.0, 37.0, 38.0, 38.0, 25.0, 32.0, 32.0, 15.0, 17.0, 14.0, 17.0, 6.0, 5.0, 7.0, 10.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.12016296386719, -66.59635925292969, -64.07254791259766, -61.548744201660156, -59.02493667602539, -56.501129150390625, -53.977325439453125, -51.45351791381836, -48.929710388183594, -46.40590286254883, -43.88209915161133, -41.35829162597656, -38.8344841003418, -36.31067657470703, -33.78687286376953, -31.263065338134766, -28.739261627197266, -26.215456008911133, -23.691648483276367, -21.167842864990234, -18.64403533935547, -16.120229721069336, -13.596424102783203, -11.072616577148438, -8.548810958862305, -6.0250043869018555, -3.5011982917785645, -0.9773921966552734, 1.5464143753051758, 4.070220947265625, 6.594026565551758, 9.117834091186523, 11.641639709472656, 14.165446281433105, 16.689252853393555, 19.213058471679688, 21.736865997314453, 24.260671615600586, 26.78447723388672, 29.308284759521484, 31.832090377807617, 34.35589599609375, 36.879703521728516, 39.40351104736328, 41.92731475830078, 44.45112228393555, 46.97492980957031, 49.49873352050781, 52.02254104614258, 54.546348571777344, 57.070152282714844, 59.59395980834961, 62.117767333984375, 64.64157104492188, 67.16537475585938, 69.6891860961914, 72.2129898071289, 74.7367935180664, 77.26060485839844, 79.78440856933594, 82.30821228027344, 84.83202362060547, 87.35582733154297, 89.879638671875, 92.4034423828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 10.0, 13.0, 16.0, 23.0, 38.0, 57.0, 70.0, 149.0, 213.0, 383.0, 668.0, 1251.0, 2560.0, 5511.0, 12973.0, 39082.0, 182394.0, 1331849.0, 2192989.0, 334742.0, 58277.0, 17495.0, 6911.0, 3175.0, 1475.0, 799.0, 441.0, 250.0, 151.0, 109.0, 62.0, 46.0, 27.0, 20.0, 11.0, 11.0, 9.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.0916748046875, -4.933349609375, -4.7750244140625, -4.61669921875, -4.4583740234375, -4.300048828125, -4.1417236328125, -3.9833984375, -3.8250732421875, -3.666748046875, -3.5084228515625, -3.35009765625, -3.1917724609375, -3.033447265625, -2.8751220703125, -2.716796875, -2.5584716796875, -2.400146484375, -2.2418212890625, -2.08349609375, -1.9251708984375, -1.766845703125, -1.6085205078125, -1.4501953125, -1.2918701171875, -1.133544921875, -0.9752197265625, -0.81689453125, -0.6585693359375, -0.500244140625, -0.3419189453125, -0.18359375, -0.0252685546875, 0.133056640625, 0.2913818359375, 0.44970703125, 0.6080322265625, 0.766357421875, 0.9246826171875, 1.0830078125, 1.2413330078125, 1.399658203125, 1.5579833984375, 1.71630859375, 1.8746337890625, 2.032958984375, 2.1912841796875, 2.349609375, 2.5079345703125, 2.666259765625, 2.8245849609375, 2.98291015625, 3.1412353515625, 3.299560546875, 3.4578857421875, 3.6162109375, 3.7745361328125, 3.932861328125, 4.0911865234375, 4.24951171875, 4.4078369140625, 4.566162109375, 4.7244873046875, 4.8828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 8.0, 5.0, 8.0, 10.0, 8.0, 14.0, 10.0, 19.0, 22.0, 21.0, 28.0, 23.0, 24.0, 29.0, 38.0, 32.0, 46.0, 40.0, 43.0, 37.0, 47.0, 39.0, 35.0, 48.0, 33.0, 40.0, 38.0, 31.0, 32.0, 28.0, 26.0, 20.0, 15.0, 13.0, 12.0, 11.0, 9.0, 9.0, 8.0, 10.0, 6.0, 0.0, 8.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.048828125, -2.9493408203125, -2.849853515625, -2.7503662109375, -2.65087890625, -2.5513916015625, -2.451904296875, -2.3524169921875, -2.2529296875, -2.1534423828125, -2.053955078125, -1.9544677734375, -1.85498046875, -1.7554931640625, -1.656005859375, -1.5565185546875, -1.45703125, -1.3575439453125, -1.258056640625, -1.1585693359375, -1.05908203125, -0.9595947265625, -0.860107421875, -0.7606201171875, -0.6611328125, -0.5616455078125, -0.462158203125, -0.3626708984375, -0.26318359375, -0.1636962890625, -0.064208984375, 0.0352783203125, 0.134765625, 0.2342529296875, 0.333740234375, 0.4332275390625, 0.53271484375, 0.6322021484375, 0.731689453125, 0.8311767578125, 0.9306640625, 1.0301513671875, 1.129638671875, 1.2291259765625, 1.32861328125, 1.4281005859375, 1.527587890625, 1.6270751953125, 1.7265625, 1.8260498046875, 1.925537109375, 2.0250244140625, 2.12451171875, 2.2239990234375, 2.323486328125, 2.4229736328125, 2.5224609375, 2.6219482421875, 2.721435546875, 2.8209228515625, 2.92041015625, 3.0198974609375, 3.119384765625, 3.2188720703125, 3.318359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 16.0, 12.0, 25.0, 23.0, 35.0, 57.0, 99.0, 167.0, 301.0, 802.0, 3874.0, 63711.0, 3958137.0, 157495.0, 7073.0, 1224.0, 435.0, 236.0, 163.0, 102.0, 73.0, 57.0, 44.0, 40.0, 15.0, 16.0, 13.0, 10.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.78662109375, -16.1044921875, -15.42236328125, -14.740234375, -14.05810546875, -13.3759765625, -12.69384765625, -12.01171875, -11.32958984375, -10.6474609375, -9.96533203125, -9.283203125, -8.60107421875, -7.9189453125, -7.23681640625, -6.5546875, -5.87255859375, -5.1904296875, -4.50830078125, -3.826171875, -3.14404296875, -2.4619140625, -1.77978515625, -1.09765625, -0.41552734375, 0.2666015625, 0.94873046875, 1.630859375, 2.31298828125, 2.9951171875, 3.67724609375, 4.359375, 5.04150390625, 5.7236328125, 6.40576171875, 7.087890625, 7.77001953125, 8.4521484375, 9.13427734375, 9.81640625, 10.49853515625, 11.1806640625, 11.86279296875, 12.544921875, 13.22705078125, 13.9091796875, 14.59130859375, 15.2734375, 15.95556640625, 16.6376953125, 17.31982421875, 18.001953125, 18.68408203125, 19.3662109375, 20.04833984375, 20.73046875, 21.41259765625, 22.0947265625, 22.77685546875, 23.458984375, 24.14111328125, 24.8232421875, 25.50537109375, 26.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 13.0, 18.0, 49.0, 73.0, 100.0, 234.0, 549.0, 1131.0, 1007.0, 419.0, 217.0, 87.0, 62.0, 36.0, 25.0, 13.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0546875, -7.5479736328125, -7.041259765625, -6.5345458984375, -6.02783203125, -5.5211181640625, -5.014404296875, -4.5076904296875, -4.0009765625, -3.4942626953125, -2.987548828125, -2.4808349609375, -1.97412109375, -1.4674072265625, -0.960693359375, -0.4539794921875, 0.052734375, 0.5594482421875, 1.066162109375, 1.5728759765625, 2.07958984375, 2.5863037109375, 3.093017578125, 3.5997314453125, 4.1064453125, 4.6131591796875, 5.119873046875, 5.6265869140625, 6.13330078125, 6.6400146484375, 7.146728515625, 7.6534423828125, 8.16015625, 8.6668701171875, 9.173583984375, 9.6802978515625, 10.18701171875, 10.6937255859375, 11.200439453125, 11.7071533203125, 12.2138671875, 12.7205810546875, 13.227294921875, 13.7340087890625, 14.24072265625, 14.7474365234375, 15.254150390625, 15.7608642578125, 16.267578125, 16.7742919921875, 17.281005859375, 17.7877197265625, 18.29443359375, 18.8011474609375, 19.307861328125, 19.8145751953125, 20.3212890625, 20.8280029296875, 21.334716796875, 21.8414306640625, 22.34814453125, 22.8548583984375, 23.361572265625, 23.8682861328125, 24.375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 8.0, 8.0, 14.0, 47.0, 149.0, 246.0, 257.0, 149.0, 61.0, 26.0, 11.0, 9.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.5615463256836, -79.55257415771484, -74.54360961914062, -69.53463745117188, -64.52566528320312, -59.516693115234375, -54.50772476196289, -49.498756408691406, -44.489784240722656, -39.480812072753906, -34.47184371948242, -29.462873458862305, -24.453903198242188, -19.44493293762207, -14.435962677001953, -9.426994323730469, -4.418022155761719, 0.5909481048583984, 5.599918365478516, 10.608888626098633, 15.61785888671875, 20.626829147338867, 25.635799407958984, 30.64476776123047, 35.65373992919922, 40.66271209716797, 45.67168045043945, 50.68064880371094, 55.68962097167969, 60.69859313964844, 65.70756530761719, 70.7165298461914, 75.72549438476562, 80.73446655273438, 85.74343872070312, 90.75240325927734, 95.7613754272461, 100.77034759521484, 105.77931213378906, 110.78828430175781, 115.79725646972656, 120.80622863769531, 125.81520080566406, 130.8241729736328, 135.8331298828125, 140.84210205078125, 145.85107421875, 150.86004638671875, 155.8690185546875, 160.87799072265625, 165.886962890625, 170.89593505859375, 175.9049072265625, 180.9138641357422, 185.92283630371094, 190.9318084716797, 195.94078063964844, 200.9497528076172, 205.95872497558594, 210.9676971435547, 215.97665405273438, 220.98562622070312, 225.99459838867188, 231.00357055664062, 236.01254272460938]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 9.0, 7.0, 8.0, 5.0, 22.0, 14.0, 16.0, 24.0, 24.0, 24.0, 35.0, 35.0, 42.0, 51.0, 66.0, 48.0, 58.0, 56.0, 61.0, 58.0, 42.0, 52.0, 40.0, 33.0, 23.0, 32.0, 24.0, 28.0, 13.0, 11.0, 11.0, 9.0, 8.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-71.04045867919922, -69.17880249023438, -67.31714630126953, -65.45549011230469, -63.59383773803711, -61.73218536376953, -59.87052917480469, -58.008872985839844, -56.147216796875, -54.285560607910156, -52.42390823364258, -50.562252044677734, -48.70059585571289, -46.83894348144531, -44.97728729248047, -43.115631103515625, -41.25397872924805, -39.3923225402832, -37.530670166015625, -35.66901397705078, -33.80735778808594, -31.945703506469727, -30.084049224853516, -28.222393035888672, -26.36073875427246, -24.49908447265625, -22.637428283691406, -20.775774002075195, -18.914119720458984, -17.05246353149414, -15.19080924987793, -13.329154014587402, -11.46750259399414, -9.605847358703613, -7.744192600250244, -5.882537841796875, -4.020882606506348, -2.1592273712158203, -0.2975730895996094, 1.564082145690918, 3.4257373809814453, 5.287392616271973, 7.149047374725342, 9.010702133178711, 10.872357368469238, 12.734012603759766, 14.595666885375977, 16.457321166992188, 18.31897735595703, 20.180631637573242, 22.042287826538086, 23.903942108154297, 25.76559829711914, 27.62725257873535, 29.488906860351562, 31.350563049316406, 33.21221923828125, 35.073875427246094, 36.93552780151367, 38.797183990478516, 40.65884017944336, 42.52049255371094, 44.38214874267578, 46.243804931640625, 48.1054573059082]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 7.0, 6.0, 7.0, 8.0, 20.0, 21.0, 33.0, 62.0, 76.0, 125.0, 181.0, 209.0, 338.0, 510.0, 759.0, 1179.0, 2037.0, 3607.0, 6389.0, 12366.0, 25724.0, 56637.0, 126296.0, 255028.0, 279357.0, 148707.0, 66786.0, 30107.0, 14538.0, 7471.0, 3830.0, 2251.0, 1384.0, 832.0, 559.0, 374.0, 250.0, 149.0, 107.0, 68.0, 55.0, 45.0, 29.0, 16.0, 12.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.765625, -5.5740966796875, -5.382568359375, -5.1910400390625, -4.99951171875, -4.8079833984375, -4.616455078125, -4.4249267578125, -4.2333984375, -4.0418701171875, -3.850341796875, -3.6588134765625, -3.46728515625, -3.2757568359375, -3.084228515625, -2.8927001953125, -2.701171875, -2.5096435546875, -2.318115234375, -2.1265869140625, -1.93505859375, -1.7435302734375, -1.552001953125, -1.3604736328125, -1.1689453125, -0.9774169921875, -0.785888671875, -0.5943603515625, -0.40283203125, -0.2113037109375, -0.019775390625, 0.1717529296875, 0.36328125, 0.5548095703125, 0.746337890625, 0.9378662109375, 1.12939453125, 1.3209228515625, 1.512451171875, 1.7039794921875, 1.8955078125, 2.0870361328125, 2.278564453125, 2.4700927734375, 2.66162109375, 2.8531494140625, 3.044677734375, 3.2362060546875, 3.427734375, 3.6192626953125, 3.810791015625, 4.0023193359375, 4.19384765625, 4.3853759765625, 4.576904296875, 4.7684326171875, 4.9599609375, 5.1514892578125, 5.343017578125, 5.5345458984375, 5.72607421875, 5.9176025390625, 6.109130859375, 6.3006591796875, 6.4921875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 18.0, 12.0, 17.0, 15.0, 26.0, 16.0, 19.0, 39.0, 31.0, 36.0, 52.0, 47.0, 49.0, 52.0, 49.0, 52.0, 49.0, 56.0, 44.0, 36.0, 24.0, 32.0, 28.0, 34.0, 17.0, 29.0, 23.0, 14.0, 21.0, 5.0, 5.0, 14.0, 7.0, 5.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.6640625, -4.535430908203125, -4.40679931640625, -4.278167724609375, -4.1495361328125, -4.020904541015625, -3.89227294921875, -3.763641357421875, -3.635009765625, -3.506378173828125, -3.37774658203125, -3.249114990234375, -3.1204833984375, -2.991851806640625, -2.86322021484375, -2.734588623046875, -2.60595703125, -2.477325439453125, -2.34869384765625, -2.220062255859375, -2.0914306640625, -1.962799072265625, -1.83416748046875, -1.705535888671875, -1.576904296875, -1.448272705078125, -1.31964111328125, -1.191009521484375, -1.0623779296875, -0.933746337890625, -0.80511474609375, -0.676483154296875, -0.5478515625, -0.419219970703125, -0.29058837890625, -0.161956787109375, -0.0333251953125, 0.095306396484375, 0.22393798828125, 0.352569580078125, 0.481201171875, 0.609832763671875, 0.73846435546875, 0.867095947265625, 0.9957275390625, 1.124359130859375, 1.25299072265625, 1.381622314453125, 1.51025390625, 1.638885498046875, 1.76751708984375, 1.896148681640625, 2.0247802734375, 2.153411865234375, 2.28204345703125, 2.410675048828125, 2.539306640625, 2.667938232421875, 2.79656982421875, 2.925201416015625, 3.0538330078125, 3.182464599609375, 3.31109619140625, 3.439727783203125, 3.568359375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 7.0, 6.0, 6.0, 12.0, 20.0, 26.0, 34.0, 60.0, 71.0, 109.0, 195.0, 387.0, 792.0, 1980.0, 5957.0, 29010.0, 240136.0, 686808.0, 66433.0, 11182.0, 3024.0, 1092.0, 540.0, 280.0, 123.0, 83.0, 44.0, 40.0, 28.0, 18.0, 10.0, 6.0, 8.0, 9.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.546875, -19.0216064453125, -18.496337890625, -17.9710693359375, -17.44580078125, -16.9205322265625, -16.395263671875, -15.8699951171875, -15.3447265625, -14.8194580078125, -14.294189453125, -13.7689208984375, -13.24365234375, -12.7183837890625, -12.193115234375, -11.6678466796875, -11.142578125, -10.6173095703125, -10.092041015625, -9.5667724609375, -9.04150390625, -8.5162353515625, -7.990966796875, -7.4656982421875, -6.9404296875, -6.4151611328125, -5.889892578125, -5.3646240234375, -4.83935546875, -4.3140869140625, -3.788818359375, -3.2635498046875, -2.73828125, -2.2130126953125, -1.687744140625, -1.1624755859375, -0.63720703125, -0.1119384765625, 0.413330078125, 0.9385986328125, 1.4638671875, 1.9891357421875, 2.514404296875, 3.0396728515625, 3.56494140625, 4.0902099609375, 4.615478515625, 5.1407470703125, 5.666015625, 6.1912841796875, 6.716552734375, 7.2418212890625, 7.76708984375, 8.2923583984375, 8.817626953125, 9.3428955078125, 9.8681640625, 10.3934326171875, 10.918701171875, 11.4439697265625, 11.96923828125, 12.4945068359375, 13.019775390625, 13.5450439453125, 14.0703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 5.0, 8.0, 11.0, 14.0, 16.0, 29.0, 34.0, 24.0, 22.0, 38.0, 42.0, 42.0, 55.0, 55.0, 65.0, 60.0, 42.0, 56.0, 50.0, 36.0, 45.0, 43.0, 23.0, 25.0, 23.0, 19.0, 15.0, 17.0, 19.0, 18.0, 5.0, 13.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.65625, -17.132568359375, -16.60888671875, -16.085205078125, -15.5615234375, -15.037841796875, -14.51416015625, -13.990478515625, -13.466796875, -12.943115234375, -12.41943359375, -11.895751953125, -11.3720703125, -10.848388671875, -10.32470703125, -9.801025390625, -9.27734375, -8.753662109375, -8.22998046875, -7.706298828125, -7.1826171875, -6.658935546875, -6.13525390625, -5.611572265625, -5.087890625, -4.564208984375, -4.04052734375, -3.516845703125, -2.9931640625, -2.469482421875, -1.94580078125, -1.422119140625, -0.8984375, -0.374755859375, 0.14892578125, 0.672607421875, 1.1962890625, 1.719970703125, 2.24365234375, 2.767333984375, 3.291015625, 3.814697265625, 4.33837890625, 4.862060546875, 5.3857421875, 5.909423828125, 6.43310546875, 6.956787109375, 7.48046875, 8.004150390625, 8.52783203125, 9.051513671875, 9.5751953125, 10.098876953125, 10.62255859375, 11.146240234375, 11.669921875, 12.193603515625, 12.71728515625, 13.240966796875, 13.7646484375, 14.288330078125, 14.81201171875, 15.335693359375, 15.859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 8.0, 7.0, 7.0, 11.0, 21.0, 24.0, 32.0, 57.0, 82.0, 140.0, 183.0, 297.0, 532.0, 1012.0, 1987.0, 3981.0, 9100.0, 24289.0, 80722.0, 492804.0, 319636.0, 74227.0, 22978.0, 8610.0, 3681.0, 1840.0, 941.0, 504.0, 253.0, 184.0, 133.0, 76.0, 47.0, 37.0, 21.0, 17.0, 13.0, 11.0, 11.0, 6.0, 10.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.818359375, -3.70916748046875, -3.5999755859375, -3.49078369140625, -3.381591796875, -3.27239990234375, -3.1632080078125, -3.05401611328125, -2.94482421875, -2.83563232421875, -2.7264404296875, -2.61724853515625, -2.508056640625, -2.39886474609375, -2.2896728515625, -2.18048095703125, -2.0712890625, -1.96209716796875, -1.8529052734375, -1.74371337890625, -1.634521484375, -1.52532958984375, -1.4161376953125, -1.30694580078125, -1.19775390625, -1.08856201171875, -0.9793701171875, -0.87017822265625, -0.760986328125, -0.65179443359375, -0.5426025390625, -0.43341064453125, -0.32421875, -0.21502685546875, -0.1058349609375, 0.00335693359375, 0.112548828125, 0.22174072265625, 0.3309326171875, 0.44012451171875, 0.54931640625, 0.65850830078125, 0.7677001953125, 0.87689208984375, 0.986083984375, 1.09527587890625, 1.2044677734375, 1.31365966796875, 1.4228515625, 1.53204345703125, 1.6412353515625, 1.75042724609375, 1.859619140625, 1.96881103515625, 2.0780029296875, 2.18719482421875, 2.29638671875, 2.40557861328125, 2.5147705078125, 2.62396240234375, 2.733154296875, 2.84234619140625, 2.9515380859375, 3.06072998046875, 3.169921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 9.0, 11.0, 19.0, 16.0, 31.0, 31.0, 68.0, 103.0, 157.0, 150.0, 129.0, 94.0, 53.0, 40.0, 20.0, 21.0, 7.0, 7.0, 8.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017671585083007812, -0.0017026811838150024, -0.0016382038593292236, -0.0015737265348434448, -0.001509249210357666, -0.0014447718858718872, -0.0013802945613861084, -0.0013158172369003296, -0.0012513399124145508, -0.001186862587928772, -0.0011223852634429932, -0.0010579079389572144, -0.0009934306144714355, -0.0009289532899856567, -0.0008644759654998779, -0.0007999986410140991, -0.0007355213165283203, -0.0006710439920425415, -0.0006065666675567627, -0.0005420893430709839, -0.0004776120185852051, -0.00041313469409942627, -0.00034865736961364746, -0.00028418004512786865, -0.00021970272064208984, -0.00015522539615631104, -9.074807167053223e-05, -2.6270747184753418e-05, 3.820657730102539e-05, 0.0001026839017868042, 0.000167161226272583, 0.00023163855075836182, 0.0002961158752441406, 0.00036059319972991943, 0.00042507052421569824, 0.000489547848701477, 0.0005540251731872559, 0.0006185024976730347, 0.0006829798221588135, 0.0007474571466445923, 0.0008119344711303711, 0.0008764117956161499, 0.0009408891201019287, 0.0010053664445877075, 0.0010698437690734863, 0.0011343210935592651, 0.001198798418045044, 0.0012632757425308228, 0.0013277530670166016, 0.0013922303915023804, 0.0014567077159881592, 0.001521185040473938, 0.0015856623649597168, 0.0016501396894454956, 0.0017146170139312744, 0.0017790943384170532, 0.001843571662902832, 0.0019080489873886108, 0.0019725263118743896, 0.0020370036363601685, 0.0021014809608459473, 0.002165958285331726, 0.002230435609817505, 0.0022949129343032837, 0.0023593902587890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 10.0, 25.0, 28.0, 57.0, 129.0, 335.0, 848.0, 2970.0, 14304.0, 138289.0, 807201.0, 71848.0, 9207.0, 2152.0, 670.0, 242.0, 102.0, 65.0, 28.0, 16.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.1875, -8.9654541015625, -8.743408203125, -8.5213623046875, -8.29931640625, -8.0772705078125, -7.855224609375, -7.6331787109375, -7.4111328125, -7.1890869140625, -6.967041015625, -6.7449951171875, -6.52294921875, -6.3009033203125, -6.078857421875, -5.8568115234375, -5.634765625, -5.4127197265625, -5.190673828125, -4.9686279296875, -4.74658203125, -4.5245361328125, -4.302490234375, -4.0804443359375, -3.8583984375, -3.6363525390625, -3.414306640625, -3.1922607421875, -2.97021484375, -2.7481689453125, -2.526123046875, -2.3040771484375, -2.08203125, -1.8599853515625, -1.637939453125, -1.4158935546875, -1.19384765625, -0.9718017578125, -0.749755859375, -0.5277099609375, -0.3056640625, -0.0836181640625, 0.138427734375, 0.3604736328125, 0.58251953125, 0.8045654296875, 1.026611328125, 1.2486572265625, 1.470703125, 1.6927490234375, 1.914794921875, 2.1368408203125, 2.35888671875, 2.5809326171875, 2.802978515625, 3.0250244140625, 3.2470703125, 3.4691162109375, 3.691162109375, 3.9132080078125, 4.13525390625, 4.3572998046875, 4.579345703125, 4.8013916015625, 5.0234375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 9.0, 10.0, 17.0, 15.0, 31.0, 27.0, 37.0, 60.0, 73.0, 78.0, 83.0, 91.0, 99.0, 87.0, 48.0, 45.0, 28.0, 38.0, 28.0, 17.0, 12.0, 13.0, 6.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.7388916015625, -4.583251953125, -4.4276123046875, -4.27197265625, -4.1163330078125, -3.960693359375, -3.8050537109375, -3.6494140625, -3.4937744140625, -3.338134765625, -3.1824951171875, -3.02685546875, -2.8712158203125, -2.715576171875, -2.5599365234375, -2.404296875, -2.2486572265625, -2.093017578125, -1.9373779296875, -1.78173828125, -1.6260986328125, -1.470458984375, -1.3148193359375, -1.1591796875, -1.0035400390625, -0.847900390625, -0.6922607421875, -0.53662109375, -0.3809814453125, -0.225341796875, -0.0697021484375, 0.0859375, 0.2415771484375, 0.397216796875, 0.5528564453125, 0.70849609375, 0.8641357421875, 1.019775390625, 1.1754150390625, 1.3310546875, 1.4866943359375, 1.642333984375, 1.7979736328125, 1.95361328125, 2.1092529296875, 2.264892578125, 2.4205322265625, 2.576171875, 2.7318115234375, 2.887451171875, 3.0430908203125, 3.19873046875, 3.3543701171875, 3.510009765625, 3.6656494140625, 3.8212890625, 3.9769287109375, 4.132568359375, 4.2882080078125, 4.44384765625, 4.5994873046875, 4.755126953125, 4.9107666015625, 5.06640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 14.0, 25.0, 56.0, 104.0, 256.0, 263.0, 135.0, 55.0, 33.0, 19.0, 12.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4195327758789, -60.40513610839844, -56.39073944091797, -52.3763427734375, -48.36194610595703, -44.34754943847656, -40.333152770996094, -36.318756103515625, -32.304359436035156, -28.289962768554688, -24.27556610107422, -20.26116943359375, -16.24677276611328, -12.232376098632812, -8.217979431152344, -4.203582763671875, -0.18918609619140625, 3.8252105712890625, 7.839607238769531, 11.85400390625, 15.868400573730469, 19.882797241210938, 23.897193908691406, 27.911590576171875, 31.925987243652344, 35.94038391113281, 39.95478057861328, 43.96917724609375, 47.98357391357422, 51.99797058105469, 56.012367248535156, 60.026763916015625, 64.04116821289062, 68.0555648803711, 72.06996154785156, 76.08435821533203, 80.0987548828125, 84.11315155029297, 88.12754821777344, 92.1419448852539, 96.15634155273438, 100.17073822021484, 104.18513488769531, 108.19953155517578, 112.21392822265625, 116.22832489013672, 120.24272155761719, 124.25711822509766, 128.27151489257812, 132.28591918945312, 136.30030822753906, 140.314697265625, 144.3291015625, 148.343505859375, 152.35789489746094, 156.37228393554688, 160.38668823242188, 164.40109252929688, 168.4154815673828, 172.42987060546875, 176.44427490234375, 180.45867919921875, 184.4730682373047, 188.48745727539062, 192.50186157226562]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 8.0, 4.0, 10.0, 16.0, 19.0, 16.0, 23.0, 17.0, 21.0, 32.0, 29.0, 27.0, 43.0, 52.0, 81.0, 86.0, 75.0, 65.0, 46.0, 40.0, 37.0, 39.0, 30.0, 29.0, 25.0, 21.0, 6.0, 17.0, 10.0, 11.0, 18.0, 11.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.536033630371094, -56.27876281738281, -54.021488189697266, -51.764217376708984, -49.50694274902344, -47.249671936035156, -44.992401123046875, -42.735130310058594, -40.47785568237305, -38.220584869384766, -35.96331024169922, -33.70603942871094, -31.448766708374023, -29.19149398803711, -26.934223175048828, -24.676950454711914, -22.419677734375, -20.162405014038086, -17.905132293701172, -15.64786148071289, -13.390588760375977, -11.133316040039062, -8.876044273376465, -6.618772506713867, -4.361499786376953, -2.1042275428771973, 0.1530447006225586, 2.4103169441223145, 4.66758918762207, 6.924861907958984, 9.182133674621582, 11.43940544128418, 13.696685791015625, 15.953958511352539, 18.211231231689453, 20.468502044677734, 22.72577476501465, 24.983047485351562, 27.240318298339844, 29.497591018676758, 31.754863739013672, 34.01213455200195, 36.2694091796875, 38.52667999267578, 40.78395080566406, 43.04122543334961, 45.29849624633789, 47.55577087402344, 49.81304168701172, 52.0703125, 54.32758712768555, 56.58485794067383, 58.842132568359375, 61.099403381347656, 63.35667419433594, 65.61394500732422, 67.8712158203125, 70.12848663330078, 72.38575744628906, 74.64303588867188, 76.90030670166016, 79.15757751464844, 81.41484832763672, 83.672119140625, 85.92939758300781]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 14.0, 15.0, 13.0, 31.0, 47.0, 93.0, 117.0, 217.0, 430.0, 901.0, 1950.0, 4778.0, 13112.0, 51985.0, 340319.0, 2334943.0, 1250852.0, 151984.0, 28004.0, 8301.0, 3265.0, 1393.0, 685.0, 319.0, 198.0, 95.0, 64.0, 35.0, 25.0, 22.0, 16.0, 16.0, 3.0, 7.0, 1.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.74609375, -5.57611083984375, -5.4061279296875, -5.23614501953125, -5.066162109375, -4.89617919921875, -4.7261962890625, -4.55621337890625, -4.38623046875, -4.21624755859375, -4.0462646484375, -3.87628173828125, -3.706298828125, -3.53631591796875, -3.3663330078125, -3.19635009765625, -3.0263671875, -2.85638427734375, -2.6864013671875, -2.51641845703125, -2.346435546875, -2.17645263671875, -2.0064697265625, -1.83648681640625, -1.66650390625, -1.49652099609375, -1.3265380859375, -1.15655517578125, -0.986572265625, -0.81658935546875, -0.6466064453125, -0.47662353515625, -0.306640625, -0.13665771484375, 0.0333251953125, 0.20330810546875, 0.373291015625, 0.54327392578125, 0.7132568359375, 0.88323974609375, 1.05322265625, 1.22320556640625, 1.3931884765625, 1.56317138671875, 1.733154296875, 1.90313720703125, 2.0731201171875, 2.24310302734375, 2.4130859375, 2.58306884765625, 2.7530517578125, 2.92303466796875, 3.093017578125, 3.26300048828125, 3.4329833984375, 3.60296630859375, 3.77294921875, 3.94293212890625, 4.1129150390625, 4.28289794921875, 4.452880859375, 4.62286376953125, 4.7928466796875, 4.96282958984375, 5.1328125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 7.0, 3.0, 6.0, 7.0, 11.0, 11.0, 12.0, 12.0, 17.0, 16.0, 18.0, 19.0, 25.0, 37.0, 33.0, 37.0, 37.0, 47.0, 46.0, 31.0, 57.0, 55.0, 49.0, 37.0, 33.0, 29.0, 29.0, 37.0, 35.0, 20.0, 25.0, 21.0, 25.0, 19.0, 14.0, 12.0, 13.0, 8.0, 10.0, 7.0, 13.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.619140625, -3.50701904296875, -3.3948974609375, -3.28277587890625, -3.170654296875, -3.05853271484375, -2.9464111328125, -2.83428955078125, -2.72216796875, -2.61004638671875, -2.4979248046875, -2.38580322265625, -2.273681640625, -2.16156005859375, -2.0494384765625, -1.93731689453125, -1.8251953125, -1.71307373046875, -1.6009521484375, -1.48883056640625, -1.376708984375, -1.26458740234375, -1.1524658203125, -1.04034423828125, -0.92822265625, -0.81610107421875, -0.7039794921875, -0.59185791015625, -0.479736328125, -0.36761474609375, -0.2554931640625, -0.14337158203125, -0.03125, 0.08087158203125, 0.1929931640625, 0.30511474609375, 0.417236328125, 0.52935791015625, 0.6414794921875, 0.75360107421875, 0.86572265625, 0.97784423828125, 1.0899658203125, 1.20208740234375, 1.314208984375, 1.42633056640625, 1.5384521484375, 1.65057373046875, 1.7626953125, 1.87481689453125, 1.9869384765625, 2.09906005859375, 2.211181640625, 2.32330322265625, 2.4354248046875, 2.54754638671875, 2.65966796875, 2.77178955078125, 2.8839111328125, 2.99603271484375, 3.108154296875, 3.22027587890625, 3.3323974609375, 3.44451904296875, 3.556640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 9.0, 6.0, 8.0, 12.0, 18.0, 25.0, 32.0, 63.0, 95.0, 127.0, 269.0, 582.0, 1721.0, 9652.0, 145235.0, 3883283.0, 141019.0, 9212.0, 1669.0, 565.0, 276.0, 146.0, 79.0, 46.0, 36.0, 34.0, 13.0, 13.0, 10.0, 10.0, 4.0, 5.0, 1.0, 4.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.6143798828125, -17.103759765625, -16.5931396484375, -16.08251953125, -15.5718994140625, -15.061279296875, -14.5506591796875, -14.0400390625, -13.5294189453125, -13.018798828125, -12.5081787109375, -11.99755859375, -11.4869384765625, -10.976318359375, -10.4656982421875, -9.955078125, -9.4444580078125, -8.933837890625, -8.4232177734375, -7.91259765625, -7.4019775390625, -6.891357421875, -6.3807373046875, -5.8701171875, -5.3594970703125, -4.848876953125, -4.3382568359375, -3.82763671875, -3.3170166015625, -2.806396484375, -2.2957763671875, -1.78515625, -1.2745361328125, -0.763916015625, -0.2532958984375, 0.25732421875, 0.7679443359375, 1.278564453125, 1.7891845703125, 2.2998046875, 2.8104248046875, 3.321044921875, 3.8316650390625, 4.34228515625, 4.8529052734375, 5.363525390625, 5.8741455078125, 6.384765625, 6.8953857421875, 7.406005859375, 7.9166259765625, 8.42724609375, 8.9378662109375, 9.448486328125, 9.9591064453125, 10.4697265625, 10.9803466796875, 11.490966796875, 12.0015869140625, 12.51220703125, 13.0228271484375, 13.533447265625, 14.0440673828125, 14.5546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 7.0, 11.0, 11.0, 30.0, 43.0, 67.0, 93.0, 210.0, 493.0, 867.0, 1074.0, 591.0, 256.0, 144.0, 64.0, 35.0, 28.0, 19.0, 19.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.6060791015625, -14.165283203125, -13.7244873046875, -13.28369140625, -12.8428955078125, -12.402099609375, -11.9613037109375, -11.5205078125, -11.0797119140625, -10.638916015625, -10.1981201171875, -9.75732421875, -9.3165283203125, -8.875732421875, -8.4349365234375, -7.994140625, -7.5533447265625, -7.112548828125, -6.6717529296875, -6.23095703125, -5.7901611328125, -5.349365234375, -4.9085693359375, -4.4677734375, -4.0269775390625, -3.586181640625, -3.1453857421875, -2.70458984375, -2.2637939453125, -1.822998046875, -1.3822021484375, -0.94140625, -0.5006103515625, -0.059814453125, 0.3809814453125, 0.82177734375, 1.2625732421875, 1.703369140625, 2.1441650390625, 2.5849609375, 3.0257568359375, 3.466552734375, 3.9073486328125, 4.34814453125, 4.7889404296875, 5.229736328125, 5.6705322265625, 6.111328125, 6.5521240234375, 6.992919921875, 7.4337158203125, 7.87451171875, 8.3153076171875, 8.756103515625, 9.1968994140625, 9.6376953125, 10.0784912109375, 10.519287109375, 10.9600830078125, 11.40087890625, 11.8416748046875, 12.282470703125, 12.7232666015625, 13.1640625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 10.0, 18.0, 61.0, 185.0, 351.0, 268.0, 74.0, 21.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.16326141357422, -108.63911437988281, -103.11497497558594, -97.59082794189453, -92.06668853759766, -86.54254150390625, -81.01840209960938, -75.49425506591797, -69.97010803222656, -64.44596099853516, -58.92182159423828, -53.397674560546875, -47.87353515625, -42.349388122558594, -36.82524490356445, -31.301101684570312, -25.776962280273438, -20.252819061279297, -14.72867488861084, -9.204530715942383, -3.680387496948242, 1.8437557220458984, 7.367900848388672, 12.892044067382812, 18.416187286376953, 23.940330505371094, 29.464473724365234, 34.988616943359375, 40.51276397705078, 46.036903381347656, 51.56105041503906, 57.0851936340332, 62.609344482421875, 68.13349151611328, 73.65763092041016, 79.18177795410156, 84.70591735839844, 90.23006439208984, 95.75421142578125, 101.27835083007812, 106.802490234375, 112.3266372680664, 117.85077667236328, 123.37492370605469, 128.89906311035156, 134.42320251464844, 139.94735717773438, 145.47149658203125, 150.99563598632812, 156.519775390625, 162.04393005371094, 167.5680694580078, 173.0922088623047, 178.61634826660156, 184.1405029296875, 189.66464233398438, 195.1887969970703, 200.7129364013672, 206.23709106445312, 211.76123046875, 217.28536987304688, 222.80950927734375, 228.3336639404297, 233.85780334472656, 239.38194274902344]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 8.0, 20.0, 24.0, 26.0, 33.0, 35.0, 38.0, 45.0, 44.0, 49.0, 67.0, 72.0, 69.0, 61.0, 60.0, 40.0, 48.0, 42.0, 50.0, 32.0, 21.0, 20.0, 12.0, 16.0, 9.0, 8.0, 4.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-61.8324089050293, -60.15514373779297, -58.47787857055664, -56.80061340332031, -55.123348236083984, -53.446083068847656, -51.76881408691406, -50.091552734375, -48.414283752441406, -46.73701858520508, -45.05975341796875, -43.38248825073242, -41.705223083496094, -40.027957916259766, -38.35069274902344, -36.673423767089844, -34.99616241455078, -33.31889724731445, -31.641632080078125, -29.964366912841797, -28.28710174560547, -26.60983657836914, -24.93256950378418, -23.25530433654785, -21.578039169311523, -19.900774002075195, -18.223508834838867, -16.546241760253906, -14.868977546691895, -13.191712379455566, -11.514446258544922, -9.837181091308594, -8.159915924072266, -6.4826507568359375, -4.805385112762451, -3.128119468688965, -1.4508543014526367, 0.2264108657836914, 1.903676986694336, 3.580942153930664, 5.258207321166992, 6.93547248840332, 8.612737655639648, 10.290003776550293, 11.967268943786621, 13.64453411102295, 15.321800231933594, 16.999065399169922, 18.67633056640625, 20.353595733642578, 22.030860900878906, 23.708126068115234, 25.385391235351562, 27.06265640258789, 28.73992347717285, 30.41718864440918, 32.094451904296875, 33.7717170715332, 35.44898223876953, 37.12624740600586, 38.80351257324219, 40.480777740478516, 42.158042907714844, 43.83531188964844, 45.512577056884766]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 6.0, 8.0, 7.0, 9.0, 14.0, 16.0, 20.0, 39.0, 51.0, 72.0, 111.0, 179.0, 269.0, 477.0, 840.0, 1564.0, 3037.0, 6077.0, 12965.0, 30549.0, 74865.0, 194597.0, 355707.0, 219456.0, 85099.0, 34138.0, 14578.0, 6674.0, 3191.0, 1663.0, 848.0, 543.0, 290.0, 194.0, 123.0, 73.0, 58.0, 40.0, 33.0, 19.0, 14.0, 8.0, 6.0, 5.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.40625, -6.20953369140625, -6.0128173828125, -5.81610107421875, -5.619384765625, -5.42266845703125, -5.2259521484375, -5.02923583984375, -4.83251953125, -4.63580322265625, -4.4390869140625, -4.24237060546875, -4.045654296875, -3.84893798828125, -3.6522216796875, -3.45550537109375, -3.2587890625, -3.06207275390625, -2.8653564453125, -2.66864013671875, -2.471923828125, -2.27520751953125, -2.0784912109375, -1.88177490234375, -1.68505859375, -1.48834228515625, -1.2916259765625, -1.09490966796875, -0.898193359375, -0.70147705078125, -0.5047607421875, -0.30804443359375, -0.111328125, 0.08538818359375, 0.2821044921875, 0.47882080078125, 0.675537109375, 0.87225341796875, 1.0689697265625, 1.26568603515625, 1.46240234375, 1.65911865234375, 1.8558349609375, 2.05255126953125, 2.249267578125, 2.44598388671875, 2.6427001953125, 2.83941650390625, 3.0361328125, 3.23284912109375, 3.4295654296875, 3.62628173828125, 3.822998046875, 4.01971435546875, 4.2164306640625, 4.41314697265625, 4.60986328125, 4.80657958984375, 5.0032958984375, 5.20001220703125, 5.396728515625, 5.59344482421875, 5.7901611328125, 5.98687744140625, 6.18359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 5.0, 7.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 11.0, 9.0, 12.0, 6.0, 14.0, 14.0, 13.0, 25.0, 34.0, 26.0, 32.0, 37.0, 37.0, 40.0, 49.0, 51.0, 46.0, 51.0, 48.0, 32.0, 45.0, 38.0, 30.0, 31.0, 29.0, 28.0, 28.0, 26.0, 15.0, 25.0, 20.0, 5.0, 17.0, 9.0, 9.0, 9.0, 10.0, 4.0, 4.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.376953125, -3.26318359375, -3.1494140625, -3.03564453125, -2.921875, -2.80810546875, -2.6943359375, -2.58056640625, -2.466796875, -2.35302734375, -2.2392578125, -2.12548828125, -2.01171875, -1.89794921875, -1.7841796875, -1.67041015625, -1.556640625, -1.44287109375, -1.3291015625, -1.21533203125, -1.1015625, -0.98779296875, -0.8740234375, -0.76025390625, -0.646484375, -0.53271484375, -0.4189453125, -0.30517578125, -0.19140625, -0.07763671875, 0.0361328125, 0.14990234375, 0.263671875, 0.37744140625, 0.4912109375, 0.60498046875, 0.71875, 0.83251953125, 0.9462890625, 1.06005859375, 1.173828125, 1.28759765625, 1.4013671875, 1.51513671875, 1.62890625, 1.74267578125, 1.8564453125, 1.97021484375, 2.083984375, 2.19775390625, 2.3115234375, 2.42529296875, 2.5390625, 2.65283203125, 2.7666015625, 2.88037109375, 2.994140625, 3.10791015625, 3.2216796875, 3.33544921875, 3.44921875, 3.56298828125, 3.6767578125, 3.79052734375, 3.904296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 13.0, 19.0, 30.0, 51.0, 68.0, 116.0, 146.0, 265.0, 465.0, 923.0, 1978.0, 5253.0, 19303.0, 109912.0, 734054.0, 142329.0, 23070.0, 6025.0, 2225.0, 972.0, 509.0, 289.0, 162.0, 111.0, 72.0, 53.0, 29.0, 25.0, 21.0, 10.0, 11.0, 9.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8984375, -12.5023193359375, -12.106201171875, -11.7100830078125, -11.31396484375, -10.9178466796875, -10.521728515625, -10.1256103515625, -9.7294921875, -9.3333740234375, -8.937255859375, -8.5411376953125, -8.14501953125, -7.7489013671875, -7.352783203125, -6.9566650390625, -6.560546875, -6.1644287109375, -5.768310546875, -5.3721923828125, -4.97607421875, -4.5799560546875, -4.183837890625, -3.7877197265625, -3.3916015625, -2.9954833984375, -2.599365234375, -2.2032470703125, -1.80712890625, -1.4110107421875, -1.014892578125, -0.6187744140625, -0.22265625, 0.1734619140625, 0.569580078125, 0.9656982421875, 1.36181640625, 1.7579345703125, 2.154052734375, 2.5501708984375, 2.9462890625, 3.3424072265625, 3.738525390625, 4.1346435546875, 4.53076171875, 4.9268798828125, 5.322998046875, 5.7191162109375, 6.115234375, 6.5113525390625, 6.907470703125, 7.3035888671875, 7.69970703125, 8.0958251953125, 8.491943359375, 8.8880615234375, 9.2841796875, 9.6802978515625, 10.076416015625, 10.4725341796875, 10.86865234375, 11.2647705078125, 11.660888671875, 12.0570068359375, 12.453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 9.0, 9.0, 15.0, 23.0, 22.0, 32.0, 23.0, 37.0, 47.0, 67.0, 59.0, 75.0, 60.0, 77.0, 60.0, 55.0, 55.0, 49.0, 42.0, 36.0, 34.0, 19.0, 14.0, 19.0, 9.0, 10.0, 5.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.90625, -14.31201171875, -13.7177734375, -13.12353515625, -12.529296875, -11.93505859375, -11.3408203125, -10.74658203125, -10.15234375, -9.55810546875, -8.9638671875, -8.36962890625, -7.775390625, -7.18115234375, -6.5869140625, -5.99267578125, -5.3984375, -4.80419921875, -4.2099609375, -3.61572265625, -3.021484375, -2.42724609375, -1.8330078125, -1.23876953125, -0.64453125, -0.05029296875, 0.5439453125, 1.13818359375, 1.732421875, 2.32666015625, 2.9208984375, 3.51513671875, 4.109375, 4.70361328125, 5.2978515625, 5.89208984375, 6.486328125, 7.08056640625, 7.6748046875, 8.26904296875, 8.86328125, 9.45751953125, 10.0517578125, 10.64599609375, 11.240234375, 11.83447265625, 12.4287109375, 13.02294921875, 13.6171875, 14.21142578125, 14.8056640625, 15.39990234375, 15.994140625, 16.58837890625, 17.1826171875, 17.77685546875, 18.37109375, 18.96533203125, 19.5595703125, 20.15380859375, 20.748046875, 21.34228515625, 21.9365234375, 22.53076171875, 23.125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 8.0, 7.0, 12.0, 15.0, 29.0, 25.0, 56.0, 51.0, 102.0, 137.0, 206.0, 315.0, 547.0, 1016.0, 2062.0, 4618.0, 11028.0, 30268.0, 100715.0, 609571.0, 204253.0, 52778.0, 17702.0, 6729.0, 2931.0, 1376.0, 744.0, 473.0, 256.0, 182.0, 89.0, 82.0, 45.0, 31.0, 26.0, 14.0, 11.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.876953125, -2.79168701171875, -2.7064208984375, -2.62115478515625, -2.535888671875, -2.45062255859375, -2.3653564453125, -2.28009033203125, -2.19482421875, -2.10955810546875, -2.0242919921875, -1.93902587890625, -1.853759765625, -1.76849365234375, -1.6832275390625, -1.59796142578125, -1.5126953125, -1.42742919921875, -1.3421630859375, -1.25689697265625, -1.171630859375, -1.08636474609375, -1.0010986328125, -0.91583251953125, -0.83056640625, -0.74530029296875, -0.6600341796875, -0.57476806640625, -0.489501953125, -0.40423583984375, -0.3189697265625, -0.23370361328125, -0.1484375, -0.06317138671875, 0.0220947265625, 0.10736083984375, 0.192626953125, 0.27789306640625, 0.3631591796875, 0.44842529296875, 0.53369140625, 0.61895751953125, 0.7042236328125, 0.78948974609375, 0.874755859375, 0.96002197265625, 1.0452880859375, 1.13055419921875, 1.2158203125, 1.30108642578125, 1.3863525390625, 1.47161865234375, 1.556884765625, 1.64215087890625, 1.7274169921875, 1.81268310546875, 1.89794921875, 1.98321533203125, 2.0684814453125, 2.15374755859375, 2.239013671875, 2.32427978515625, 2.4095458984375, 2.49481201171875, 2.580078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 9.0, 6.0, 4.0, 7.0, 8.0, 12.0, 17.0, 28.0, 24.0, 27.0, 30.0, 29.0, 45.0, 49.0, 87.0, 100.0, 112.0, 90.0, 52.0, 52.0, 34.0, 30.0, 21.0, 20.0, 16.0, 16.0, 10.0, 8.0, 4.0, 11.0, 3.0, 6.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00098419189453125, -0.0009525120258331299, -0.0009208321571350098, -0.0008891522884368896, -0.0008574724197387695, -0.0008257925510406494, -0.0007941126823425293, -0.0007624328136444092, -0.0007307529449462891, -0.0006990730762481689, -0.0006673932075500488, -0.0006357133388519287, -0.0006040334701538086, -0.0005723536014556885, -0.0005406737327575684, -0.0005089938640594482, -0.0004773139953613281, -0.000445634126663208, -0.0004139542579650879, -0.0003822743892669678, -0.00035059452056884766, -0.00031891465187072754, -0.0002872347831726074, -0.0002555549144744873, -0.0002238750457763672, -0.00019219517707824707, -0.00016051530838012695, -0.00012883543968200684, -9.715557098388672e-05, -6.54757022857666e-05, -3.3795833587646484e-05, -2.115964889526367e-06, 2.956390380859375e-05, 6.124377250671387e-05, 9.292364120483398e-05, 0.0001246035099029541, 0.00015628337860107422, 0.00018796324729919434, 0.00021964311599731445, 0.00025132298469543457, 0.0002830028533935547, 0.0003146827220916748, 0.0003463625907897949, 0.00037804245948791504, 0.00040972232818603516, 0.0004414021968841553, 0.0004730820655822754, 0.0005047619342803955, 0.0005364418029785156, 0.0005681216716766357, 0.0005998015403747559, 0.000631481409072876, 0.0006631612777709961, 0.0006948411464691162, 0.0007265210151672363, 0.0007582008838653564, 0.0007898807525634766, 0.0008215606212615967, 0.0008532404899597168, 0.0008849203586578369, 0.000916600227355957, 0.0009482800960540771, 0.0009799599647521973, 0.0010116398334503174, 0.0010433197021484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 10.0, 20.0, 28.0, 36.0, 44.0, 76.0, 125.0, 169.0, 267.0, 505.0, 866.0, 1683.0, 3870.0, 9939.0, 31401.0, 127411.0, 664482.0, 151795.0, 35965.0, 11319.0, 4283.0, 1940.0, 944.0, 544.0, 282.0, 219.0, 101.0, 88.0, 48.0, 28.0, 18.0, 15.0, 8.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.47265625, -3.38018798828125, -3.2877197265625, -3.19525146484375, -3.102783203125, -3.01031494140625, -2.9178466796875, -2.82537841796875, -2.73291015625, -2.64044189453125, -2.5479736328125, -2.45550537109375, -2.363037109375, -2.27056884765625, -2.1781005859375, -2.08563232421875, -1.9931640625, -1.90069580078125, -1.8082275390625, -1.71575927734375, -1.623291015625, -1.53082275390625, -1.4383544921875, -1.34588623046875, -1.25341796875, -1.16094970703125, -1.0684814453125, -0.97601318359375, -0.883544921875, -0.79107666015625, -0.6986083984375, -0.60614013671875, -0.513671875, -0.42120361328125, -0.3287353515625, -0.23626708984375, -0.143798828125, -0.05133056640625, 0.0411376953125, 0.13360595703125, 0.22607421875, 0.31854248046875, 0.4110107421875, 0.50347900390625, 0.595947265625, 0.68841552734375, 0.7808837890625, 0.87335205078125, 0.9658203125, 1.05828857421875, 1.1507568359375, 1.24322509765625, 1.335693359375, 1.42816162109375, 1.5206298828125, 1.61309814453125, 1.70556640625, 1.79803466796875, 1.8905029296875, 1.98297119140625, 2.075439453125, 2.16790771484375, 2.2603759765625, 2.35284423828125, 2.4453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 8.0, 9.0, 11.0, 14.0, 24.0, 20.0, 37.0, 40.0, 48.0, 63.0, 67.0, 91.0, 92.0, 87.0, 55.0, 82.0, 40.0, 32.0, 29.0, 23.0, 17.0, 19.0, 15.0, 14.0, 7.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6953125, -2.593475341796875, -2.49163818359375, -2.389801025390625, -2.2879638671875, -2.186126708984375, -2.08428955078125, -1.982452392578125, -1.880615234375, -1.778778076171875, -1.67694091796875, -1.575103759765625, -1.4732666015625, -1.371429443359375, -1.26959228515625, -1.167755126953125, -1.06591796875, -0.964080810546875, -0.86224365234375, -0.760406494140625, -0.6585693359375, -0.556732177734375, -0.45489501953125, -0.353057861328125, -0.251220703125, -0.149383544921875, -0.04754638671875, 0.054290771484375, 0.1561279296875, 0.257965087890625, 0.35980224609375, 0.461639404296875, 0.5634765625, 0.665313720703125, 0.76715087890625, 0.868988037109375, 0.9708251953125, 1.072662353515625, 1.17449951171875, 1.276336669921875, 1.378173828125, 1.480010986328125, 1.58184814453125, 1.683685302734375, 1.7855224609375, 1.887359619140625, 1.98919677734375, 2.091033935546875, 2.19287109375, 2.294708251953125, 2.39654541015625, 2.498382568359375, 2.6002197265625, 2.702056884765625, 2.80389404296875, 2.905731201171875, 3.007568359375, 3.109405517578125, 3.21124267578125, 3.313079833984375, 3.4149169921875, 3.516754150390625, 3.61859130859375, 3.720428466796875, 3.822265625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 28.0, 58.0, 97.0, 257.0, 333.0, 126.0, 48.0, 24.0, 11.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-198.7899169921875, -194.7440643310547, -190.69821166992188, -186.65234375, -182.6064910888672, -178.56063842773438, -174.51478576660156, -170.46893310546875, -166.42306518554688, -162.37721252441406, -158.33135986328125, -154.28549194335938, -150.23963928222656, -146.19378662109375, -142.14793395996094, -138.10208129882812, -134.0562286376953, -130.0103759765625, -125.96451568603516, -121.91866302490234, -117.872802734375, -113.82695007324219, -109.78109741210938, -105.73524475097656, -101.68938446044922, -97.6435317993164, -93.59767150878906, -89.55181884765625, -85.50596618652344, -81.4601058959961, -77.41425323486328, -73.36839294433594, -69.3225326538086, -65.27667999267578, -61.23081970214844, -57.184967041015625, -53.13911056518555, -49.09325408935547, -45.047401428222656, -41.00154495239258, -36.9556884765625, -32.90983200073242, -28.863977432250977, -24.81812286376953, -20.772266387939453, -16.726409912109375, -12.68055534362793, -8.634700775146484, -4.588844299316406, -0.5429887771606445, 3.502866744995117, 7.548722267150879, 11.59457778930664, 15.640434265136719, 19.686288833618164, 23.73214340209961, 27.777999877929688, 31.823856353759766, 35.869712829589844, 39.915565490722656, 43.961421966552734, 48.00727844238281, 52.053131103515625, 56.0989875793457, 60.14484405517578]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 9.0, 11.0, 11.0, 13.0, 11.0, 9.0, 13.0, 31.0, 17.0, 25.0, 23.0, 27.0, 40.0, 51.0, 57.0, 98.0, 99.0, 74.0, 56.0, 28.0, 33.0, 35.0, 32.0, 25.0, 27.0, 14.0, 19.0, 12.0, 13.0, 9.0, 16.0, 10.0, 7.0, 8.0, 7.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.53459548950195, -48.74828338623047, -46.96196746826172, -45.175655364990234, -43.38934326171875, -41.60302734375, -39.816715240478516, -38.03040313720703, -36.24408721923828, -34.4577751159668, -32.67145919799805, -30.885147094726562, -29.098833084106445, -27.312519073486328, -25.526206970214844, -23.739892959594727, -21.953580856323242, -20.167266845703125, -18.38095474243164, -16.594640731811523, -14.808326721191406, -13.022013664245605, -11.235700607299805, -9.449386596679688, -7.663073539733887, -5.876760005950928, -4.090446472167969, -2.304133415222168, -0.517819881439209, 1.26849365234375, 3.054806709289551, 4.841120719909668, 6.627433776855469, 8.41374683380127, 10.200060844421387, 11.986373901367188, 13.772687911987305, 15.559000968933105, 17.345314025878906, 19.131628036499023, 20.91794204711914, 22.704256057739258, 24.490568161010742, 26.27688217163086, 28.063196182250977, 29.849510192871094, 31.635822296142578, 33.42213439941406, 35.20845031738281, 36.9947624206543, 38.78107833862305, 40.56739044189453, 42.353702545166016, 44.140018463134766, 45.92633056640625, 47.712646484375, 49.49895477294922, 51.2852668762207, 53.07158279418945, 54.85789489746094, 56.64420700073242, 58.43052291870117, 60.216835021972656, 62.003150939941406, 63.78946304321289]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 12.0, 13.0, 15.0, 35.0, 49.0, 81.0, 121.0, 162.0, 240.0, 349.0, 530.0, 851.0, 1522.0, 2719.0, 5261.0, 10573.0, 27429.0, 91223.0, 398150.0, 1616941.0, 1538567.0, 365669.0, 85613.0, 26222.0, 10494.0, 4956.0, 2630.0, 1473.0, 830.0, 566.0, 313.0, 222.0, 146.0, 103.0, 69.0, 44.0, 34.0, 15.0, 12.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-4.87890625, -4.7432861328125, -4.607666015625, -4.4720458984375, -4.33642578125, -4.2008056640625, -4.065185546875, -3.9295654296875, -3.7939453125, -3.6583251953125, -3.522705078125, -3.3870849609375, -3.25146484375, -3.1158447265625, -2.980224609375, -2.8446044921875, -2.708984375, -2.5733642578125, -2.437744140625, -2.3021240234375, -2.16650390625, -2.0308837890625, -1.895263671875, -1.7596435546875, -1.6240234375, -1.4884033203125, -1.352783203125, -1.2171630859375, -1.08154296875, -0.9459228515625, -0.810302734375, -0.6746826171875, -0.5390625, -0.4034423828125, -0.267822265625, -0.1322021484375, 0.00341796875, 0.1390380859375, 0.274658203125, 0.4102783203125, 0.5458984375, 0.6815185546875, 0.817138671875, 0.9527587890625, 1.08837890625, 1.2239990234375, 1.359619140625, 1.4952392578125, 1.630859375, 1.7664794921875, 1.902099609375, 2.0377197265625, 2.17333984375, 2.3089599609375, 2.444580078125, 2.5802001953125, 2.7158203125, 2.8514404296875, 2.987060546875, 3.1226806640625, 3.25830078125, 3.3939208984375, 3.529541015625, 3.6651611328125, 3.80078125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 2.0, 6.0, 5.0, 11.0, 9.0, 12.0, 13.0, 10.0, 15.0, 18.0, 27.0, 26.0, 31.0, 28.0, 36.0, 52.0, 58.0, 54.0, 56.0, 47.0, 49.0, 40.0, 45.0, 27.0, 39.0, 28.0, 28.0, 35.0, 37.0, 19.0, 26.0, 26.0, 15.0, 12.0, 12.0, 12.0, 8.0, 8.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.7535400390625, -3.632080078125, -3.5106201171875, -3.38916015625, -3.2677001953125, -3.146240234375, -3.0247802734375, -2.9033203125, -2.7818603515625, -2.660400390625, -2.5389404296875, -2.41748046875, -2.2960205078125, -2.174560546875, -2.0531005859375, -1.931640625, -1.8101806640625, -1.688720703125, -1.5672607421875, -1.44580078125, -1.3243408203125, -1.202880859375, -1.0814208984375, -0.9599609375, -0.8385009765625, -0.717041015625, -0.5955810546875, -0.47412109375, -0.3526611328125, -0.231201171875, -0.1097412109375, 0.01171875, 0.1331787109375, 0.254638671875, 0.3760986328125, 0.49755859375, 0.6190185546875, 0.740478515625, 0.8619384765625, 0.9833984375, 1.1048583984375, 1.226318359375, 1.3477783203125, 1.46923828125, 1.5906982421875, 1.712158203125, 1.8336181640625, 1.955078125, 2.0765380859375, 2.197998046875, 2.3194580078125, 2.44091796875, 2.5623779296875, 2.683837890625, 2.8052978515625, 2.9267578125, 3.0482177734375, 3.169677734375, 3.2911376953125, 3.41259765625, 3.5340576171875, 3.655517578125, 3.7769775390625, 3.8984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 8.0, 6.0, 11.0, 13.0, 19.0, 23.0, 36.0, 62.0, 75.0, 115.0, 145.0, 283.0, 593.0, 1507.0, 5542.0, 33799.0, 667842.0, 3376126.0, 92427.0, 11378.0, 2467.0, 881.0, 336.0, 188.0, 107.0, 76.0, 51.0, 40.0, 32.0, 15.0, 18.0, 9.0, 6.0, 12.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.87890625, -10.4296875, -9.98046875, -9.53125, -9.08203125, -8.6328125, -8.18359375, -7.734375, -7.28515625, -6.8359375, -6.38671875, -5.9375, -5.48828125, -5.0390625, -4.58984375, -4.140625, -3.69140625, -3.2421875, -2.79296875, -2.34375, -1.89453125, -1.4453125, -0.99609375, -0.546875, -0.09765625, 0.3515625, 0.80078125, 1.25, 1.69921875, 2.1484375, 2.59765625, 3.046875, 3.49609375, 3.9453125, 4.39453125, 4.84375, 5.29296875, 5.7421875, 6.19140625, 6.640625, 7.08984375, 7.5390625, 7.98828125, 8.4375, 8.88671875, 9.3359375, 9.78515625, 10.234375, 10.68359375, 11.1328125, 11.58203125, 12.03125, 12.48046875, 12.9296875, 13.37890625, 13.828125, 14.27734375, 14.7265625, 15.17578125, 15.625, 16.07421875, 16.5234375, 16.97265625, 17.421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 2.0, 7.0, 8.0, 10.0, 17.0, 18.0, 30.0, 46.0, 47.0, 70.0, 95.0, 152.0, 276.0, 420.0, 611.0, 765.0, 508.0, 327.0, 226.0, 141.0, 86.0, 63.0, 33.0, 29.0, 13.0, 12.0, 8.0, 15.0, 11.0, 4.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.8828125, -11.54638671875, -11.2099609375, -10.87353515625, -10.537109375, -10.20068359375, -9.8642578125, -9.52783203125, -9.19140625, -8.85498046875, -8.5185546875, -8.18212890625, -7.845703125, -7.50927734375, -7.1728515625, -6.83642578125, -6.5, -6.16357421875, -5.8271484375, -5.49072265625, -5.154296875, -4.81787109375, -4.4814453125, -4.14501953125, -3.80859375, -3.47216796875, -3.1357421875, -2.79931640625, -2.462890625, -2.12646484375, -1.7900390625, -1.45361328125, -1.1171875, -0.78076171875, -0.4443359375, -0.10791015625, 0.228515625, 0.56494140625, 0.9013671875, 1.23779296875, 1.57421875, 1.91064453125, 2.2470703125, 2.58349609375, 2.919921875, 3.25634765625, 3.5927734375, 3.92919921875, 4.265625, 4.60205078125, 4.9384765625, 5.27490234375, 5.611328125, 5.94775390625, 6.2841796875, 6.62060546875, 6.95703125, 7.29345703125, 7.6298828125, 7.96630859375, 8.302734375, 8.63916015625, 8.9755859375, 9.31201171875, 9.6484375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 17.0, 31.0, 60.0, 187.0, 315.0, 238.0, 97.0, 26.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.51271057128906, -169.1851043701172, -163.85748291015625, -158.52987670898438, -153.2022705078125, -147.87466430664062, -142.54705810546875, -137.2194366455078, -131.89183044433594, -126.56422424316406, -121.23661041259766, -115.90899658203125, -110.58139038085938, -105.2537841796875, -99.9261703491211, -94.59855651855469, -89.27095031738281, -83.94334411621094, -78.61573028564453, -73.28811645507812, -67.96051025390625, -62.63290023803711, -57.30529022216797, -51.97768020629883, -46.65007019042969, -41.32246017456055, -35.994850158691406, -30.667240142822266, -25.339630126953125, -20.012020111083984, -14.684410095214844, -9.356800079345703, -4.0291748046875, 1.2984352111816406, 6.626045227050781, 11.953655242919922, 17.281265258789062, 22.608875274658203, 27.936485290527344, 33.264095306396484, 38.591705322265625, 43.919315338134766, 49.246925354003906, 54.57453536987305, 59.90214538574219, 65.22975158691406, 70.55736541748047, 75.88497924804688, 81.21258544921875, 86.54019165039062, 91.86780548095703, 97.19541931152344, 102.52302551269531, 107.85063171386719, 113.1782455444336, 118.505859375, 123.83346557617188, 129.16107177734375, 134.48867797851562, 139.81629943847656, 145.14390563964844, 150.4715118408203, 155.79913330078125, 161.12673950195312, 166.454345703125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 9.0, 10.0, 20.0, 4.0, 21.0, 18.0, 25.0, 18.0, 25.0, 19.0, 23.0, 31.0, 45.0, 44.0, 55.0, 51.0, 41.0, 46.0, 44.0, 42.0, 24.0, 42.0, 40.0, 39.0, 35.0, 33.0, 23.0, 17.0, 20.0, 14.0, 13.0, 13.0, 18.0, 18.0, 13.0, 8.0, 8.0, 1.0, 1.0, 10.0, 7.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-43.146690368652344, -41.7572135925293, -40.36773681640625, -38.9782600402832, -37.588783264160156, -36.19930648803711, -34.80982971191406, -33.42034912109375, -32.03087615966797, -30.641399383544922, -29.251922607421875, -27.862445831298828, -26.47296905517578, -25.083492279052734, -23.694013595581055, -22.304536819458008, -20.915058135986328, -19.52558135986328, -18.136104583740234, -16.746627807617188, -15.357150077819824, -13.967673301696777, -12.578195571899414, -11.188718795776367, -9.79924201965332, -8.409765243530273, -7.020287990570068, -5.630810737609863, -4.241333961486816, -2.8518571853637695, -1.4623794555664062, -0.07290267944335938, 1.3165779113769531, 2.706054925918579, 4.095531940460205, 5.48500919342041, 6.874485969543457, 8.263962745666504, 9.653440475463867, 11.042917251586914, 12.432394027709961, 13.821870803833008, 15.211347579956055, 16.600826263427734, 17.99030303955078, 19.379779815673828, 20.769256591796875, 22.158733367919922, 23.54821014404297, 24.937686920166016, 26.327163696289062, 27.71664047241211, 29.106117248535156, 30.495594024658203, 31.885072708129883, 33.27455139160156, 34.664024353027344, 36.05350112915039, 37.44297790527344, 38.832454681396484, 40.22193145751953, 41.61140823364258, 43.000885009765625, 44.39036560058594, 45.779842376708984]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 8.0, 5.0, 9.0, 10.0, 18.0, 12.0, 29.0, 52.0, 88.0, 161.0, 236.0, 500.0, 928.0, 1872.0, 3891.0, 8327.0, 19187.0, 48957.0, 139289.0, 380976.0, 287464.0, 95005.0, 34774.0, 14222.0, 6472.0, 2870.0, 1429.0, 791.0, 402.0, 221.0, 134.0, 79.0, 48.0, 37.0, 20.0, 13.0, 10.0, 3.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.5526123046875, -6.308349609375, -6.0640869140625, -5.81982421875, -5.5755615234375, -5.331298828125, -5.0870361328125, -4.8427734375, -4.5985107421875, -4.354248046875, -4.1099853515625, -3.86572265625, -3.6214599609375, -3.377197265625, -3.1329345703125, -2.888671875, -2.6444091796875, -2.400146484375, -2.1558837890625, -1.91162109375, -1.6673583984375, -1.423095703125, -1.1788330078125, -0.9345703125, -0.6903076171875, -0.446044921875, -0.2017822265625, 0.04248046875, 0.2867431640625, 0.531005859375, 0.7752685546875, 1.01953125, 1.2637939453125, 1.508056640625, 1.7523193359375, 1.99658203125, 2.2408447265625, 2.485107421875, 2.7293701171875, 2.9736328125, 3.2178955078125, 3.462158203125, 3.7064208984375, 3.95068359375, 4.1949462890625, 4.439208984375, 4.6834716796875, 4.927734375, 5.1719970703125, 5.416259765625, 5.6605224609375, 5.90478515625, 6.1490478515625, 6.393310546875, 6.6375732421875, 6.8818359375, 7.1260986328125, 7.370361328125, 7.6146240234375, 7.85888671875, 8.1031494140625, 8.347412109375, 8.5916748046875, 8.8359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 9.0, 6.0, 10.0, 12.0, 18.0, 25.0, 23.0, 27.0, 29.0, 40.0, 39.0, 40.0, 43.0, 46.0, 67.0, 66.0, 56.0, 44.0, 47.0, 48.0, 51.0, 35.0, 32.0, 31.0, 23.0, 31.0, 19.0, 17.0, 13.0, 13.0, 10.0, 3.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.1944580078125, -4.045166015625, -3.8958740234375, -3.74658203125, -3.5972900390625, -3.447998046875, -3.2987060546875, -3.1494140625, -3.0001220703125, -2.850830078125, -2.7015380859375, -2.55224609375, -2.4029541015625, -2.253662109375, -2.1043701171875, -1.955078125, -1.8057861328125, -1.656494140625, -1.5072021484375, -1.35791015625, -1.2086181640625, -1.059326171875, -0.9100341796875, -0.7607421875, -0.6114501953125, -0.462158203125, -0.3128662109375, -0.16357421875, -0.0142822265625, 0.135009765625, 0.2843017578125, 0.43359375, 0.5828857421875, 0.732177734375, 0.8814697265625, 1.03076171875, 1.1800537109375, 1.329345703125, 1.4786376953125, 1.6279296875, 1.7772216796875, 1.926513671875, 2.0758056640625, 2.22509765625, 2.3743896484375, 2.523681640625, 2.6729736328125, 2.822265625, 2.9715576171875, 3.120849609375, 3.2701416015625, 3.41943359375, 3.5687255859375, 3.718017578125, 3.8673095703125, 4.0166015625, 4.1658935546875, 4.315185546875, 4.4644775390625, 4.61376953125, 4.7630615234375, 4.912353515625, 5.0616455078125, 5.2109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 7.0, 3.0, 12.0, 15.0, 25.0, 33.0, 54.0, 66.0, 97.0, 145.0, 205.0, 353.0, 559.0, 984.0, 2008.0, 5077.0, 18508.0, 124400.0, 785937.0, 87182.0, 14479.0, 4295.0, 1828.0, 873.0, 486.0, 296.0, 191.0, 128.0, 95.0, 62.0, 38.0, 32.0, 28.0, 15.0, 11.0, 5.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.5390625, -14.090576171875, -13.64208984375, -13.193603515625, -12.7451171875, -12.296630859375, -11.84814453125, -11.399658203125, -10.951171875, -10.502685546875, -10.05419921875, -9.605712890625, -9.1572265625, -8.708740234375, -8.26025390625, -7.811767578125, -7.36328125, -6.914794921875, -6.46630859375, -6.017822265625, -5.5693359375, -5.120849609375, -4.67236328125, -4.223876953125, -3.775390625, -3.326904296875, -2.87841796875, -2.429931640625, -1.9814453125, -1.532958984375, -1.08447265625, -0.635986328125, -0.1875, 0.260986328125, 0.70947265625, 1.157958984375, 1.6064453125, 2.054931640625, 2.50341796875, 2.951904296875, 3.400390625, 3.848876953125, 4.29736328125, 4.745849609375, 5.1943359375, 5.642822265625, 6.09130859375, 6.539794921875, 6.98828125, 7.436767578125, 7.88525390625, 8.333740234375, 8.7822265625, 9.230712890625, 9.67919921875, 10.127685546875, 10.576171875, 11.024658203125, 11.47314453125, 11.921630859375, 12.3701171875, 12.818603515625, 13.26708984375, 13.715576171875, 14.1640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 12.0, 19.0, 8.0, 19.0, 18.0, 20.0, 31.0, 33.0, 40.0, 38.0, 48.0, 48.0, 60.0, 54.0, 63.0, 79.0, 51.0, 52.0, 49.0, 42.0, 22.0, 33.0, 24.0, 25.0, 17.0, 13.0, 9.0, 11.0, 8.0, 10.0, 3.0, 5.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.5703125, -13.984375, -13.3984375, -12.8125, -12.2265625, -11.640625, -11.0546875, -10.46875, -9.8828125, -9.296875, -8.7109375, -8.125, -7.5390625, -6.953125, -6.3671875, -5.78125, -5.1953125, -4.609375, -4.0234375, -3.4375, -2.8515625, -2.265625, -1.6796875, -1.09375, -0.5078125, 0.078125, 0.6640625, 1.25, 1.8359375, 2.421875, 3.0078125, 3.59375, 4.1796875, 4.765625, 5.3515625, 5.9375, 6.5234375, 7.109375, 7.6953125, 8.28125, 8.8671875, 9.453125, 10.0390625, 10.625, 11.2109375, 11.796875, 12.3828125, 12.96875, 13.5546875, 14.140625, 14.7265625, 15.3125, 15.8984375, 16.484375, 17.0703125, 17.65625, 18.2421875, 18.828125, 19.4140625, 20.0, 20.5859375, 21.171875, 21.7578125, 22.34375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 2.0, 13.0, 8.0, 20.0, 15.0, 34.0, 28.0, 73.0, 104.0, 218.0, 497.0, 1129.0, 3582.0, 15771.0, 113910.0, 807367.0, 87716.0, 12971.0, 3169.0, 1016.0, 420.0, 183.0, 88.0, 67.0, 52.0, 29.0, 20.0, 15.0, 19.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7421875, -4.612060546875, -4.48193359375, -4.351806640625, -4.2216796875, -4.091552734375, -3.96142578125, -3.831298828125, -3.701171875, -3.571044921875, -3.44091796875, -3.310791015625, -3.1806640625, -3.050537109375, -2.92041015625, -2.790283203125, -2.66015625, -2.530029296875, -2.39990234375, -2.269775390625, -2.1396484375, -2.009521484375, -1.87939453125, -1.749267578125, -1.619140625, -1.489013671875, -1.35888671875, -1.228759765625, -1.0986328125, -0.968505859375, -0.83837890625, -0.708251953125, -0.578125, -0.447998046875, -0.31787109375, -0.187744140625, -0.0576171875, 0.072509765625, 0.20263671875, 0.332763671875, 0.462890625, 0.593017578125, 0.72314453125, 0.853271484375, 0.9833984375, 1.113525390625, 1.24365234375, 1.373779296875, 1.50390625, 1.634033203125, 1.76416015625, 1.894287109375, 2.0244140625, 2.154541015625, 2.28466796875, 2.414794921875, 2.544921875, 2.675048828125, 2.80517578125, 2.935302734375, 3.0654296875, 3.195556640625, 3.32568359375, 3.455810546875, 3.5859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 6.0, 10.0, 9.0, 12.0, 10.0, 21.0, 17.0, 25.0, 28.0, 47.0, 43.0, 71.0, 75.0, 94.0, 111.0, 69.0, 59.0, 57.0, 39.0, 35.0, 30.0, 28.0, 16.0, 10.0, 13.0, 12.0, 11.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010356903076171875, -0.0010052770376205444, -0.0009748637676239014, -0.0009444504976272583, -0.0009140372276306152, -0.0008836239576339722, -0.0008532106876373291, -0.000822797417640686, -0.000792384147644043, -0.0007619708776473999, -0.0007315576076507568, -0.0007011443376541138, -0.0006707310676574707, -0.0006403177976608276, -0.0006099045276641846, -0.0005794912576675415, -0.0005490779876708984, -0.0005186647176742554, -0.0004882514476776123, -0.00045783817768096924, -0.00042742490768432617, -0.0003970116376876831, -0.00036659836769104004, -0.00033618509769439697, -0.0003057718276977539, -0.00027535855770111084, -0.0002449452877044678, -0.0002145320177078247, -0.00018411874771118164, -0.00015370547771453857, -0.0001232922077178955, -9.287893772125244e-05, -6.246566772460938e-05, -3.205239772796631e-05, -1.6391277313232422e-06, 2.8774142265319824e-05, 5.918741226196289e-05, 8.960068225860596e-05, 0.00012001395225524902, 0.0001504272222518921, 0.00018084049224853516, 0.00021125376224517822, 0.0002416670322418213, 0.00027208030223846436, 0.0003024935722351074, 0.0003329068422317505, 0.00036332011222839355, 0.0003937333822250366, 0.0004241466522216797, 0.00045455992221832275, 0.0004849731922149658, 0.0005153864622116089, 0.000545799732208252, 0.000576213002204895, 0.0006066262722015381, 0.0006370395421981812, 0.0006674528121948242, 0.0006978660821914673, 0.0007282793521881104, 0.0007586926221847534, 0.0007891058921813965, 0.0008195191621780396, 0.0008499324321746826, 0.0008803457021713257, 0.0009107589721679688]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 6.0, 11.0, 18.0, 30.0, 41.0, 58.0, 92.0, 133.0, 222.0, 415.0, 741.0, 1455.0, 3340.0, 9011.0, 31772.0, 145853.0, 695635.0, 119325.0, 26576.0, 7804.0, 3023.0, 1343.0, 644.0, 378.0, 233.0, 128.0, 92.0, 46.0, 40.0, 26.0, 21.0, 11.0, 11.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.142578125, -3.060821533203125, -2.97906494140625, -2.897308349609375, -2.8155517578125, -2.733795166015625, -2.65203857421875, -2.570281982421875, -2.488525390625, -2.406768798828125, -2.32501220703125, -2.243255615234375, -2.1614990234375, -2.079742431640625, -1.99798583984375, -1.916229248046875, -1.83447265625, -1.752716064453125, -1.67095947265625, -1.589202880859375, -1.5074462890625, -1.425689697265625, -1.34393310546875, -1.262176513671875, -1.180419921875, -1.098663330078125, -1.01690673828125, -0.935150146484375, -0.8533935546875, -0.771636962890625, -0.68988037109375, -0.608123779296875, -0.5263671875, -0.444610595703125, -0.36285400390625, -0.281097412109375, -0.1993408203125, -0.117584228515625, -0.03582763671875, 0.045928955078125, 0.127685546875, 0.209442138671875, 0.29119873046875, 0.372955322265625, 0.4547119140625, 0.536468505859375, 0.61822509765625, 0.699981689453125, 0.78173828125, 0.863494873046875, 0.94525146484375, 1.027008056640625, 1.1087646484375, 1.190521240234375, 1.27227783203125, 1.354034423828125, 1.435791015625, 1.517547607421875, 1.59930419921875, 1.681060791015625, 1.7628173828125, 1.844573974609375, 1.92633056640625, 2.008087158203125, 2.08984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 6.0, 8.0, 17.0, 22.0, 32.0, 20.0, 29.0, 29.0, 48.0, 45.0, 52.0, 44.0, 65.0, 57.0, 55.0, 58.0, 55.0, 54.0, 43.0, 30.0, 44.0, 35.0, 27.0, 20.0, 14.0, 6.0, 10.0, 13.0, 7.0, 5.0, 4.0, 3.0, 2.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.900390625, -1.8267822265625, -1.753173828125, -1.6795654296875, -1.60595703125, -1.5323486328125, -1.458740234375, -1.3851318359375, -1.3115234375, -1.2379150390625, -1.164306640625, -1.0906982421875, -1.01708984375, -0.9434814453125, -0.869873046875, -0.7962646484375, -0.72265625, -0.6490478515625, -0.575439453125, -0.5018310546875, -0.42822265625, -0.3546142578125, -0.281005859375, -0.2073974609375, -0.1337890625, -0.0601806640625, 0.013427734375, 0.0870361328125, 0.16064453125, 0.2342529296875, 0.307861328125, 0.3814697265625, 0.455078125, 0.5286865234375, 0.602294921875, 0.6759033203125, 0.74951171875, 0.8231201171875, 0.896728515625, 0.9703369140625, 1.0439453125, 1.1175537109375, 1.191162109375, 1.2647705078125, 1.33837890625, 1.4119873046875, 1.485595703125, 1.5592041015625, 1.6328125, 1.7064208984375, 1.780029296875, 1.8536376953125, 1.92724609375, 2.0008544921875, 2.074462890625, 2.1480712890625, 2.2216796875, 2.2952880859375, 2.368896484375, 2.4425048828125, 2.51611328125, 2.5897216796875, 2.663330078125, 2.7369384765625, 2.810546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 9.0, 12.0, 27.0, 81.0, 167.0, 429.0, 141.0, 69.0, 30.0, 21.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.93116760253906, -162.80755615234375, -158.68392944335938, -154.56031799316406, -150.43670654296875, -146.31309509277344, -142.18948364257812, -138.06585693359375, -133.94224548339844, -129.81863403320312, -125.69501495361328, -121.57139587402344, -117.44778442382812, -113.32417297363281, -109.20055389404297, -105.07693481445312, -100.95332336425781, -96.8297119140625, -92.70609283447266, -88.58247375488281, -84.4588623046875, -80.33525085449219, -76.21163177490234, -72.0880126953125, -67.96440124511719, -63.84078598022461, -59.71717071533203, -55.59355545043945, -51.469940185546875, -47.3463249206543, -43.22270965576172, -39.09909439086914, -34.97547912597656, -30.851863861083984, -26.728248596191406, -22.604633331298828, -18.48101806640625, -14.357402801513672, -10.233787536621094, -6.110172271728516, -1.9865570068359375, 2.1370582580566406, 6.260673522949219, 10.384288787841797, 14.507904052734375, 18.631519317626953, 22.75513458251953, 26.87874984741211, 31.002365112304688, 35.125980377197266, 39.249595642089844, 43.37321090698242, 47.496826171875, 51.62044143676758, 55.744056701660156, 59.867671966552734, 63.99128723144531, 68.11489868164062, 72.23851776123047, 76.36213684082031, 80.48574829101562, 84.60935974121094, 88.73297882080078, 92.85659790039062, 96.98020935058594]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 12.0, 5.0, 9.0, 17.0, 13.0, 15.0, 24.0, 23.0, 14.0, 33.0, 41.0, 42.0, 46.0, 75.0, 148.0, 108.0, 72.0, 46.0, 34.0, 18.0, 30.0, 23.0, 21.0, 28.0, 15.0, 21.0, 14.0, 6.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.50314331054688, -65.31613159179688, -63.129127502441406, -60.94211959838867, -58.75511169433594, -56.56809997558594, -54.3810920715332, -52.19408416748047, -50.007076263427734, -47.820068359375, -45.633060455322266, -43.44605255126953, -41.25904083251953, -39.07203674316406, -36.88502502441406, -34.69801712036133, -32.511009216308594, -30.32400131225586, -28.136993408203125, -25.949983596801758, -23.762975692749023, -21.57596778869629, -19.388957977294922, -17.201950073242188, -15.014942169189453, -12.827934265136719, -10.640925407409668, -8.453916549682617, -6.266908645629883, -4.079900741577148, -1.8928918838500977, 0.2941169738769531, 2.4811325073242188, 4.668140888214111, 6.855149269104004, 9.042158126831055, 11.229166030883789, 13.416173934936523, 15.603182792663574, 17.790191650390625, 19.97719955444336, 22.164207458496094, 24.351215362548828, 26.538225173950195, 28.72523307800293, 30.912240982055664, 33.09925079345703, 35.286258697509766, 37.4732666015625, 39.660274505615234, 41.84728240966797, 44.0342903137207, 46.22129821777344, 48.40830993652344, 50.59531784057617, 52.782325744628906, 54.96933364868164, 57.156341552734375, 59.34334945678711, 61.530357360839844, 63.717369079589844, 65.90437316894531, 68.09138488769531, 70.27839660644531, 72.46540069580078]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 12.0, 11.0, 17.0, 31.0, 57.0, 69.0, 88.0, 166.0, 253.0, 356.0, 655.0, 1221.0, 2088.0, 3690.0, 7954.0, 17520.0, 45971.0, 149781.0, 589963.0, 1722368.0, 1189422.0, 322196.0, 86302.0, 29615.0, 12352.0, 5611.0, 2865.0, 1556.0, 817.0, 488.0, 293.0, 177.0, 129.0, 71.0, 46.0, 32.0, 16.0, 10.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.473876953125, -5.28369140625, -5.093505859375, -4.9033203125, -4.713134765625, -4.52294921875, -4.332763671875, -4.142578125, -3.952392578125, -3.76220703125, -3.572021484375, -3.3818359375, -3.191650390625, -3.00146484375, -2.811279296875, -2.62109375, -2.430908203125, -2.24072265625, -2.050537109375, -1.8603515625, -1.670166015625, -1.47998046875, -1.289794921875, -1.099609375, -0.909423828125, -0.71923828125, -0.529052734375, -0.3388671875, -0.148681640625, 0.04150390625, 0.231689453125, 0.421875, 0.612060546875, 0.80224609375, 0.992431640625, 1.1826171875, 1.372802734375, 1.56298828125, 1.753173828125, 1.943359375, 2.133544921875, 2.32373046875, 2.513916015625, 2.7041015625, 2.894287109375, 3.08447265625, 3.274658203125, 3.46484375, 3.655029296875, 3.84521484375, 4.035400390625, 4.2255859375, 4.415771484375, 4.60595703125, 4.796142578125, 4.986328125, 5.176513671875, 5.36669921875, 5.556884765625, 5.7470703125, 5.937255859375, 6.12744140625, 6.317626953125, 6.5078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 2.0, 2.0, 1.0, 5.0, 7.0, 9.0, 14.0, 13.0, 13.0, 20.0, 23.0, 28.0, 39.0, 45.0, 36.0, 50.0, 51.0, 57.0, 55.0, 60.0, 48.0, 53.0, 45.0, 54.0, 46.0, 27.0, 25.0, 23.0, 31.0, 23.0, 25.0, 15.0, 14.0, 9.0, 9.0, 5.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.466796875, -3.331634521484375, -3.19647216796875, -3.061309814453125, -2.9261474609375, -2.790985107421875, -2.65582275390625, -2.520660400390625, -2.385498046875, -2.250335693359375, -2.11517333984375, -1.980010986328125, -1.8448486328125, -1.709686279296875, -1.57452392578125, -1.439361572265625, -1.30419921875, -1.169036865234375, -1.03387451171875, -0.898712158203125, -0.7635498046875, -0.628387451171875, -0.49322509765625, -0.358062744140625, -0.222900390625, -0.087738037109375, 0.04742431640625, 0.182586669921875, 0.3177490234375, 0.452911376953125, 0.58807373046875, 0.723236083984375, 0.8583984375, 0.993560791015625, 1.12872314453125, 1.263885498046875, 1.3990478515625, 1.534210205078125, 1.66937255859375, 1.804534912109375, 1.939697265625, 2.074859619140625, 2.21002197265625, 2.345184326171875, 2.4803466796875, 2.615509033203125, 2.75067138671875, 2.885833740234375, 3.02099609375, 3.156158447265625, 3.29132080078125, 3.426483154296875, 3.5616455078125, 3.696807861328125, 3.83197021484375, 3.967132568359375, 4.102294921875, 4.237457275390625, 4.37261962890625, 4.507781982421875, 4.6429443359375, 4.778106689453125, 4.91326904296875, 5.048431396484375, 5.18359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 8.0, 7.0, 10.0, 17.0, 22.0, 34.0, 61.0, 78.0, 124.0, 227.0, 393.0, 753.0, 1996.0, 8169.0, 147829.0, 3945303.0, 79641.0, 6319.0, 1692.0, 701.0, 337.0, 204.0, 129.0, 76.0, 41.0, 37.0, 24.0, 17.0, 12.0, 6.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.90625, -24.030029296875, -23.15380859375, -22.277587890625, -21.4013671875, -20.525146484375, -19.64892578125, -18.772705078125, -17.896484375, -17.020263671875, -16.14404296875, -15.267822265625, -14.3916015625, -13.515380859375, -12.63916015625, -11.762939453125, -10.88671875, -10.010498046875, -9.13427734375, -8.258056640625, -7.3818359375, -6.505615234375, -5.62939453125, -4.753173828125, -3.876953125, -3.000732421875, -2.12451171875, -1.248291015625, -0.3720703125, 0.504150390625, 1.38037109375, 2.256591796875, 3.1328125, 4.009033203125, 4.88525390625, 5.761474609375, 6.6376953125, 7.513916015625, 8.39013671875, 9.266357421875, 10.142578125, 11.018798828125, 11.89501953125, 12.771240234375, 13.6474609375, 14.523681640625, 15.39990234375, 16.276123046875, 17.15234375, 18.028564453125, 18.90478515625, 19.781005859375, 20.6572265625, 21.533447265625, 22.40966796875, 23.285888671875, 24.162109375, 25.038330078125, 25.91455078125, 26.790771484375, 27.6669921875, 28.543212890625, 29.41943359375, 30.295654296875, 31.171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 21.0, 15.0, 36.0, 41.0, 56.0, 88.0, 152.0, 187.0, 261.0, 460.0, 604.0, 687.0, 450.0, 339.0, 229.0, 143.0, 96.0, 53.0, 43.0, 28.0, 18.0, 17.0, 15.0, 8.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.651611328125, -16.11572265625, -15.579833984375, -15.0439453125, -14.508056640625, -13.97216796875, -13.436279296875, -12.900390625, -12.364501953125, -11.82861328125, -11.292724609375, -10.7568359375, -10.220947265625, -9.68505859375, -9.149169921875, -8.61328125, -8.077392578125, -7.54150390625, -7.005615234375, -6.4697265625, -5.933837890625, -5.39794921875, -4.862060546875, -4.326171875, -3.790283203125, -3.25439453125, -2.718505859375, -2.1826171875, -1.646728515625, -1.11083984375, -0.574951171875, -0.0390625, 0.496826171875, 1.03271484375, 1.568603515625, 2.1044921875, 2.640380859375, 3.17626953125, 3.712158203125, 4.248046875, 4.783935546875, 5.31982421875, 5.855712890625, 6.3916015625, 6.927490234375, 7.46337890625, 7.999267578125, 8.53515625, 9.071044921875, 9.60693359375, 10.142822265625, 10.6787109375, 11.214599609375, 11.75048828125, 12.286376953125, 12.822265625, 13.358154296875, 13.89404296875, 14.429931640625, 14.9658203125, 15.501708984375, 16.03759765625, 16.573486328125, 17.109375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 12.0, 25.0, 42.0, 83.0, 146.0, 197.0, 161.0, 119.0, 77.0, 49.0, 27.0, 20.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.17025756835938, -114.39874267578125, -108.62723541259766, -102.85572814941406, -97.08421325683594, -91.31269836425781, -85.54119110107422, -79.76968383789062, -73.9981689453125, -68.22665405273438, -62.45514678955078, -56.68363571166992, -50.91212463378906, -45.1406135559082, -39.369102478027344, -33.597591400146484, -27.826080322265625, -22.054569244384766, -16.283058166503906, -10.511547088623047, -4.7400360107421875, 1.0314750671386719, 6.802986145019531, 12.57449722290039, 18.34600830078125, 24.11751937866211, 29.88903045654297, 35.66054153442383, 41.43205261230469, 47.20356369018555, 52.975074768066406, 58.746585845947266, 64.51809692382812, 70.28961181640625, 76.06111907958984, 81.83262634277344, 87.60414123535156, 93.37565612792969, 99.14716339111328, 104.91867065429688, 110.690185546875, 116.46170043945312, 122.23320770263672, 128.0047149658203, 133.77622985839844, 139.54774475097656, 145.31924438476562, 151.09075927734375, 156.86227416992188, 162.6337890625, 168.40530395507812, 174.1768035888672, 179.9483184814453, 185.71983337402344, 191.4913330078125, 197.26284790039062, 203.03436279296875, 208.80587768554688, 214.577392578125, 220.34889221191406, 226.1204071044922, 231.8919219970703, 237.66342163085938, 243.4349365234375, 249.20645141601562]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 9.0, 11.0, 10.0, 9.0, 18.0, 12.0, 13.0, 21.0, 25.0, 24.0, 26.0, 38.0, 42.0, 35.0, 40.0, 47.0, 40.0, 58.0, 62.0, 54.0, 45.0, 42.0, 39.0, 32.0, 32.0, 33.0, 27.0, 19.0, 22.0, 21.0, 20.0, 13.0, 12.0, 5.0, 6.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.97482299804688, -72.59039306640625, -70.20597076416016, -67.82154083251953, -65.43711853027344, -63.05268859863281, -60.66826248168945, -58.283836364746094, -55.89940643310547, -53.51498031616211, -51.13055419921875, -48.746124267578125, -46.361698150634766, -43.977272033691406, -41.59284591674805, -39.20841979980469, -36.82399368286133, -34.43956756591797, -32.05514144897461, -29.670713424682617, -27.286285400390625, -24.901859283447266, -22.517433166503906, -20.133005142211914, -17.748579025268555, -15.364151954650879, -12.979724884033203, -10.595298767089844, -8.210871696472168, -5.826444625854492, -3.442018508911133, -1.0575904846191406, 1.3268356323242188, 3.7112624645233154, 6.095689296722412, 8.48011589050293, 10.864542961120605, 13.248970031738281, 15.63339614868164, 18.017824172973633, 20.402250289916992, 22.78667640686035, 25.171104431152344, 27.555530548095703, 29.939956665039062, 32.32438659667969, 34.70880889892578, 37.093238830566406, 39.477664947509766, 41.862091064453125, 44.246517181396484, 46.630943298339844, 49.01537322998047, 51.39979934692383, 53.78422546386719, 56.16865539550781, 58.553077697753906, 60.937503814697266, 63.321929931640625, 65.70635986328125, 68.09078216552734, 70.47521209716797, 72.85963439941406, 75.24406433105469, 77.62849426269531]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 1.0, 9.0, 13.0, 7.0, 24.0, 33.0, 56.0, 84.0, 138.0, 219.0, 381.0, 686.0, 1407.0, 2983.0, 7220.0, 21034.0, 75565.0, 458989.0, 380577.0, 67547.0, 19115.0, 6800.0, 2762.0, 1278.0, 714.0, 375.0, 196.0, 121.0, 66.0, 53.0, 25.0, 29.0, 13.0, 7.0, 10.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.25, -8.9605712890625, -8.671142578125, -8.3817138671875, -8.09228515625, -7.8028564453125, -7.513427734375, -7.2239990234375, -6.9345703125, -6.6451416015625, -6.355712890625, -6.0662841796875, -5.77685546875, -5.4874267578125, -5.197998046875, -4.9085693359375, -4.619140625, -4.3297119140625, -4.040283203125, -3.7508544921875, -3.46142578125, -3.1719970703125, -2.882568359375, -2.5931396484375, -2.3037109375, -2.0142822265625, -1.724853515625, -1.4354248046875, -1.14599609375, -0.8565673828125, -0.567138671875, -0.2777099609375, 0.01171875, 0.3011474609375, 0.590576171875, 0.8800048828125, 1.16943359375, 1.4588623046875, 1.748291015625, 2.0377197265625, 2.3271484375, 2.6165771484375, 2.906005859375, 3.1954345703125, 3.48486328125, 3.7742919921875, 4.063720703125, 4.3531494140625, 4.642578125, 4.9320068359375, 5.221435546875, 5.5108642578125, 5.80029296875, 6.0897216796875, 6.379150390625, 6.6685791015625, 6.9580078125, 7.2474365234375, 7.536865234375, 7.8262939453125, 8.11572265625, 8.4051513671875, 8.694580078125, 8.9840087890625, 9.2734375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 14.0, 16.0, 20.0, 23.0, 31.0, 32.0, 42.0, 45.0, 49.0, 81.0, 65.0, 65.0, 66.0, 57.0, 56.0, 58.0, 44.0, 46.0, 38.0, 26.0, 23.0, 22.0, 13.0, 9.0, 10.0, 6.0, 8.0, 5.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.2928466796875, -5.097412109375, -4.9019775390625, -4.70654296875, -4.5111083984375, -4.315673828125, -4.1202392578125, -3.9248046875, -3.7293701171875, -3.533935546875, -3.3385009765625, -3.14306640625, -2.9476318359375, -2.752197265625, -2.5567626953125, -2.361328125, -2.1658935546875, -1.970458984375, -1.7750244140625, -1.57958984375, -1.3841552734375, -1.188720703125, -0.9932861328125, -0.7978515625, -0.6024169921875, -0.406982421875, -0.2115478515625, -0.01611328125, 0.1793212890625, 0.374755859375, 0.5701904296875, 0.765625, 0.9610595703125, 1.156494140625, 1.3519287109375, 1.54736328125, 1.7427978515625, 1.938232421875, 2.1336669921875, 2.3291015625, 2.5245361328125, 2.719970703125, 2.9154052734375, 3.11083984375, 3.3062744140625, 3.501708984375, 3.6971435546875, 3.892578125, 4.0880126953125, 4.283447265625, 4.4788818359375, 4.67431640625, 4.8697509765625, 5.065185546875, 5.2606201171875, 5.4560546875, 5.6514892578125, 5.846923828125, 6.0423583984375, 6.23779296875, 6.4332275390625, 6.628662109375, 6.8240966796875, 7.01953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 14.0, 6.0, 8.0, 10.0, 14.0, 25.0, 31.0, 46.0, 92.0, 100.0, 169.0, 268.0, 497.0, 999.0, 2582.0, 10755.0, 80605.0, 894279.0, 46738.0, 7340.0, 2042.0, 823.0, 391.0, 246.0, 135.0, 99.0, 56.0, 31.0, 39.0, 20.0, 23.0, 11.0, 21.0, 7.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.4296875, -12.97265625, -12.515625, -12.05859375, -11.6015625, -11.14453125, -10.6875, -10.23046875, -9.7734375, -9.31640625, -8.859375, -8.40234375, -7.9453125, -7.48828125, -7.03125, -6.57421875, -6.1171875, -5.66015625, -5.203125, -4.74609375, -4.2890625, -3.83203125, -3.375, -2.91796875, -2.4609375, -2.00390625, -1.546875, -1.08984375, -0.6328125, -0.17578125, 0.28125, 0.73828125, 1.1953125, 1.65234375, 2.109375, 2.56640625, 3.0234375, 3.48046875, 3.9375, 4.39453125, 4.8515625, 5.30859375, 5.765625, 6.22265625, 6.6796875, 7.13671875, 7.59375, 8.05078125, 8.5078125, 8.96484375, 9.421875, 9.87890625, 10.3359375, 10.79296875, 11.25, 11.70703125, 12.1640625, 12.62109375, 13.078125, 13.53515625, 13.9921875, 14.44921875, 14.90625, 15.36328125, 15.8203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 4.0, 5.0, 1.0, 7.0, 12.0, 5.0, 11.0, 19.0, 24.0, 12.0, 19.0, 34.0, 29.0, 35.0, 35.0, 49.0, 64.0, 94.0, 77.0, 87.0, 69.0, 58.0, 52.0, 35.0, 31.0, 25.0, 18.0, 13.0, 13.0, 10.0, 9.0, 10.0, 9.0, 8.0, 5.0, 3.0, 6.0, 4.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.605224609375, -17.81982421875, -17.034423828125, -16.2490234375, -15.463623046875, -14.67822265625, -13.892822265625, -13.107421875, -12.322021484375, -11.53662109375, -10.751220703125, -9.9658203125, -9.180419921875, -8.39501953125, -7.609619140625, -6.82421875, -6.038818359375, -5.25341796875, -4.468017578125, -3.6826171875, -2.897216796875, -2.11181640625, -1.326416015625, -0.541015625, 0.244384765625, 1.02978515625, 1.815185546875, 2.6005859375, 3.385986328125, 4.17138671875, 4.956787109375, 5.7421875, 6.527587890625, 7.31298828125, 8.098388671875, 8.8837890625, 9.669189453125, 10.45458984375, 11.239990234375, 12.025390625, 12.810791015625, 13.59619140625, 14.381591796875, 15.1669921875, 15.952392578125, 16.73779296875, 17.523193359375, 18.30859375, 19.093994140625, 19.87939453125, 20.664794921875, 21.4501953125, 22.235595703125, 23.02099609375, 23.806396484375, 24.591796875, 25.377197265625, 26.16259765625, 26.947998046875, 27.7333984375, 28.518798828125, 29.30419921875, 30.089599609375, 30.875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 8.0, 15.0, 8.0, 14.0, 20.0, 29.0, 49.0, 73.0, 116.0, 231.0, 533.0, 1491.0, 5816.0, 41773.0, 939004.0, 49928.0, 6628.0, 1613.0, 558.0, 268.0, 130.0, 77.0, 31.0, 27.0, 21.0, 22.0, 15.0, 12.0, 7.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.640625, -4.49798583984375, -4.3553466796875, -4.21270751953125, -4.070068359375, -3.92742919921875, -3.7847900390625, -3.64215087890625, -3.49951171875, -3.35687255859375, -3.2142333984375, -3.07159423828125, -2.928955078125, -2.78631591796875, -2.6436767578125, -2.50103759765625, -2.3583984375, -2.21575927734375, -2.0731201171875, -1.93048095703125, -1.787841796875, -1.64520263671875, -1.5025634765625, -1.35992431640625, -1.21728515625, -1.07464599609375, -0.9320068359375, -0.78936767578125, -0.646728515625, -0.50408935546875, -0.3614501953125, -0.21881103515625, -0.076171875, 0.06646728515625, 0.2091064453125, 0.35174560546875, 0.494384765625, 0.63702392578125, 0.7796630859375, 0.92230224609375, 1.06494140625, 1.20758056640625, 1.3502197265625, 1.49285888671875, 1.635498046875, 1.77813720703125, 1.9207763671875, 2.06341552734375, 2.2060546875, 2.34869384765625, 2.4913330078125, 2.63397216796875, 2.776611328125, 2.91925048828125, 3.0618896484375, 3.20452880859375, 3.34716796875, 3.48980712890625, 3.6324462890625, 3.77508544921875, 3.917724609375, 4.06036376953125, 4.2030029296875, 4.34564208984375, 4.48828125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 1.0, 2.0, 3.0, 8.0, 10.0, 14.0, 22.0, 20.0, 38.0, 77.0, 184.0, 236.0, 171.0, 67.0, 39.0, 28.0, 11.0, 9.0, 7.0, 6.0, 10.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001789093017578125, -0.001733824610710144, -0.001678556203842163, -0.0016232877969741821, -0.0015680193901062012, -0.0015127509832382202, -0.0014574825763702393, -0.0014022141695022583, -0.0013469457626342773, -0.0012916773557662964, -0.0012364089488983154, -0.0011811405420303345, -0.0011258721351623535, -0.0010706037282943726, -0.0010153353214263916, -0.0009600669145584106, -0.0009047985076904297, -0.0008495301008224487, -0.0007942616939544678, -0.0007389932870864868, -0.0006837248802185059, -0.0006284564733505249, -0.0005731880664825439, -0.000517919659614563, -0.00046265125274658203, -0.0004073828458786011, -0.0003521144390106201, -0.00029684603214263916, -0.0002415776252746582, -0.00018630921840667725, -0.0001310408115386963, -7.577240467071533e-05, -2.0503997802734375e-05, 3.476440906524658e-05, 9.003281593322754e-05, 0.0001453012228012085, 0.00020056962966918945, 0.0002558380365371704, 0.00031110644340515137, 0.0003663748502731323, 0.0004216432571411133, 0.00047691166400909424, 0.0005321800708770752, 0.0005874484777450562, 0.0006427168846130371, 0.0006979852914810181, 0.000753253698348999, 0.00080852210521698, 0.0008637905120849609, 0.0009190589189529419, 0.0009743273258209229, 0.0010295957326889038, 0.0010848641395568848, 0.0011401325464248657, 0.0011954009532928467, 0.0012506693601608276, 0.0013059377670288086, 0.0013612061738967896, 0.0014164745807647705, 0.0014717429876327515, 0.0015270113945007324, 0.0015822798013687134, 0.0016375482082366943, 0.0016928166151046753, 0.0017480850219726562]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 5.0, 12.0, 17.0, 29.0, 51.0, 83.0, 141.0, 279.0, 650.0, 1804.0, 5975.0, 29717.0, 881540.0, 110411.0, 12602.0, 3244.0, 1092.0, 453.0, 203.0, 96.0, 49.0, 28.0, 14.0, 15.0, 5.0, 10.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.376556396484375, -3.26678466796875, -3.157012939453125, -3.0472412109375, -2.937469482421875, -2.82769775390625, -2.717926025390625, -2.608154296875, -2.498382568359375, -2.38861083984375, -2.278839111328125, -2.1690673828125, -2.059295654296875, -1.94952392578125, -1.839752197265625, -1.72998046875, -1.620208740234375, -1.51043701171875, -1.400665283203125, -1.2908935546875, -1.181121826171875, -1.07135009765625, -0.961578369140625, -0.851806640625, -0.742034912109375, -0.63226318359375, -0.522491455078125, -0.4127197265625, -0.302947998046875, -0.19317626953125, -0.083404541015625, 0.0263671875, 0.136138916015625, 0.24591064453125, 0.355682373046875, 0.4654541015625, 0.575225830078125, 0.68499755859375, 0.794769287109375, 0.904541015625, 1.014312744140625, 1.12408447265625, 1.233856201171875, 1.3436279296875, 1.453399658203125, 1.56317138671875, 1.672943115234375, 1.78271484375, 1.892486572265625, 2.00225830078125, 2.112030029296875, 2.2218017578125, 2.331573486328125, 2.44134521484375, 2.551116943359375, 2.660888671875, 2.770660400390625, 2.88043212890625, 2.990203857421875, 3.0999755859375, 3.209747314453125, 3.31951904296875, 3.429290771484375, 3.5390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 12.0, 8.0, 11.0, 9.0, 13.0, 23.0, 16.0, 32.0, 43.0, 75.0, 101.0, 115.0, 116.0, 111.0, 77.0, 75.0, 39.0, 24.0, 19.0, 19.0, 11.0, 8.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.57421875, -2.488616943359375, -2.40301513671875, -2.317413330078125, -2.2318115234375, -2.146209716796875, -2.06060791015625, -1.975006103515625, -1.889404296875, -1.803802490234375, -1.71820068359375, -1.632598876953125, -1.5469970703125, -1.461395263671875, -1.37579345703125, -1.290191650390625, -1.20458984375, -1.118988037109375, -1.03338623046875, -0.947784423828125, -0.8621826171875, -0.776580810546875, -0.69097900390625, -0.605377197265625, -0.519775390625, -0.434173583984375, -0.34857177734375, -0.262969970703125, -0.1773681640625, -0.091766357421875, -0.00616455078125, 0.079437255859375, 0.1650390625, 0.250640869140625, 0.33624267578125, 0.421844482421875, 0.5074462890625, 0.593048095703125, 0.67864990234375, 0.764251708984375, 0.849853515625, 0.935455322265625, 1.02105712890625, 1.106658935546875, 1.1922607421875, 1.277862548828125, 1.36346435546875, 1.449066162109375, 1.53466796875, 1.620269775390625, 1.70587158203125, 1.791473388671875, 1.8770751953125, 1.962677001953125, 2.04827880859375, 2.133880615234375, 2.219482421875, 2.305084228515625, 2.39068603515625, 2.476287841796875, 2.5618896484375, 2.647491455078125, 2.73309326171875, 2.818695068359375, 2.904296875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 10.0, 13.0, 23.0, 35.0, 69.0, 190.0, 460.0, 93.0, 43.0, 26.0, 15.0, 10.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.88695526123047, -85.36268615722656, -81.83840942382812, -78.31414031982422, -74.78987121582031, -71.2656021118164, -67.7413330078125, -64.21705627441406, -60.692787170410156, -57.16851806640625, -53.64424514770508, -50.119972229003906, -46.595703125, -43.071434020996094, -39.54716110229492, -36.02288818359375, -32.498619079589844, -28.974348068237305, -25.450077056884766, -21.925806045532227, -18.401535034179688, -14.877264022827148, -11.35299301147461, -7.82872200012207, -4.304450988769531, -0.7801799774169922, 2.744091033935547, 6.268362045288086, 9.792633056640625, 13.316904067993164, 16.841175079345703, 20.365446090698242, 23.889724731445312, 27.41399574279785, 30.93826675415039, 34.46253967285156, 37.98680877685547, 41.511077880859375, 45.03535079956055, 48.55962371826172, 52.083892822265625, 55.60816192626953, 59.1324348449707, 62.656707763671875, 66.18097686767578, 69.70524597167969, 73.22952270507812, 76.75379180908203, 80.27806091308594, 83.80233001708984, 87.32659912109375, 90.85087585449219, 94.3751449584961, 97.8994140625, 101.42369079589844, 104.94795989990234, 108.47222900390625, 111.99649810791016, 115.52076721191406, 119.0450439453125, 122.5693130493164, 126.09358215332031, 129.61785888671875, 133.14212036132812, 136.66639709472656]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 5.0, 9.0, 11.0, 7.0, 22.0, 15.0, 26.0, 18.0, 19.0, 17.0, 19.0, 30.0, 77.0, 193.0, 208.0, 69.0, 24.0, 32.0, 27.0, 23.0, 21.0, 10.0, 18.0, 11.0, 13.0, 12.0, 12.0, 4.0, 3.0, 6.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.78363800048828, -51.8643684387207, -49.945098876953125, -48.02582550048828, -46.1065559387207, -44.187286376953125, -42.26801681518555, -40.34874725341797, -38.429473876953125, -36.51020431518555, -34.59093475341797, -32.671661376953125, -30.752391815185547, -28.83312225341797, -26.91385269165039, -24.994583129882812, -23.075313568115234, -21.156044006347656, -19.236772537231445, -17.317502975463867, -15.398232460021973, -13.478961944580078, -11.5596923828125, -9.640421867370605, -7.721151351928711, -5.801880836486816, -3.88261079788208, -1.9633407592773438, -0.04407024383544922, 1.8752002716064453, 3.7944698333740234, 5.713740348815918, 7.6330108642578125, 9.552281379699707, 11.471551895141602, 13.39082145690918, 15.310091972351074, 17.22936248779297, 19.148632049560547, 21.067901611328125, 22.987173080444336, 24.906442642211914, 26.825714111328125, 28.744983673095703, 30.66425323486328, 32.583526611328125, 34.50279235839844, 36.42206573486328, 38.34133529663086, 40.26060485839844, 42.179874420166016, 44.099143981933594, 46.01841735839844, 47.937686920166016, 49.856956481933594, 51.77622604370117, 53.69549560546875, 55.61476516723633, 57.534034729003906, 59.45330810546875, 61.37257766723633, 63.291847229003906, 65.21112060546875, 67.13038635253906, 69.0496597290039]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 8.0, 5.0, 9.0, 17.0, 13.0, 21.0, 15.0, 19.0, 30.0, 37.0, 46.0, 49.0, 91.0, 295.0, 89.0, 34.0, 28.0, 43.0, 37.0, 21.0, 18.0, 16.0, 14.0, 12.0, 7.0, 7.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5234375, -7.322509765625, -7.12158203125, -6.920654296875, -6.7197265625, -6.518798828125, -6.31787109375, -6.116943359375, -5.916015625, -5.715087890625, -5.51416015625, -5.313232421875, -5.1123046875, -4.911376953125, -4.71044921875, -4.509521484375, -4.30859375, -4.107666015625, -3.90673828125, -3.705810546875, -3.5048828125, -3.303955078125, -3.10302734375, -2.902099609375, -2.701171875, -2.500244140625, -2.29931640625, -2.098388671875, -1.8974609375, -1.696533203125, -1.49560546875, -1.294677734375, -1.09375, -0.892822265625, -0.69189453125, -0.490966796875, -0.2900390625, -0.089111328125, 0.11181640625, 0.312744140625, 0.513671875, 0.714599609375, 0.91552734375, 1.116455078125, 1.3173828125, 1.518310546875, 1.71923828125, 1.920166015625, 2.12109375, 2.322021484375, 2.52294921875, 2.723876953125, 2.9248046875, 3.125732421875, 3.32666015625, 3.527587890625, 3.728515625, 3.929443359375, 4.13037109375, 4.331298828125, 4.5322265625, 4.733154296875, 4.93408203125, 5.135009765625, 5.3359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 11.0, 10.0, 31.0, 38.0, 38.0, 61.0, 114.0, 198.0, 382.0, 887.0, 2214.0, 7309.0, 156293.0, 8206714.0, 9692.0, 2615.0, 995.0, 419.0, 208.0, 114.0, 73.0, 40.0, 29.0, 24.0, 14.0, 19.0, 7.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.53217697143555, -44.1966552734375, -42.86112976074219, -41.52560806274414, -40.19008255004883, -38.85456085205078, -37.51903533935547, -36.18351364135742, -34.847991943359375, -33.51247024536133, -32.176944732666016, -30.84142303466797, -29.505897521972656, -28.17037582397461, -26.83485221862793, -25.49932861328125, -24.163803100585938, -22.828279495239258, -21.492755889892578, -20.15723419189453, -18.82170867919922, -17.486186981201172, -16.150663375854492, -14.815139770507812, -13.479616165161133, -12.144092559814453, -10.808568954467773, -9.47304630279541, -8.13752269744873, -6.801999092102051, -5.4664764404296875, -4.130952835083008, -2.795429229736328, -1.4599058628082275, -0.12438249588012695, 1.2111406326293945, 2.546664237976074, 3.882187843322754, 5.217710494995117, 6.553234100341797, 7.888757705688477, 9.224281311035156, 10.559804916381836, 11.8953275680542, 13.230851173400879, 14.566374778747559, 15.901897430419922, 17.2374210357666, 18.57294464111328, 19.90846824645996, 21.24399185180664, 22.579513549804688, 23.9150390625, 25.250560760498047, 26.586084365844727, 27.921607971191406, 29.257131576538086, 30.592655181884766, 31.928178787231445, 33.263702392578125, 34.59922409057617, 35.934749603271484, 37.27027130126953, 38.605796813964844, 39.94131851196289]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 4.0, 7.0, 3.0, 4.0, 3.0, 1.0, 9.0, 3.0, 1.0, 3.0, 10.0, 4.0, 6.0, 5.0, 0.0, 3.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.83613204956055, -38.578125, -37.32012176513672, -36.06211853027344, -34.80411148071289, -33.546104431152344, -32.28810119628906, -31.03009605407715, -29.772090911865234, -28.51408576965332, -27.256080627441406, -25.998075485229492, -24.740070343017578, -23.482065200805664, -22.22406005859375, -20.966054916381836, -19.708049774169922, -18.450044631958008, -17.192039489746094, -15.93403434753418, -14.676029205322266, -13.418024063110352, -12.160018920898438, -10.902013778686523, -9.64400863647461, -8.386003494262695, -7.127998352050781, -5.869993209838867, -4.611988067626953, -3.353982925415039, -2.095977783203125, -0.8379726409912109, 0.4200286865234375, 1.6780338287353516, 2.9360389709472656, 4.19404411315918, 5.452049255371094, 6.710054397583008, 7.968059539794922, 9.226064682006836, 10.48406982421875, 11.742074966430664, 13.000080108642578, 14.258085250854492, 15.516090393066406, 16.77409553527832, 18.032100677490234, 19.29010581970215, 20.548110961914062, 21.806116104125977, 23.06412124633789, 24.322126388549805, 25.58013153076172, 26.838136672973633, 28.096141815185547, 29.35414695739746, 30.612152099609375, 31.87015724182129, 33.1281623840332, 34.38616943359375, 35.64417266845703, 36.90217590332031, 38.16018295288086, 39.418190002441406, 40.67619323730469]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 10.0, 5.0, 12.0, 23.0, 31.0, 48.0, 103.0, 168.0, 292.0, 689.0, 1664.0, 5980.0, 28577.0, 168325.0, 257577.0, 47278.0, 9516.0, 2355.0, 795.0, 363.0, 190.0, 125.0, 54.0, 39.0, 21.0, 12.0, 7.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.75, -81.49560546875, -79.2412109375, -76.98681640625, -74.732421875, -72.47802734375, -70.2236328125, -67.96923828125, -65.71484375, -63.46044921875, -61.2060546875, -58.95166015625, -56.697265625, -54.44287109375, -52.1884765625, -49.93408203125, -47.6796875, -45.42529296875, -43.1708984375, -40.91650390625, -38.662109375, -36.40771484375, -34.1533203125, -31.89892578125, -29.64453125, -27.39013671875, -25.1357421875, -22.88134765625, -20.626953125, -18.37255859375, -16.1181640625, -13.86376953125, -11.609375, -9.35498046875, -7.1005859375, -4.84619140625, -2.591796875, -0.33740234375, 1.9169921875, 4.17138671875, 6.42578125, 8.68017578125, 10.9345703125, 13.18896484375, 15.443359375, 17.69775390625, 19.9521484375, 22.20654296875, 24.4609375, 26.71533203125, 28.9697265625, 31.22412109375, 33.478515625, 35.73291015625, 37.9873046875, 40.24169921875, 42.49609375, 44.75048828125, 47.0048828125, 49.25927734375, 51.513671875, 53.76806640625, 56.0224609375, 58.27685546875, 60.53125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 6.0, 8.0, 8.0, 11.0, 9.0, 22.0, 19.0, 19.0, 29.0, 33.0, 40.0, 52.0, 71.0, 52.0, 62.0, 74.0, 55.0, 78.0, 63.0, 52.0, 47.0, 35.0, 30.0, 32.0, 18.0, 27.0, 7.0, 11.0, 6.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5234375, -6.3355712890625, -6.147705078125, -5.9598388671875, -5.77197265625, -5.5841064453125, -5.396240234375, -5.2083740234375, -5.0205078125, -4.8326416015625, -4.644775390625, -4.4569091796875, -4.26904296875, -4.0811767578125, -3.893310546875, -3.7054443359375, -3.517578125, -3.3297119140625, -3.141845703125, -2.9539794921875, -2.76611328125, -2.5782470703125, -2.390380859375, -2.2025146484375, -2.0146484375, -1.8267822265625, -1.638916015625, -1.4510498046875, -1.26318359375, -1.0753173828125, -0.887451171875, -0.6995849609375, -0.51171875, -0.3238525390625, -0.135986328125, 0.0518798828125, 0.23974609375, 0.4276123046875, 0.615478515625, 0.8033447265625, 0.9912109375, 1.1790771484375, 1.366943359375, 1.5548095703125, 1.74267578125, 1.9305419921875, 2.118408203125, 2.3062744140625, 2.494140625, 2.6820068359375, 2.869873046875, 3.0577392578125, 3.24560546875, 3.4334716796875, 3.621337890625, 3.8092041015625, 3.9970703125, 4.1849365234375, 4.372802734375, 4.5606689453125, 4.74853515625, 4.9364013671875, 5.124267578125, 5.3121337890625, 5.5]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 8.0, 8.0, 18.0, 31.0, 88.0, 146.0, 108.0, 36.0, 19.0, 13.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.5690689086914, -121.64833068847656, -118.72760009765625, -115.80686950683594, -112.8861312866211, -109.96539306640625, -107.04466247558594, -104.12393188476562, -101.20319366455078, -98.28245544433594, -95.36172485351562, -92.44099426269531, -89.52025604248047, -86.59951782226562, -83.67878723144531, -80.758056640625, -77.83731842041016, -74.91658020019531, -71.995849609375, -69.07511901855469, -66.15438079833984, -63.233646392822266, -60.31291198730469, -57.39217758178711, -54.47144317626953, -51.55070877075195, -48.629974365234375, -45.7092399597168, -42.78850555419922, -39.86777114868164, -36.94703674316406, -34.026302337646484, -31.105560302734375, -28.184825897216797, -25.26409149169922, -22.34335708618164, -19.422622680664062, -16.501888275146484, -13.581153869628906, -10.660419464111328, -7.73968505859375, -4.818950653076172, -1.8982162475585938, 1.0225181579589844, 3.9432525634765625, 6.863986968994141, 9.784721374511719, 12.705455780029297, 15.626190185546875, 18.546924591064453, 21.46765899658203, 24.38839340209961, 27.309127807617188, 30.229862213134766, 33.150596618652344, 36.07133102416992, 38.9920654296875, 41.91279983520508, 44.833534240722656, 47.754268646240234, 50.67500305175781, 53.59573745727539, 56.51647186279297, 59.43720626831055, 62.357940673828125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 11.0, 6.0, 10.0, 34.0, 48.0, 70.0, 78.0, 64.0, 51.0, 24.0, 14.0, 11.0, 7.0, 9.0, 3.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.507526397705078, -27.567724227905273, -26.62792205810547, -25.688119888305664, -24.74831771850586, -23.808517456054688, -22.86871337890625, -21.928913116455078, -20.989110946655273, -20.04930877685547, -19.109506607055664, -18.16970443725586, -17.229902267456055, -16.29010009765625, -15.350298881530762, -14.410497665405273, -13.470694541931152, -12.530892372131348, -11.591090202331543, -10.651288986206055, -9.71148681640625, -8.771684646606445, -7.831882476806641, -6.892080783843994, -5.9522786140441895, -5.012476444244385, -4.072674751281738, -3.1328725814819336, -2.193070650100708, -1.2532687187194824, -0.31346654891967773, 0.6263351440429688, 1.5661373138427734, 2.505939245223999, 3.4457411766052246, 4.385543346405029, 5.325345039367676, 6.2651472091674805, 7.204949378967285, 8.144750595092773, 9.084552764892578, 10.024354934692383, 10.964157104492188, 11.903959274291992, 12.84376049041748, 13.783562660217285, 14.72336483001709, 15.663166046142578, 16.602970123291016, 17.54277229309082, 18.482574462890625, 19.42237663269043, 20.362178802490234, 21.301979064941406, 22.241783142089844, 23.181583404541016, 24.12138557434082, 25.061187744140625, 26.00098991394043, 26.940792083740234, 27.88059425354004, 28.820396423339844, 29.760196685791016, 30.69999885559082, 31.639801025390625]}, "_wandb": {"runtime": 4156}}